Merge branch 'main' of https://huggingface.co/THUDM/glm-4-9b-chat
Changed files:
- LICENSE +1 -1
- README.md +7 -7
- modeling_chatglm.py +2 -2
- tokenization_chatglm.py +4 -4
LICENSE CHANGED
@@ -45,7 +45,7 @@ The glm-4-9b License
 
 2. License
 
-
+Under the terms and conditions of this license, the Licensor hereby grants you a non-exclusive, worldwide, non-transferable, non-sublicensable, revocable, royalty-free copyright license.
 This license allows you to use all open source models in this repository for free for academic research. For users who wish to use the models for commercial purposes, please do so [here](https://open.bigmodel.cn/mla/form)
 Complete registration. Registered users are free to use this model for commercial activities, but must comply with all terms and conditions of this license.
 The copyright notice and this license notice shall be included in all copies or substantial portions of the Software.
README.md CHANGED
@@ -2,15 +2,15 @@
 license: other
 license_name: glm-4
 license_link: https://huggingface.co/THUDM/glm-4-9b-chat/blob/main/LICENSE
-
 language:
-
-
+- zh
+- en
 tags:
-
-
-
+- glm
+- chatglm
+- thudm
 inference: false
+pipeline_tag: text-generation
 ---
 
 # GLM-4-9B-Chat
@@ -168,4 +168,4 @@ Use of the GLM-4 model weights must comply with the [LICENSE](LICENSE).
 pages={320--335},
 year={2022}
 }
-```
+```
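The added `pipeline_tag: text-generation` is what tells the Hub to classify this repo under the text-generation task. A minimal smoke test of that pairing (a sketch, assuming a `transformers` install recent enough for remote code; prompt and generation arguments are illustrative):

```python
# Sketch: load the repo through the task named by pipeline_tag.
# trust_remote_code=True is required because modeling_chatglm.py and
# tokenization_chatglm.py (patched below) live in the repo itself.
from transformers import pipeline

pipe = pipeline("text-generation", model="THUDM/glm-4-9b-chat", trust_remote_code=True)
print(pipe("你好", max_new_tokens=32)[0]["generated_text"])
```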
modeling_chatglm.py CHANGED
@@ -21,7 +21,7 @@ from transformers.modeling_outputs import (
     SequenceClassifierOutputWithPast,
 )
 from transformers.modeling_utils import PreTrainedModel
-from transformers.utils import logging
+from transformers.utils import logging, is_torch_npu_available
 from transformers.generation.logits_process import LogitsProcessor
 from transformers.generation.utils import LogitsProcessorList, StoppingCriteriaList, GenerationConfig, ModelOutput
 
@@ -29,7 +29,7 @@ from .configuration_chatglm import ChatGLMConfig
 
 # flags required to enable jit fusion kernels
 
-if sys.platform != 'darwin':
+if sys.platform != 'darwin' and not is_torch_npu_available():
     torch._C._jit_set_profiling_mode(False)
     torch._C._jit_set_profiling_executor(False)
     torch._C._jit_override_can_fuse_on_cpu(True)
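The second hunk gates the TorchScript tuning behind an NPU check: the `torch._C` calls are private CPU/GPU JIT fusion switches, and skipping them on Ascend NPU builds (as was already done on macOS) presumably avoids touching a JIT path that backend does not support. A standalone sketch of the same guard (`is_torch_npu_available` assumes a recent `transformers`; the flag calls are copied from the hunk):

```python
import sys

import torch
from transformers.utils import is_torch_npu_available

# Only touch the private TorchScript knobs on platforms where the fused
# kernels are actually used: not macOS, and not an Ascend NPU build.
if sys.platform != 'darwin' and not is_torch_npu_available():
    torch._C._jit_set_profiling_mode(False)      # use the legacy executor
    torch._C._jit_set_profiling_executor(False)
    torch._C._jit_override_can_fuse_on_cpu(True) # allow CPU fusion groups
else:
    print(f"leaving JIT fusion flags at their defaults on {sys.platform}")
```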
tokenization_chatglm.py CHANGED
@@ -63,22 +63,22 @@ class ChatGLM4Tokenizer(PreTrainedTokenizer):
         vocab.update(self.added_tokens_encoder)
         return vocab
 
-    def convert_tokens_to_string(self, tokens: List[Union[bytes, str]]) -> str:
+    def convert_tokens_to_string(self, tokens: List[Union[bytes, str, int]]) -> str:
         """
         Converts a sequence of tokens in a single string.
         """
         text = ""
         temp = b""
         for t in tokens:
+            if isinstance(t, int):
+                t = chr(t)
             if isinstance(t, str):
                 if temp:
                     text += temp.decode("utf-8", errors="replace")
-                    temp = b""
-                text += t
             elif isinstance(t, bytes):
                 temp += t
             else:
-                raise TypeError("token should only be of type bytes or str")
+                raise TypeError("token should only be of type int, bytes or str")
         if temp:
             text += temp.decode("utf-8", errors="replace")
         return text
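The net effect: `convert_tokens_to_string` now accepts bare integer tokens by mapping them through `chr()` before the usual str/bytes handling. Below is a self-contained sketch of that decoding idea (a hypothetical helper, not the upstream class; it also keeps the byte-buffer reset and the `text += t` append from the pre-merge version, so mixed inputs round-trip):

```python
from typing import List, Union

def tokens_to_string(tokens: List[Union[bytes, str, int]]) -> str:
    """Decode a mix of int code points, str pieces, and raw UTF-8 bytes."""
    text = ""
    temp = b""  # buffers byte tokens until a str/int token or end of input
    for t in tokens:
        if isinstance(t, int):
            t = chr(t)  # ints are treated as Unicode code points
        if isinstance(t, str):
            if temp:
                text += temp.decode("utf-8", errors="replace")
                temp = b""
            text += t
        elif isinstance(t, bytes):
            temp += t
        else:
            raise TypeError("token should only be of type int, bytes or str")
    if temp:
        text += temp.decode("utf-8", errors="replace")
    return text

# 72 -> 'H'; the byte tokens concatenate to the UTF-8 encoding of " 你好".
print(tokens_to_string([72, "i", b" ", b"\xe4\xbd\xa0", b"\xe5\xa5\xbd"]))  # Hi 你好
```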