Merge main

Browse files

Files changed (4) hide show

LICENSE +1 -1
README.md +7 -7
modeling_chatglm.py +3 -3
tokenization_chatglm.py +77 -91

LICENSE CHANGED Viewed

@@ -45,7 +45,7 @@ The glm-4-9b License
 2. License
-Subject to the terms and conditions of this License, Licensor hereby grants you a non-exclusive, worldwide, irrevocable, non-sublicensable, revocable, photo-free copyright license.
 This license allows you to use all open source models in this repository for free for academic research. For users who wish to use the models for commercial purposes, please do so [here](https://open.bigmodel.cn/mla/form)
 Complete registration. Registered users are free to use this model for commercial activities, but must comply with all terms and conditions of this license.
 The copyright notice and this license notice shall be included in all copies or substantial portions of the Software.

 2. License
+Under the terms and conditions of this license, the Licensor hereby grants you a non-exclusive, worldwide, non-transferable, non-sublicensable, revocable, royalty-free copyright license.
 This license allows you to use all open source models in this repository for free for academic research. For users who wish to use the models for commercial purposes, please do so [here](https://open.bigmodel.cn/mla/form)
 Complete registration. Registered users are free to use this model for commercial activities, but must comply with all terms and conditions of this license.
 The copyright notice and this license notice shall be included in all copies or substantial portions of the Software.

README.md CHANGED Viewed

@@ -2,15 +2,15 @@
 license: other
 license_name: glm-4
 license_link: https://huggingface.co/THUDM/glm-4-9b-chat/blob/main/LICENSE
 language:
-  - zh
-  - en
 tags:
-  - glm
-  - chatglm
-  - thudm
 inference: false
 ---
 # GLM-4-9B-Chat
@@ -168,4 +168,4 @@ GLM-4 模型的权重的使用则需要遵循 [LICENSE](LICENSE)。
   pages={320--335},
   year={2022}
 }
-```

 license: other
 license_name: glm-4
 license_link: https://huggingface.co/THUDM/glm-4-9b-chat/blob/main/LICENSE
 language:
+- zh
+- en
 tags:
+- glm
+- chatglm
+- thudm
 inference: false
+pipeline_tag: text-generation
 ---
 # GLM-4-9B-Chat
   pages={320--335},
   year={2022}
 }
+```

modeling_chatglm.py CHANGED Viewed

@@ -21,7 +21,7 @@ from transformers.modeling_outputs import (
     SequenceClassifierOutputWithPast,
 )
 from transformers.modeling_utils import PreTrainedModel
-from transformers.utils import logging
 from transformers.generation.logits_process import LogitsProcessor
 from transformers.generation.utils import LogitsProcessorList, StoppingCriteriaList, GenerationConfig, ModelOutput
@@ -29,7 +29,7 @@ from .configuration_chatglm import ChatGLMConfig
 # flags required to enable jit fusion kernels
-if sys.platform != 'darwin':
     torch._C._jit_set_profiling_mode(False)
     torch._C._jit_set_profiling_executor(False)
     torch._C._jit_override_can_fuse_on_cpu(True)
@@ -1139,7 +1139,7 @@ class ChatGLMForSequenceClassification(ChatGLMPreTrainedModel):
         self.num_labels = config.num_labels
         self.transformer = ChatGLMModel(config, empty_init=empty_init, device=device)
-        self.classifier_head = nn.Linear(config.hidden_size, config.num_labels, bias=True, dtype=torch.half)
         if config.classifier_dropout is not None:
             self.dropout = nn.Dropout(config.classifier_dropout)
         else:

     SequenceClassifierOutputWithPast,
 )
 from transformers.modeling_utils import PreTrainedModel
+from transformers.utils import logging, is_torch_npu_available
 from transformers.generation.logits_process import LogitsProcessor
 from transformers.generation.utils import LogitsProcessorList, StoppingCriteriaList, GenerationConfig, ModelOutput
 # flags required to enable jit fusion kernels
+if sys.platform != 'darwin' and not is_torch_npu_available():
     torch._C._jit_set_profiling_mode(False)
     torch._C._jit_set_profiling_executor(False)
     torch._C._jit_override_can_fuse_on_cpu(True)
         self.num_labels = config.num_labels
         self.transformer = ChatGLMModel(config, empty_init=empty_init, device=device)
+        self.classifier_head = nn.Linear(config.hidden_size, config.num_labels, bias=True, dtype=config.torch_dtype)
         if config.classifier_dropout is not None:
             self.dropout = nn.Dropout(config.classifier_dropout)
         else:

tokenization_chatglm.py CHANGED Viewed

@@ -130,6 +130,8 @@ class ChatGLM4Tokenizer(PreTrainedTokenizer):
         prefix_tokens = [self.convert_tokens_to_ids("[gMASK]"), self.convert_tokens_to_ids("<sop>")]
         return prefix_tokens
     def build_single_message(self, role, metadata, message, tokenize=True):
         assert role in ["system", "user", "assistant", "observation"], role
         if tokenize:
@@ -142,97 +144,81 @@ class ChatGLM4Tokenizer(PreTrainedTokenizer):
             return str(f"<|{role}|>{metadata}\n{message}")
-    # def apply_chat_template(
-    #         self,
-    #         conversation: Union[List[Dict[str, str]], List[List[Dict[str, str]]], "Conversation"],
-    #         add_generation_prompt: bool = False,
-    #         tokenize: bool = True,
-    #         padding: bool = False,
-    #         truncation: bool = False,
-    #         max_length: Optional[int] = None,
-    #         return_tensors: Optional[Union[str, TensorType]] = None,
-    #         return_dict: bool = False,
-    #         tokenizer_kwargs: Optional[Dict[str, Any]] = None,
-    #         add_special_tokens: bool = True,
-    #         **kwargs,
-    # ) -> Union[str, List[int], List[str], List[List[int]], BatchEncoding]:
-    #     if return_dict and not tokenize:
-    #         raise ValueError(
-    #             "`return_dict=True` is incompatible with `tokenize=False`, because there is no dict "
-    #             "of tokenizer outputs to return."
-    #         )
-    #     def handle_single_conversation(conversation):
-    #         input_ids = self.get_prefix_tokens() if add_special_tokens else []
-    #         input_message = "[gMASK]<sop>" if add_special_tokens else ""
-    #         for item in conversation:
-    #             if item.get("tools"):
-    #                 tools = item["tools"]
-    #                 content = "你是一个名为 GLM-4 的人工智能助手。你是基于智谱AI训练的语言模型 GLM-4 模型开发的，你的任务是针对用户的问题和要求提供适当的答复和支持。"
-    #                 for tool in tools:
-    #                     if tool["type"] == "function":
-    #                         function = tool["function"]
-    #                         content += f"\n\n## {function['name']}\n\n{json.dumps(function, ensure_ascii=False, indent=4)}"
-    #                         content += "\n在调用上述函数时，请使用 Json 格式表示调用的参数。"
-    #                     elif tool["type"] == "python":
-    #                         content += "\n\n## python\n\n当你向 `python` 发送包含 Python 代码的消息时，该代码将会在一个有状态的 Jupyter notebook 环境中执行。\n`python` 返回代码执行的输出，或在执行 60 秒后返回超时。\n`/mnt/data` 将会持久化存储你的文件。在此会话中，`python` 无法访问互联网。不要使用 `python` 进行任何网络请求或者在线 API 调用，这些在线内容的访问将不会成功。"
-    #                     elif tool["type"] == "simple_browser":
-    #                         content += "\n\n## simple_browser\n\n你可以使用 `simple_browser` 工具。该工具支持以下函数：\n`search(query: str, recency_days: int)`：使用搜索引擎进行查询并显示结果，可以使用 `recency_days` 参数控制搜索内容的时效性。\n`mclick(ids: list[int])`：获取一系列指定 id 的页面内容。每次调用时，须选择3-10个页面。选择多个角度的页面，同时尽可能选择可信任的信息来源。考虑到部分页面是无法加载的，你也可以多打开一些可能有用的页面而不用担心内容过多。\n`open_url(url: str)`：打开指定的 URL。\n\n使用 `【{引用 id}†{引用文本}】` 来引用内容。\n\n操作步骤：1. 使用 `search` 来获得信息列表; 2. 使用 `mclick` 来获取指定 ID 页面的内容; 3. 根据获得的内容进行回复。在回复中应当引用信息来源。\n 如果用户提供了 URL，也可以用 `open_url` 直接打开页面。\n如果初次搜索结果没有找到合适的信息，也可以再次使用 `search` 进行搜索。"
-    #                     elif tool["type"] == "cogview":
-    #                         content += "\n\n## cogview\n\n如果用户的请求中包含了对图像的描述，你可以使用 `cogview` 来生成图像并展示给用户。你需要向 `cogview` 发送图像描述，规则：\n- 发送给 `cogview` 的消息必须使用英语。用户的中文描述必须完全翻译为英语。\n- 应当尽可能详细地描述图像生成的需求，需求描述约 100 英文单词。\n- 保持用户原始描述的意图。不要虚构内容或者没见过的人物。\n- 如无特殊说明，所在地为中国，持有中国立场并遵循中国社会主义价值观。"
-    #                     else:
-    #                         raise NotImplementedError(f"Unknown tool type {tool['type']}")
-    #                 input = self.build_single_message("system", "", content, tokenize=tokenize)
-    #                 if tokenize:
-    #                     input_ids.extend(input)
-    #                 else:
-    #                     input_message += input
-    #             if item["content"]:
-    #                 input = self.build_single_message(
-    #                     item["role"],
-    #                     item.get("metadata", ""),
-    #                     item["content"],
-    #                     tokenize=tokenize
-    #                 )
-    #                 if tokenize:
-    #                     input_ids.extend(input)
-    #                 else:
-    #                     input_message += input
-    #         if add_generation_prompt:
-    #             if tokenize:
-    #                 input_ids.extend([self.convert_tokens_to_ids("<|assistant|>")])
-    #             else:
-    #                 input_message += "<|assistant|>"
-    #         return input_ids if tokenize else input_message
-    #     # Main logic to handle different conversation formats
-    #     if isinstance(conversation, list) and all(isinstance(i, dict) for i in conversation):
-    #         result = handle_single_conversation(conversation)
-    #     elif isinstance(conversation, list) and all(isinstance(i, list) for i in conversation):
-    #         result = [handle_single_conversation(c) for c in conversation]
-    #     elif hasattr(conversation, "messages"):
-    #         result = handle_single_conversation(conversation.messages)
-    #     else:
-    #         raise ValueError("Invalid conversation format")
-    #     if tokenize:
-    #         output = self.batch_encode_plus(
-    #             [result] if isinstance(result[0], int) else result,
-    #             padding=padding,
-    #             truncation=truncation,
-    #             max_length=max_length,
-    #             return_tensors=return_tensors,
-    #             is_split_into_words=True,
-    #             add_special_tokens=False
-    #         )
-    #         if return_dict:
-    #             return output
-    #         else:
-    #             return output["input_ids"]
-    #     else:
-    #         return result
     def build_inputs_with_special_tokens(

         prefix_tokens = [self.convert_tokens_to_ids("[gMASK]"), self.convert_tokens_to_ids("<sop>")]
         return prefix_tokens
+    """ Use chat_template instead; apply_chat_template is no longer needed.
     def build_single_message(self, role, metadata, message, tokenize=True):
         assert role in ["system", "user", "assistant", "observation"], role
         if tokenize:
             return str(f"<|{role}|>{metadata}\n{message}")
+    def apply_chat_template(
+            self,
+            conversation: Union[List[Dict[str, str]], List[List[Dict[str, str]]], "Conversation"],
+            add_generation_prompt: bool = False,
+            tokenize: bool = True,
+            padding: bool = False,
+            truncation: bool = False,
+            max_length: Optional[int] = None,
+            return_tensors: Optional[Union[str, TensorType]] = None,
+            return_dict: bool = False,
+            tokenizer_kwargs: Optional[Dict[str, Any]] = None,
+            add_special_tokens: bool = True,
+            **kwargs,
+    ) -> Union[str, List[int], List[str], List[List[int]], BatchEncoding]:
+        if return_dict and not tokenize:
+            raise ValueError(
+                "`return_dict=True` is incompatible with `tokenize=False`, because there is no dict "
+                "of tokenizer outputs to return."
+            )
+        def handle_single_conversation(conversation):
+            input_ids = self.get_prefix_tokens() if add_special_tokens else []
+            input_message = "[gMASK]<sop>" if add_special_tokens else ""
+            for item in conversation:
+                if item.get("tools"):
+                    tools = item["tools"]
+                    content = "你是一个名为 GhatGLM 的人工智能助手。你是基于智谱AI训练的语言模型 GLM-4 模型开发的，你的任务是针对用户的问题和要求提供适当的答复和支持。"
+                    content += "\n\n# 可用工具"
+                    for tool in tools:
+                        if tool["type"] == "function":
+                            function = tool["function"]
+                            content += f"\n\n## {function['name']}\n\n{json.dumps(function, ensure_ascii=False, indent=4)}"
+                            content += "\n在调用上述函数时，请使用 Json 格式表示调用的参数。"
+                        elif tool["type"] == "python":
+                            content += "\n\n## python\n\n当你向 `python` 发送包含 Python 代码的消息时，该代码将会在一个有状态的 Jupyter notebook 环境中执行。\n`python` 返回代码执行的输出，或在执行 60 秒后返回超时。\n`/mnt/data` 将会持久化存储你的文件。在此会话中，`python` 无法访问互联网。不要使用 `python` 进行任何网络请求或者在线 API 调用，这些在线内容的访问将不会成功。"
+                        elif tool["type"] == "simple_browser":
+                            content += "\n\n## simple_browser\n\n你可以使用 `simple_browser` 工具。该工具支持以下函数：\n`search(query: str, recency_days: int)`：使用搜索引擎进行查询并显示结果，可以使用 `recency_days` 参数控制搜索内容的时效性。\n`mclick(ids: list[int])`：获取一系列指定 id 的页面内容。每次调用时，须选择3-10个页面。选择多个角度的页面，同时尽可能选择可信任的信息来源。考虑到部分页面是无法加载的，你也可以多打开一些可能有用的页面而不用担心内容过多。\n`open_url(url: str)`：打开指定的 URL。\n\n使用 `【{引用 id}†{引用文本}】` 来引用内容。\n\n操作步骤：1. 使用 `search` 来获得信息列表; 2. 使用 `mclick` 来获取指定 ID 页面的内容; 3. 根据获得的内容进行回复。在回复中应当引用信息来源。\n 如果用户提供了 URL，也可以用 `open_url` 直接打开页面。\n如果初次搜索结果没有找到合适的信息，也可以再次使用 `search` 进行搜索。"
+                        elif tool["type"] == "cogview":
+                            content += "\n\n## cogview\n\n如果用户的请求中包含了对图像的描述，你可以使用 `cogview` 来生成图像并展示给用户。你需要向 `cogview` 发送图像描述，规则：\n- 发送给 `cogview` 的消息必须使用英语。用户的中文描述必须完全翻译为英语。\n- 应当尽可能详细地描述图像生成的需求，需求描述约 100 英文单词。\n- 保持用户原始描述的意图。不要虚构内容或者没见过的人物。\n- 如无特殊说明，所在地为中国，持有中国立场并遵循中国社会主义价值观。"
+                        else:
+                            raise NotImplementedError(f"Unknown tool type {tool['type']}")
+                    input = self.build_single_message("system", "", content, tokenize=tokenize)
+                    if tokenize:
+                        input_ids.extend(input)
+                    else:
+                        input_message += input
+                if item["content"]:
+                    input = self.build_single_message(
+                        item["role"],
+                        item.get("metadata", ""),
+                        item["content"],
+                        tokenize=tokenize
+                    )
+                    if tokenize:
+                        input_ids.extend(input)
+                    else:
+                        input_message += input
+            if add_generation_prompt:
+                if tokenize:
+                    input_ids.extend([self.convert_tokens_to_ids("<|assistant|>")])
+                else:
+                    input_message += "<|assistant|>"
+            return input_ids if tokenize else input_message
+        # Main logic to handle different conversation formats
+        if isinstance(conversation, list) and all(isinstance(i, dict) for i in conversation):
+            result = handle_single_conversation(conversation)
+        elif isinstance(conversation, list) and all(isinstance(i, list) for i in conversation):
+            result = [handle_single_conversation(c) for c in conversation]
+        elif hasattr(conversation, "messages"):
+            result = handle_single_conversation(conversation.messages)
+        else:
+            raise ValueError("Invalid conversation format")
+    """
     def build_inputs_with_special_tokens(