Upload folder using huggingface_hub

Files changed (9)

config.json CHANGED

@@ -1,5 +1,4 @@
 {
-  "_name_or_path": "/mnt/step2-alignment-jfs/zane/opensources_model/Qwen2.5-32B",
   "architectures": [
     "Qwen2ForCausalLM"
   ],
@@ -11,19 +10,18 @@
   "initializer_range": 0.02,
   "intermediate_size": 27648,
   "max_position_embeddings": 131072,
-  "max_window_layers": 64,
   "model_type": "qwen2",
   "num_attention_heads": 40,
   "num_hidden_layers": 64,
   "num_key_value_heads": 8,
   "rms_norm_eps": 1e-05,
-  "rope_scaling": null,
   "rope_theta": 1000000.0,
-  "sliding_window": null,
   "tie_word_embeddings": false,
   "torch_dtype": "bfloat16",
-  "transformers_version": "4.46.1",
-  "use_cache": false,
   "use_sliding_window": false,
   "vocab_size": 152064
-}

 {
   "architectures": [
     "Qwen2ForCausalLM"
   ],
   "initializer_range": 0.02,
   "intermediate_size": 27648,
   "max_position_embeddings": 131072,
+  "max_window_layers": 70,
   "model_type": "qwen2",
   "num_attention_heads": 40,
   "num_hidden_layers": 64,
   "num_key_value_heads": 8,
   "rms_norm_eps": 1e-05,
   "rope_theta": 1000000.0,
+  "sliding_window": 131072,
   "tie_word_embeddings": false,
   "torch_dtype": "bfloat16",
+  "transformers_version": "4.43.1",
+  "use_cache": true,
   "use_sliding_window": false,
   "vocab_size": 152064
+}

model-00001-of-00005.safetensors ADDED

+version https://git-lfs.github.com/spec/v1
+oid sha256:72752bbdb84b52de8953ecb5bed6be0fb4b972f56431aab85c4319d9846a2beb
+size 12813971088

model-00002-of-00005.safetensors ADDED

+version https://git-lfs.github.com/spec/v1
+oid sha256:3f8c0c9c632673ed4ce42162be30cb11ee04edd21cfee4225f94837743050de4
+size 13705416016

model-00003-of-00005.safetensors ADDED

+version https://git-lfs.github.com/spec/v1
+oid sha256:4b826ad70084614aac514f686575bada6069f610e76af8a914e5b0f99494429f
+size 14219197672

model-00004-of-00005.safetensors ADDED

+version https://git-lfs.github.com/spec/v1
+oid sha256:7e4d8d033ed89f21f618bf52f507c58330fb91e1ee39615a9a8c05d73835013d
+size 13936082040

model-00005-of-00005.safetensors ADDED

+version https://git-lfs.github.com/spec/v1
+oid sha256:d8a2cb250c065bc2f86d8530b163b9c782d3a7fef2ec9a4ec1e5756501e34e5a
+size 10853174920

model.safetensors.index.json CHANGED

The diff for this file is too large to render. See raw diff

tokenizer.json CHANGED

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:9c5ae00e602b8860cbd784ba82a8aa14e8feecec692e7076590d014d7b7fdafa
-size 11421896

 version https://git-lfs.github.com/spec/v1
+oid sha256:a8506e7111b80c6d8635951a02eab0f4e1a8e4e5772da83846579e97b16f61bf
+size 7031673

tokenizer_config.json CHANGED

@@ -195,7 +195,7 @@
     "<|video_pad|>"
   ],
   "bos_token": null,
-  "chat_template": "{{ bos_token }}A conversation between User and Assistant. The User asks a question, and the Assistant solves it. The Assistant first thinks about the reasoning process in the mind and then provides the User with the answer. The reasoning process is enclosed within <think> </think> and answer is enclosed within <answer> </answer> tags, respectively, i.e., <think> reasoning process here </think> <answer> answer here </answer>. {% for message in messages %}{% if message['role'] == 'user' %}User: You must put your answer inside <answer> </answer> tags, i.e., <answer> answer here </answer>. And your final answer will be extracted automatically by the \\boxed{} tag.\nThis is the problem:\n{{ message['content'] }}\n{% elif message['role'] == 'assistant' %}Assistant: <think>{{ message['content'] }}</answer>\n{% endif %}{% endfor %}{% if add_generation_prompt %}Assistant: <think>{% endif %}",
   "clean_up_tokenization_spaces": false,
   "eos_token": "<|endoftext|>",
   "errors": "replace",

     "<|video_pad|>"
   ],
   "bos_token": null,
+  "chat_template": "{%- if messages[0]['role'] == 'system' %}\n    {{- messages[0]['content'] }}\n{%- else %}\n    {{- 'A conversation between User and Assistant. The User asks a question, and the Assistant solves it. The Assistant first thinks about the reasoning process in the mind and then provides the User with the answer. The reasoning process is enclosed within <think> </think> and answer is enclosed within <answer> </answer> tags, respectively, i.e., <think> reasoning process here </think> <answer> answer here </answer>. ' }}\n{%- endif %}\n{%- for message in messages %}\n    {%- if (message.role == \"user\") %}\n        {{- 'User: ' + message.content + '\\n' }}\n    {%- elif message.role == \"assistant\" %}\n        {{- 'Assistant: <think>' + message.content + '\\n' }}\n    {%- endif %}\n{%- endfor %}\n{%- if add_generation_prompt %}\n    {{- 'Assistant: <think>' }}\n{%- endif %}\n",
   "clean_up_tokenization_spaces": false,
   "eos_token": "<|endoftext|>",
   "errors": "replace",