Inho Oh committed on
Commit
225b1a3
·
1 Parent(s): 395003d

update to use full fine-tuning

Browse files

Signed-off-by: Inho Oh <[email protected]>

ndarray-cache.json CHANGED
@@ -22,7 +22,7 @@
22
  "byteOffset": 0
23
  }
24
  ],
25
- "md5sum": "493b5641a854a7800c7fa11483aad4f7"
26
  },
27
  {
28
  "dataPath": "params_shard_1.bin",
@@ -373,7 +373,7 @@
373
  "byteOffset": 33169664
374
  }
375
  ],
376
- "md5sum": "497d78221d7a23bd4c5e89f4304ae0bd"
377
  },
378
  {
379
  "dataPath": "params_shard_2.bin",
@@ -842,7 +842,7 @@
842
  "byteOffset": 32989184
843
  }
844
  ],
845
- "md5sum": "e7ff64137eff92c60593a150717a9dcd"
846
  },
847
  {
848
  "dataPath": "params_shard_3.bin",
@@ -1311,7 +1311,7 @@
1311
  "byteOffset": 33051392
1312
  }
1313
  ],
1314
- "md5sum": "0476638568978882217d1c7e293d948e"
1315
  },
1316
  {
1317
  "dataPath": "params_shard_4.bin",
@@ -1760,7 +1760,7 @@
1760
  "byteOffset": 28662784
1761
  }
1762
  ],
1763
- "md5sum": "933a6b65e1d7141d7bd847ad454fc56d"
1764
  },
1765
  {
1766
  "dataPath": "params_shard_5.bin",
@@ -2229,7 +2229,7 @@
2229
  "byteOffset": 28939264
2230
  }
2231
  ],
2232
- "md5sum": "78b5a93295b12ffcba820c0e32eded1d"
2233
  },
2234
  {
2235
  "dataPath": "params_shard_6.bin",
@@ -2698,7 +2698,7 @@
2698
  "byteOffset": 31118336
2699
  }
2700
  ],
2701
- "md5sum": "ea93e8edfbe16d3ffe05cb466f752abc"
2702
  },
2703
  {
2704
  "dataPath": "params_shard_7.bin",
@@ -2931,7 +2931,7 @@
2931
  "byteOffset": 14604032
2932
  }
2933
  ],
2934
- "md5sum": "e2c330e3708ce0442a5cf83730738904"
2935
  }
2936
  ]
2937
  }
 
22
  "byteOffset": 0
23
  }
24
  ],
25
+ "md5sum": "a597e14ea300c8147d9e40af43fec21d"
26
  },
27
  {
28
  "dataPath": "params_shard_1.bin",
 
373
  "byteOffset": 33169664
374
  }
375
  ],
376
+ "md5sum": "719aa0a12714b39727d65fcdaaaa0869"
377
  },
378
  {
379
  "dataPath": "params_shard_2.bin",
 
842
  "byteOffset": 32989184
843
  }
844
  ],
845
+ "md5sum": "59872bb3b80a79849c828d5508227dba"
846
  },
847
  {
848
  "dataPath": "params_shard_3.bin",
 
1311
  "byteOffset": 33051392
1312
  }
1313
  ],
1314
+ "md5sum": "bb4c708ea2d1546633a01c3cf366fa31"
1315
  },
1316
  {
1317
  "dataPath": "params_shard_4.bin",
 
1760
  "byteOffset": 28662784
1761
  }
1762
  ],
1763
+ "md5sum": "98278d4fd0a53b469c05fdfcf79dcb5c"
1764
  },
1765
  {
1766
  "dataPath": "params_shard_5.bin",
 
2229
  "byteOffset": 28939264
2230
  }
2231
  ],
2232
+ "md5sum": "6e0ee62704a9006346886af5aa46dbff"
2233
  },
2234
  {
2235
  "dataPath": "params_shard_6.bin",
 
2698
  "byteOffset": 31118336
2699
  }
2700
  ],
2701
+ "md5sum": "f4f2726f049dfc458c5e86f51a60daae"
2702
  },
2703
  {
2704
  "dataPath": "params_shard_7.bin",
 
2931
  "byteOffset": 14604032
2932
  }
2933
  ],
2934
+ "md5sum": "cf3bf3970dc9bb13089cbe31a6e69f7f"
2935
  }
2936
  ]
2937
  }
params_shard_0.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9f309954d310dc63adfaf3ef6aa987c681b8aa6d1b9686aa2525b454b0d058d5
3
  size 68067328
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ceb1ce049bf3ba6a7f77a4c99002e77d53b2f8b75f9eec77e711bfe732b20b6b
3
  size 68067328
params_shard_1.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f00b1382ec7495799f1304e3ad837186775d1faac641917e9a663471f6951023
3
  size 33234176
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:32e3560e7a1726d2d58efd2bcb4f3dba590b733945a406f624918ee30c9c7da3
3
  size 33234176
params_shard_2.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ae92dc070074ad846c0bb9e6d57b256a621db0976b745b00449b24b726b7f532
3
  size 33505280
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3bfa3a9ebc16786aefd38c8748138d90d9d433b170214986be3db5f02c4e0a1b
3
  size 33505280
params_shard_3.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:bc745314a3024dd73f7d1b12f765926f0686d240516580a37689958e18788408
3
  size 33053696
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:38ab4741405bbbc0279e99e497291295944fcc8116171063072db28845f33fe1
3
  size 33053696
params_shard_4.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2eec019ae20aa3d3cb049f739b76495678fd7498829e04244baaed5a01629da7
3
  size 33020928
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d0d9a3f562b72dd715886a7fe3e9bb0dee00f3e1095bb963567af76095e25328
3
  size 33020928
params_shard_5.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:30b93aae2307d918ca4f5543b9c412f66b8039cb4f86d8cfa3525eab6ed05cc1
3
  size 29211648
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:095d95a5d40d0d5c1a913444ea75f7b446cb0d9476a7e5b9b2ab0030381a0d13
3
  size 29211648
params_shard_6.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4be4486d5051bc7f3215e7bdf918dfc0307c0891a12df5f572660cdeaa3a8c5c
3
  size 33297408
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d6ba5c306fa44fb465029be15cc8621f0b1676e30b0079364fa1f5c3c8514a71
3
  size 33297408
params_shard_7.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4fa0000c8cedeca3065b670f3c68379a93efdf132ef04f35ac1794ea96f5b172
3
  size 14605824
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ad83aa0f9c68a19aa18d5bb8962c64da0fea9c86c59921066bc2ba050ad2d80f
3
  size 14605824
tokenizer_config.json CHANGED
@@ -197,7 +197,7 @@
197
  "bos_token": null,
198
  "chat_template": "{%- if tools %}\n {{- '<|im_start|>system\\n' }}\n {%- if messages[0]['role'] == 'system' %}\n {{- messages[0]['content'] }}\n {%- else %}\n {{- 'You are Qwen, created by Alibaba Cloud. You are a helpful assistant.' }}\n {%- endif %}\n {{- \"\\n\\n# Tools\\n\\nYou may call one or more functions to assist with the user query.\\n\\nYou are provided with function signatures within <tools></tools> XML tags:\\n<tools>\" }}\n {%- for tool in tools %}\n {{- \"\\n\" }}\n {{- tool | tojson }}\n {%- endfor %}\n {{- \"\\n</tools>\\n\\nFor each function call, return a json object with function name and arguments within <tool_call></tool_call> XML tags:\\n<tool_call>\\n{\\\"name\\\": <function-name>, \\\"arguments\\\": <args-json-object>}\\n</tool_call><|im_end|>\\n\" }}\n{%- else %}\n {%- if messages[0]['role'] == 'system' %}\n {{- '<|im_start|>system\\n' + messages[0]['content'] + '<|im_end|>\\n' }}\n {%- else %}\n {{- '<|im_start|>system\\nYou are Qwen, created by Alibaba Cloud. You are a helpful assistant.<|im_end|>\\n' }}\n {%- endif %}\n{%- endif %}\n{%- for message in messages %}\n {%- if (message.role == \"user\") or (message.role == \"system\" and not loop.first) or (message.role == \"assistant\" and not message.tool_calls) %}\n {{- '<|im_start|>' + message.role + '\\n' + message.content + '<|im_end|>' + '\\n' }}\n {%- elif message.role == \"assistant\" %}\n {{- '<|im_start|>' + message.role }}\n {%- if message.content %}\n {{- '\\n' + message.content }}\n {%- endif %}\n {%- for tool_call in message.tool_calls %}\n {%- if tool_call.function is defined %}\n {%- set tool_call = tool_call.function %}\n {%- endif %}\n {{- '\\n<tool_call>\\n{\"name\": \"' }}\n {{- tool_call.name }}\n {{- '\", \"arguments\": ' }}\n {{- tool_call.arguments | tojson }}\n {{- '}\\n</tool_call>' }}\n {%- endfor %}\n {{- '<|im_end|>\\n' }}\n {%- elif message.role == \"tool\" %}\n {%- if (loop.index0 == 0) or (messages[loop.index0 - 1].role != \"tool\") %}\n {{- '<|im_start|>user' }}\n {%- endif %}\n {{- '\\n<tool_response>\\n' }}\n {{- message.content }}\n {{- '\\n</tool_response>' }}\n {%- if loop.last or (messages[loop.index0 + 1].role != \"tool\") %}\n {{- '<|im_end|>\\n' }}\n {%- endif %}\n {%- endif %}\n{%- endfor %}\n{%- if add_generation_prompt %}\n {{- '<|im_start|>assistant\\n' }}\n{%- endif %}\n",
199
  "clean_up_tokenization_spaces": false,
200
- "eos_token": "<|endoftext|>",
201
  "errors": "replace",
202
  "extra_special_tokens": {},
203
  "model_max_length": 131072,
 
197
  "bos_token": null,
198
  "chat_template": "{%- if tools %}\n {{- '<|im_start|>system\\n' }}\n {%- if messages[0]['role'] == 'system' %}\n {{- messages[0]['content'] }}\n {%- else %}\n {{- 'You are Qwen, created by Alibaba Cloud. You are a helpful assistant.' }}\n {%- endif %}\n {{- \"\\n\\n# Tools\\n\\nYou may call one or more functions to assist with the user query.\\n\\nYou are provided with function signatures within <tools></tools> XML tags:\\n<tools>\" }}\n {%- for tool in tools %}\n {{- \"\\n\" }}\n {{- tool | tojson }}\n {%- endfor %}\n {{- \"\\n</tools>\\n\\nFor each function call, return a json object with function name and arguments within <tool_call></tool_call> XML tags:\\n<tool_call>\\n{\\\"name\\\": <function-name>, \\\"arguments\\\": <args-json-object>}\\n</tool_call><|im_end|>\\n\" }}\n{%- else %}\n {%- if messages[0]['role'] == 'system' %}\n {{- '<|im_start|>system\\n' + messages[0]['content'] + '<|im_end|>\\n' }}\n {%- else %}\n {{- '<|im_start|>system\\nYou are Qwen, created by Alibaba Cloud. You are a helpful assistant.<|im_end|>\\n' }}\n {%- endif %}\n{%- endif %}\n{%- for message in messages %}\n {%- if (message.role == \"user\") or (message.role == \"system\" and not loop.first) or (message.role == \"assistant\" and not message.tool_calls) %}\n {{- '<|im_start|>' + message.role + '\\n' + message.content + '<|im_end|>' + '\\n' }}\n {%- elif message.role == \"assistant\" %}\n {{- '<|im_start|>' + message.role }}\n {%- if message.content %}\n {{- '\\n' + message.content }}\n {%- endif %}\n {%- for tool_call in message.tool_calls %}\n {%- if tool_call.function is defined %}\n {%- set tool_call = tool_call.function %}\n {%- endif %}\n {{- '\\n<tool_call>\\n{\"name\": \"' }}\n {{- tool_call.name }}\n {{- '\", \"arguments\": ' }}\n {{- tool_call.arguments | tojson }}\n {{- '}\\n</tool_call>' }}\n {%- endfor %}\n {{- '<|im_end|>\\n' }}\n {%- elif message.role == \"tool\" %}\n {%- if (loop.index0 == 0) or (messages[loop.index0 - 1].role != \"tool\") %}\n {{- '<|im_start|>user' }}\n {%- endif %}\n {{- '\\n<tool_response>\\n' }}\n {{- message.content }}\n {{- '\\n</tool_response>' }}\n {%- if loop.last or (messages[loop.index0 + 1].role != \"tool\") %}\n {{- '<|im_end|>\\n' }}\n {%- endif %}\n {%- endif %}\n{%- endfor %}\n{%- if add_generation_prompt %}\n {{- '<|im_start|>assistant\\n' }}\n{%- endif %}\n",
199
  "clean_up_tokenization_spaces": false,
200
+ "eos_token": "<|im_end|>",
201
  "errors": "replace",
202
  "extra_special_tokens": {},
203
  "model_max_length": 131072,