riczhou committed on
Commit
06c924a
·
verified ·
1 Parent(s): 4109bbb

Upload folder using huggingface_hub

Browse files
This view is limited to 50 files because it contains too many changes. See raw diff
.gitattributes CHANGED
@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ tokenizer.json filter=lfs diff=lfs merge=lfs -text
merges.txt ADDED
The diff for this file is too large to render. See raw diff
 
mlc-chat-config.json ADDED
@@ -0,0 +1,85 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "version": "0.1.0",
3
+ "model_type": "qwen3",
4
+ "quantization": "q4f16_1",
5
+ "model_config": {
6
+ "hidden_act": "silu",
7
+ "hidden_size": 5120,
8
+ "intermediate_size": 17408,
9
+ "attention_bias": false,
10
+ "num_attention_heads": 40,
11
+ "num_hidden_layers": 40,
12
+ "num_key_value_heads": 8,
13
+ "rms_norm_eps": 1e-06,
14
+ "rope_theta": 1000000,
15
+ "vocab_size": 151936,
16
+ "tie_word_embeddings": false,
17
+ "context_window_size": 40960,
18
+ "prefill_chunk_size": 2048,
19
+ "tensor_parallel_shards": 1,
20
+ "head_dim": 128,
21
+ "dtype": "float32",
22
+ "max_batch_size": 128
23
+ },
24
+ "vocab_size": 151936,
25
+ "context_window_size": 40960,
26
+ "sliding_window_size": -1,
27
+ "prefill_chunk_size": 2048,
28
+ "attention_sink_size": -1,
29
+ "tensor_parallel_shards": 1,
30
+ "pipeline_parallel_stages": 1,
31
+ "temperature": 0.6,
32
+ "presence_penalty": 0.0,
33
+ "frequency_penalty": 0.0,
34
+ "repetition_penalty": 1.0,
35
+ "top_p": 0.95,
36
+ "tokenizer_files": [
37
+ "tokenizer.json",
38
+ "vocab.json",
39
+ "merges.txt",
40
+ "tokenizer_config.json"
41
+ ],
42
+ "tokenizer_info": {
43
+ "token_postproc_method": "byte_level",
44
+ "prepend_space_in_encode": false,
45
+ "strip_space_in_decode": false
46
+ },
47
+ "conv_template": {
48
+ "name": "qwen2",
49
+ "system_template": "<|im_start|>system\n{system_message}<|im_end|>\n",
50
+ "system_message": "You are a helpful assistant.",
51
+ "system_prefix_token_ids": null,
52
+ "add_role_after_system_message": true,
53
+ "roles": {
54
+ "user": "<|im_start|>user",
55
+ "assistant": "<|im_start|>assistant"
56
+ },
57
+ "role_templates": {
58
+ "user": "{user_message}",
59
+ "assistant": "{assistant_message}",
60
+ "tool": "{tool_message}"
61
+ },
62
+ "messages": [],
63
+ "seps": [
64
+ "<|im_end|>\n"
65
+ ],
66
+ "role_content_sep": "\n",
67
+ "role_empty_sep": "\n",
68
+ "stop_str": [
69
+ "<|endoftext|>",
70
+ "<|im_end|>"
71
+ ],
72
+ "stop_token_ids": [
73
+ 151643,
74
+ 151645
75
+ ],
76
+ "function_string": "",
77
+ "use_function_calling": false
78
+ },
79
+ "pad_token_id": 151643,
80
+ "bos_token_id": 151643,
81
+ "eos_token_id": [
82
+ 151645,
83
+ 151643
84
+ ]
85
+ }
ndarray-cache.json ADDED
The diff for this file is too large to render. See raw diff
 
params_shard_0.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9a6fba7021e507e1da0a94ee43225dc88ad4425289f80c224ced97b016e481df
3
+ size 388956160
params_shard_1.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2a2249d4edc224f40fffd34d3f9d9cfdbc9abfbc9ea596c7ae34d33bb68f1174
3
+ size 48619520
params_shard_10.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d81051c5a7395141b33b9180ac84fb2241d74a8e5e48c7159afacfd4af04dfce
3
+ size 44564480
params_shard_100.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:44cbebf1021087c8001196ee6bd37f54cb275c8ae9b8213a3953d467691e31fa
3
+ size 44564480
params_shard_101.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1339f5f41c9442f0ceef286b47d236fd6196447754bd6c4bbd0726fabbf20996
3
+ size 89128960
params_shard_102.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c1030584da3c8d31afedc416ae5c24c55c3555ddfe9defc324b6121da59b88a1
3
+ size 18350080
params_shard_103.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c827c728ca1e7095d7e617a50e97abf811426d7b55051f6ce4b8f14617ab680d
3
+ size 31478272
params_shard_104.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:81fae19a3a99db67a96e8f9895f82a5a6523183a4421a348fe91c9e8be5090d0
3
+ size 44564480
params_shard_105.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:213abec8d7ac007942ffa15d281841de758587e64242c5e1ec9d33a7febe51ce
3
+ size 89128960
params_shard_106.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:675b87c80888f9b51a2c0f513bb026cbc1f9ecbfb50a79e5f330d8785da87a8c
3
+ size 22620416
params_shard_107.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0b26ab2e2f2e67f7cb822e650aaf97f608d0ba923f31e26ecbfb9c4aff445691
3
+ size 31795456
params_shard_108.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b4016eebfb120f7e62b3e4257f38300c01f7eb86426d39dab047a1b81f83e84e
3
+ size 44564480
params_shard_109.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d298cbf94e3a53a41cb58ae07899a3994cf296341bddf886aee086a151b3b7d5
3
+ size 89128960
params_shard_11.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3b708811c2f748422fddcca0174745ca47e4f665797d2b4598e4430553b8e950
3
+ size 89128960
params_shard_110.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0050091c00a5502ab73960b44923856ddc71847d65df7240149ab5e27143097b
3
+ size 18350080
params_shard_111.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a292aa8181a2581511db812e47068251b2c72dcb4a0b19eb6b2c964393a7fd00
3
+ size 31478272
params_shard_112.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f2213746c10b6b1445e594bce6aa487ac34e35d6d0006f48e7652dcde1e69e07
3
+ size 44564480
params_shard_113.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:93620041a0ebbbcde5c10c6f6c289b4af88278308226115f022a5b6b37529916
3
+ size 89128960
params_shard_114.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:424d8ec96d2d199002bf1d33c9512a373e046f6106d7c4cbbf2d6dc364065658
3
+ size 22620416
params_shard_115.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:be0be1da608055d9f75253ea2b35d60b7c3c94f6cabca5a3e08cdb86769c9990
3
+ size 31795456
params_shard_116.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:929aac7820696e8a3a1abc9385363daa21512dd06e915f088e0377a8e47aadbb
3
+ size 89128960
params_shard_117.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:63a4a879b42e4b1c6fd2a3527d68db432a934908bdfcbbef920520d3086529ce
3
+ size 18350080
params_shard_118.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2ae1e6db3d940467dff27b954a32262582893721e7696e3bd34b6c8714023ed4
3
+ size 28180992
params_shard_119.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9f540c3b865c4fc0fa877a381ed8b9b3469638e4edf74bb6ded9d3a7208cee6a
3
+ size 44564480
params_shard_12.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9660f1374217489e3f711aaea2963a4eabf6e4165a58fe3850ce05b9aa2d8036
3
+ size 22620416
params_shard_120.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a445a447073f4f51bc6c110a68e12d83d79736700e77ce2c714f792b03670d2e
3
+ size 44564480
params_shard_121.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c741772b9ffa53c170eb57410514574f85977b9e51d46b346a4ee19b36add842
3
+ size 89128960
params_shard_122.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e21958d0b5843adee0e0e2a1240064966dfa1a9297ddf29bf39510483059ac50
3
+ size 25917696
params_shard_123.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:77422a86b7407a5c517381e993283146e84e7fbdd7e0a29ccfa389667d2a9e20
3
+ size 31795456
params_shard_124.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:247af123fb51777d12788a6337f22b4d92888674f7c4c35d19c80e854e77bc54
3
+ size 44564480
params_shard_125.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:36ac578a7c942015fd3ccab7a057517841012d9d141de65d303f4fa0abb73bc4
3
+ size 89128960
params_shard_126.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:369159aee4c54d00ef70fec32b06e7b3bc70d65a70377891bf43d764e8edd683
3
+ size 18350080
params_shard_127.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:371cf250a0bf4b60f12f1862e7f55e1f235b3b7ce6e0728ec2d53b067a1cf717
3
+ size 31478272
params_shard_128.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:db66a2b761ea75606f1e1f396b45b367ea67aa33819e70afefb72aa5b0662db0
3
+ size 44564480
params_shard_129.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c99ce9f18413eb5e4ea186c00b1b680740d0348b080d8fdeb38fbcb1b0a6bffd
3
+ size 89128960
params_shard_13.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bdeed54c36b0153e1417f067bc430455537b8b966d1127dc5595ff5a943f5c64
3
+ size 31795456
params_shard_130.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7a108ec091739bdb18aeb44c1567ebe21c64bc5f4751169511ca6c96f454370a
3
+ size 22620416
params_shard_131.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9f395220f490406d8a7165b2d70ca062ea0fc7903e65622dbc5d1444ca397bda
3
+ size 31795456
params_shard_132.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c5253659327ef430dc01694ce4b01c40731ca979503625549fbb2ee825f24868
3
+ size 44564480
params_shard_133.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5a8450f6af8d0617566a1732321be77e8eee2ae42c538e1bbe0fb0044982a512
3
+ size 89128960
params_shard_134.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2fc37758ca05cd9fa8dc31d45f7c5092078eb2d7c2889223954de64df298c110
3
+ size 18350080
params_shard_135.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dfabe31fc2607ce647d638bfc1fe83de1bc441f3cde7d59fac592f87057b8de3
3
+ size 31478272
params_shard_136.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b40a47ad0699330db5890910486910e532048135bf502acc05e6113938e3efae
3
+ size 44564480
params_shard_137.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:aa32c2d69e76f7286aba6689ba8ca1cf2f65a78b4f2bfb24a76ac2d667bd258e
3
+ size 89128960
params_shard_138.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c3332a34601c08fe151c486943e13e482b060b2a701ab00d5d7af97cadfe87a9
3
+ size 22620416
params_shard_139.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5973e48a88da356f950f8d22c0d7308ff0e50243d37ddfb5b6c345ff843ee167
3
+ size 31795456