riczhou committed on
Commit
b30a281
·
verified ·
1 Parent(s): 2943235

Upload folder using huggingface_hub

Browse files
This view is limited to 50 files because it contains too many changes.   See raw diff
.gitattributes CHANGED
@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ tokenizer.json filter=lfs diff=lfs merge=lfs -text
merges.txt ADDED
The diff for this file is too large to render. See raw diff
 
mlc-chat-config.json ADDED
@@ -0,0 +1,85 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "version": "0.1.0",
3
+ "model_type": "qwen3",
4
+ "quantization": "q4f32_1",
5
+ "model_config": {
6
+ "hidden_act": "silu",
7
+ "hidden_size": 5120,
8
+ "intermediate_size": 17408,
9
+ "attention_bias": false,
10
+ "num_attention_heads": 40,
11
+ "num_hidden_layers": 40,
12
+ "num_key_value_heads": 8,
13
+ "rms_norm_eps": 1e-06,
14
+ "rope_theta": 1000000,
15
+ "vocab_size": 151936,
16
+ "tie_word_embeddings": false,
17
+ "context_window_size": 40960,
18
+ "prefill_chunk_size": 2048,
19
+ "tensor_parallel_shards": 1,
20
+ "head_dim": 128,
21
+ "dtype": "float32",
22
+ "max_batch_size": 128
23
+ },
24
+ "vocab_size": 151936,
25
+ "context_window_size": 40960,
26
+ "sliding_window_size": -1,
27
+ "prefill_chunk_size": 2048,
28
+ "attention_sink_size": -1,
29
+ "tensor_parallel_shards": 1,
30
+ "pipeline_parallel_stages": 1,
31
+ "temperature": 0.6,
32
+ "presence_penalty": 0.0,
33
+ "frequency_penalty": 0.0,
34
+ "repetition_penalty": 1.0,
35
+ "top_p": 0.95,
36
+ "tokenizer_files": [
37
+ "tokenizer.json",
38
+ "vocab.json",
39
+ "merges.txt",
40
+ "tokenizer_config.json"
41
+ ],
42
+ "tokenizer_info": {
43
+ "token_postproc_method": "byte_level",
44
+ "prepend_space_in_encode": false,
45
+ "strip_space_in_decode": false
46
+ },
47
+ "conv_template": {
48
+ "name": "qwen2",
49
+ "system_template": "<|im_start|>system\n{system_message}<|im_end|>\n",
50
+ "system_message": "You are a helpful assistant.",
51
+ "system_prefix_token_ids": null,
52
+ "add_role_after_system_message": true,
53
+ "roles": {
54
+ "user": "<|im_start|>user",
55
+ "assistant": "<|im_start|>assistant"
56
+ },
57
+ "role_templates": {
58
+ "user": "{user_message}",
59
+ "assistant": "{assistant_message}",
60
+ "tool": "{tool_message}"
61
+ },
62
+ "messages": [],
63
+ "seps": [
64
+ "<|im_end|>\n"
65
+ ],
66
+ "role_content_sep": "\n",
67
+ "role_empty_sep": "\n",
68
+ "stop_str": [
69
+ "<|endoftext|>",
70
+ "<|im_end|>"
71
+ ],
72
+ "stop_token_ids": [
73
+ 151643,
74
+ 151645
75
+ ],
76
+ "function_string": "",
77
+ "use_function_calling": false
78
+ },
79
+ "pad_token_id": 151643,
80
+ "bos_token_id": 151643,
81
+ "eos_token_id": [
82
+ 151645,
83
+ 151643
84
+ ]
85
+ }
ndarray-cache-b16.json ADDED
The diff for this file is too large to render. See raw diff
 
ndarray-cache.json ADDED
The diff for this file is too large to render. See raw diff
 
params_shard_0.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:843bac9acc3333302ec1687358f5a20b2df2010f3700efc1ddc640147e2a3f54
3
+ size 388956160
params_shard_1.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8e57af34f8b90d3adf045a33ea70fd0b3ce504bbbad11944645d386f61d0fc68
3
+ size 48619520
params_shard_10.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2b97ef0a5a5a0f3d028ce4e7236d39182ba83e2ccb09a67166ba911585fa336c
3
+ size 44564480
params_shard_100.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:70ba25ff81add02cbe68ae702e4764f7cacda5ee373889c5b3e336913f163497
3
+ size 44564480
params_shard_101.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d7aad04c24ab5e675aadc24bc340c5c850a049725529ee3e7c321af2c6bd97f5
3
+ size 89128960
params_shard_102.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2c79509c8f84755d78855fc9c2b01972e9e44ed9f12fd28807926d62e13cea9c
3
+ size 18350080
params_shard_103.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:32958e437c2860f65f02052e8de60bb8966436ea7a7bd34f50855ca91e46e70d
3
+ size 31478272
params_shard_104.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b6d350b5cf65f0856fe78ba2e017ff9c2676ae891faa97dbec9bb26bcf9a2200
3
+ size 44564480
params_shard_105.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4f53ff3b6cee46e79256bbb77bea402fee928579cb3b9f5ca8b42d9569e44209
3
+ size 89128960
params_shard_106.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f31017de7148a3d3cc34022fc3c124908f8796b7c47301ee92e5a14d5539edc0
3
+ size 22620416
params_shard_107.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3dd23bb0d7bf0aff8afaf94e2bb970d3846b8b7a42c9d0ed24e154c0d1832718
3
+ size 31795456
params_shard_108.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:952a03f52eabace881d4aee6a93271cb9a1d6f96385286120ea794d0a997b5d0
3
+ size 44564480
params_shard_109.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d5caa9cfc1b96e295fb29c68227f89a248527fb698fe0c18fe7902e48ef2b80b
3
+ size 89128960
params_shard_11.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:963eca975e3c5ab1eaef719b6365b81d4a4aa3ecaa627818cfdc6da6cb36d0ed
3
+ size 89128960
params_shard_110.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4ff724e8da5839645f89cceeb1c1b89a8031f2de2e1e29d2dac331e86432b928
3
+ size 18350080
params_shard_111.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ca0cf836e5f9e631e890a6c3808bfbbfcafba822e6c5ee69500b0af84e558695
3
+ size 31478272
params_shard_112.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:70b55e43e85994df57850ab4d068127da4d35bcf7f74c22bca2063235fa72594
3
+ size 44564480
params_shard_113.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ed01119b0d61e39d471d58351fe59515bdd577a07f6c95f98ba8fa5d0b5da2e4
3
+ size 89128960
params_shard_114.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bead2def6d06f2b424e3e2962ddc5ccaf4d25931edad73fddb77ca3ce67c5bf4
3
+ size 22620416
params_shard_115.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:64b10a7793bfeb857df39b0aaf53ba559252408f1f1b81caa0d2c3efe063a956
3
+ size 31795456
params_shard_116.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:752b1d6b4a3b5eff4f332ad55d37c9b38e1c8d199850cab53b4910ea855790ae
3
+ size 89128960
params_shard_117.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bd50b860a1961d3fbcfeba39a8d16339537351dc63d6202339af8c332bd6aa5c
3
+ size 18350080
params_shard_118.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f7e90871f05415b2418b5c50f4d8f9ab1748b51a6282f5e9e06d160dc2f14f06
3
+ size 28180992
params_shard_119.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:96961026bf6083bcd494a5b086ddcd88730b956ad599246c4ed55d2456d96789
3
+ size 44564480
params_shard_12.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:786d6b6936c7c2adc56570f17f038138a772cc72f9c9edc1033bad0c881c3666
3
+ size 22620416
params_shard_120.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:329e2187fe4048163f42905a5ac21aeddde3855a4a6ec7d06b077d970841e78a
3
+ size 44564480
params_shard_121.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:537ccb4b4c075597856ba5d94f5e97ebbdbec50b8f2f84d73d2808091e448610
3
+ size 89128960
params_shard_122.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:973e3646fa312993ce92847173bbba4cb61895b7d84e1973714c2952ee3a487a
3
+ size 25917696
params_shard_123.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0afd019999e3a638c694096b43dcaf26cf599f957f4c22862913f40ad4f1f9f8
3
+ size 31795456
params_shard_124.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3f65f45e26e7a2af94dc2f4059f05fa13fcc36984109d81f91cff83c45b01a0d
3
+ size 44564480
params_shard_125.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cbc9cec0c5342b8b2bb4afac51630df1b78564564eac3ff40d68082443f102c8
3
+ size 89128960
params_shard_126.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9d8f51775c93a997e1beeecbb161451bad19dd84f33f49f75d99da78d9472935
3
+ size 18350080
params_shard_127.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:218acd3d945779823f6854f09e1b7bd636ff4b05c19ac44cb91cf747c662ffd4
3
+ size 31478272
params_shard_128.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0e29018b0d66629caa530234798087720f25bc1e68afd2d91c03fbf502935fba
3
+ size 44564480
params_shard_129.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e7e928af79cc4aa7a693e2329e8b09d167bbb44e7efa24f02a8c60d5981e0c21
3
+ size 89128960
params_shard_13.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:45000d14d5f10ce9bfb7f21968d9613077b3512df128ce920c059559ed46f98f
3
+ size 31795456
params_shard_130.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2e8dfea49fdcbf25995426f95a19d3748491f779e829f86edd363db06c480c53
3
+ size 22620416
params_shard_131.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0a59bb41a388ce2b7d3aa4ac178c42be80e00123be99ee54866d28e952326595
3
+ size 31795456
params_shard_132.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5cb1dbd0cb26b53675e77f0600acba2f2cfba2afefca9b3df5edbefceaf2a929
3
+ size 44564480
params_shard_133.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2fb270558a597fb4c26d8786db86c76a5591c926c43225a7f2da43aaa474a55f
3
+ size 89128960
params_shard_134.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2fe22bdb8cbf52d29502ee2f09411ea63b638044d2fb851496b08db34692b911
3
+ size 18350080
params_shard_135.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:aa2619466ef604a1ed9cd10a8da3848ceb0c0317bdc127bd5966c22dd02d6abf
3
+ size 31478272
params_shard_136.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2978165a9388fb98d5b1b7365ec1b6d4ae1975a1bc0ea9eeab333256bac9f011
3
+ size 44564480
params_shard_137.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:89ece6dcb7d501730a5c1c8f398eda4f46e8ec1db1a883724ad347191786768d
3
+ size 89128960
params_shard_138.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:405df3b0e5aad34ba09cc486488a3d9d88197d2298ca5cb332ffbd37f6dd9a7c
3
+ size 22620416