Upload folder using huggingface_hub
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- .gitattributes +1 -0
- merges.txt +0 -0
- mlc-chat-config.json +85 -0
- ndarray-cache-b16.json +0 -0
- ndarray-cache.json +0 -0
- params_shard_0.bin +3 -0
- params_shard_1.bin +3 -0
- params_shard_10.bin +3 -0
- params_shard_100.bin +3 -0
- params_shard_101.bin +3 -0
- params_shard_102.bin +3 -0
- params_shard_103.bin +3 -0
- params_shard_104.bin +3 -0
- params_shard_105.bin +3 -0
- params_shard_106.bin +3 -0
- params_shard_107.bin +3 -0
- params_shard_108.bin +3 -0
- params_shard_109.bin +3 -0
- params_shard_11.bin +3 -0
- params_shard_110.bin +3 -0
- params_shard_111.bin +3 -0
- params_shard_112.bin +3 -0
- params_shard_113.bin +3 -0
- params_shard_114.bin +3 -0
- params_shard_115.bin +3 -0
- params_shard_116.bin +3 -0
- params_shard_117.bin +3 -0
- params_shard_118.bin +3 -0
- params_shard_119.bin +3 -0
- params_shard_12.bin +3 -0
- params_shard_120.bin +3 -0
- params_shard_121.bin +3 -0
- params_shard_122.bin +3 -0
- params_shard_123.bin +3 -0
- params_shard_124.bin +3 -0
- params_shard_125.bin +3 -0
- params_shard_126.bin +3 -0
- params_shard_127.bin +3 -0
- params_shard_128.bin +3 -0
- params_shard_129.bin +3 -0
- params_shard_13.bin +3 -0
- params_shard_130.bin +3 -0
- params_shard_131.bin +3 -0
- params_shard_132.bin +3 -0
- params_shard_133.bin +3 -0
- params_shard_134.bin +3 -0
- params_shard_135.bin +3 -0
- params_shard_136.bin +3 -0
- params_shard_137.bin +3 -0
- params_shard_138.bin +3 -0
.gitattributes
CHANGED
@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
|
|
33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
|
|
|
33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
36 |
+
tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
merges.txt
ADDED
The diff for this file is too large to render.
See raw diff
|
|
mlc-chat-config.json
ADDED
@@ -0,0 +1,85 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"version": "0.1.0",
|
3 |
+
"model_type": "qwen3",
|
4 |
+
"quantization": "q4f32_1",
|
5 |
+
"model_config": {
|
6 |
+
"hidden_act": "silu",
|
7 |
+
"hidden_size": 5120,
|
8 |
+
"intermediate_size": 17408,
|
9 |
+
"attention_bias": false,
|
10 |
+
"num_attention_heads": 40,
|
11 |
+
"num_hidden_layers": 40,
|
12 |
+
"num_key_value_heads": 8,
|
13 |
+
"rms_norm_eps": 1e-06,
|
14 |
+
"rope_theta": 1000000,
|
15 |
+
"vocab_size": 151936,
|
16 |
+
"tie_word_embeddings": false,
|
17 |
+
"context_window_size": 40960,
|
18 |
+
"prefill_chunk_size": 2048,
|
19 |
+
"tensor_parallel_shards": 1,
|
20 |
+
"head_dim": 128,
|
21 |
+
"dtype": "float32",
|
22 |
+
"max_batch_size": 128
|
23 |
+
},
|
24 |
+
"vocab_size": 151936,
|
25 |
+
"context_window_size": 40960,
|
26 |
+
"sliding_window_size": -1,
|
27 |
+
"prefill_chunk_size": 2048,
|
28 |
+
"attention_sink_size": -1,
|
29 |
+
"tensor_parallel_shards": 1,
|
30 |
+
"pipeline_parallel_stages": 1,
|
31 |
+
"temperature": 0.6,
|
32 |
+
"presence_penalty": 0.0,
|
33 |
+
"frequency_penalty": 0.0,
|
34 |
+
"repetition_penalty": 1.0,
|
35 |
+
"top_p": 0.95,
|
36 |
+
"tokenizer_files": [
|
37 |
+
"tokenizer.json",
|
38 |
+
"vocab.json",
|
39 |
+
"merges.txt",
|
40 |
+
"tokenizer_config.json"
|
41 |
+
],
|
42 |
+
"tokenizer_info": {
|
43 |
+
"token_postproc_method": "byte_level",
|
44 |
+
"prepend_space_in_encode": false,
|
45 |
+
"strip_space_in_decode": false
|
46 |
+
},
|
47 |
+
"conv_template": {
|
48 |
+
"name": "qwen2",
|
49 |
+
"system_template": "<|im_start|>system\n{system_message}<|im_end|>\n",
|
50 |
+
"system_message": "You are a helpful assistant.",
|
51 |
+
"system_prefix_token_ids": null,
|
52 |
+
"add_role_after_system_message": true,
|
53 |
+
"roles": {
|
54 |
+
"user": "<|im_start|>user",
|
55 |
+
"assistant": "<|im_start|>assistant"
|
56 |
+
},
|
57 |
+
"role_templates": {
|
58 |
+
"user": "{user_message}",
|
59 |
+
"assistant": "{assistant_message}",
|
60 |
+
"tool": "{tool_message}"
|
61 |
+
},
|
62 |
+
"messages": [],
|
63 |
+
"seps": [
|
64 |
+
"<|im_end|>\n"
|
65 |
+
],
|
66 |
+
"role_content_sep": "\n",
|
67 |
+
"role_empty_sep": "\n",
|
68 |
+
"stop_str": [
|
69 |
+
"<|endoftext|>",
|
70 |
+
"<|im_end|>"
|
71 |
+
],
|
72 |
+
"stop_token_ids": [
|
73 |
+
151643,
|
74 |
+
151645
|
75 |
+
],
|
76 |
+
"function_string": "",
|
77 |
+
"use_function_calling": false
|
78 |
+
},
|
79 |
+
"pad_token_id": 151643,
|
80 |
+
"bos_token_id": 151643,
|
81 |
+
"eos_token_id": [
|
82 |
+
151645,
|
83 |
+
151643
|
84 |
+
]
|
85 |
+
}
|
ndarray-cache-b16.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
ndarray-cache.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
params_shard_0.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:843bac9acc3333302ec1687358f5a20b2df2010f3700efc1ddc640147e2a3f54
|
3 |
+
size 388956160
|
params_shard_1.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8e57af34f8b90d3adf045a33ea70fd0b3ce504bbbad11944645d386f61d0fc68
|
3 |
+
size 48619520
|
params_shard_10.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2b97ef0a5a5a0f3d028ce4e7236d39182ba83e2ccb09a67166ba911585fa336c
|
3 |
+
size 44564480
|
params_shard_100.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:70ba25ff81add02cbe68ae702e4764f7cacda5ee373889c5b3e336913f163497
|
3 |
+
size 44564480
|
params_shard_101.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d7aad04c24ab5e675aadc24bc340c5c850a049725529ee3e7c321af2c6bd97f5
|
3 |
+
size 89128960
|
params_shard_102.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2c79509c8f84755d78855fc9c2b01972e9e44ed9f12fd28807926d62e13cea9c
|
3 |
+
size 18350080
|
params_shard_103.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:32958e437c2860f65f02052e8de60bb8966436ea7a7bd34f50855ca91e46e70d
|
3 |
+
size 31478272
|
params_shard_104.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b6d350b5cf65f0856fe78ba2e017ff9c2676ae891faa97dbec9bb26bcf9a2200
|
3 |
+
size 44564480
|
params_shard_105.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4f53ff3b6cee46e79256bbb77bea402fee928579cb3b9f5ca8b42d9569e44209
|
3 |
+
size 89128960
|
params_shard_106.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f31017de7148a3d3cc34022fc3c124908f8796b7c47301ee92e5a14d5539edc0
|
3 |
+
size 22620416
|
params_shard_107.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3dd23bb0d7bf0aff8afaf94e2bb970d3846b8b7a42c9d0ed24e154c0d1832718
|
3 |
+
size 31795456
|
params_shard_108.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:952a03f52eabace881d4aee6a93271cb9a1d6f96385286120ea794d0a997b5d0
|
3 |
+
size 44564480
|
params_shard_109.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d5caa9cfc1b96e295fb29c68227f89a248527fb698fe0c18fe7902e48ef2b80b
|
3 |
+
size 89128960
|
params_shard_11.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:963eca975e3c5ab1eaef719b6365b81d4a4aa3ecaa627818cfdc6da6cb36d0ed
|
3 |
+
size 89128960
|
params_shard_110.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4ff724e8da5839645f89cceeb1c1b89a8031f2de2e1e29d2dac331e86432b928
|
3 |
+
size 18350080
|
params_shard_111.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ca0cf836e5f9e631e890a6c3808bfbbfcafba822e6c5ee69500b0af84e558695
|
3 |
+
size 31478272
|
params_shard_112.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:70b55e43e85994df57850ab4d068127da4d35bcf7f74c22bca2063235fa72594
|
3 |
+
size 44564480
|
params_shard_113.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ed01119b0d61e39d471d58351fe59515bdd577a07f6c95f98ba8fa5d0b5da2e4
|
3 |
+
size 89128960
|
params_shard_114.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bead2def6d06f2b424e3e2962ddc5ccaf4d25931edad73fddb77ca3ce67c5bf4
|
3 |
+
size 22620416
|
params_shard_115.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:64b10a7793bfeb857df39b0aaf53ba559252408f1f1b81caa0d2c3efe063a956
|
3 |
+
size 31795456
|
params_shard_116.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:752b1d6b4a3b5eff4f332ad55d37c9b38e1c8d199850cab53b4910ea855790ae
|
3 |
+
size 89128960
|
params_shard_117.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bd50b860a1961d3fbcfeba39a8d16339537351dc63d6202339af8c332bd6aa5c
|
3 |
+
size 18350080
|
params_shard_118.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f7e90871f05415b2418b5c50f4d8f9ab1748b51a6282f5e9e06d160dc2f14f06
|
3 |
+
size 28180992
|
params_shard_119.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:96961026bf6083bcd494a5b086ddcd88730b956ad599246c4ed55d2456d96789
|
3 |
+
size 44564480
|
params_shard_12.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:786d6b6936c7c2adc56570f17f038138a772cc72f9c9edc1033bad0c881c3666
|
3 |
+
size 22620416
|
params_shard_120.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:329e2187fe4048163f42905a5ac21aeddde3855a4a6ec7d06b077d970841e78a
|
3 |
+
size 44564480
|
params_shard_121.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:537ccb4b4c075597856ba5d94f5e97ebbdbec50b8f2f84d73d2808091e448610
|
3 |
+
size 89128960
|
params_shard_122.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:973e3646fa312993ce92847173bbba4cb61895b7d84e1973714c2952ee3a487a
|
3 |
+
size 25917696
|
params_shard_123.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0afd019999e3a638c694096b43dcaf26cf599f957f4c22862913f40ad4f1f9f8
|
3 |
+
size 31795456
|
params_shard_124.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3f65f45e26e7a2af94dc2f4059f05fa13fcc36984109d81f91cff83c45b01a0d
|
3 |
+
size 44564480
|
params_shard_125.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cbc9cec0c5342b8b2bb4afac51630df1b78564564eac3ff40d68082443f102c8
|
3 |
+
size 89128960
|
params_shard_126.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9d8f51775c93a997e1beeecbb161451bad19dd84f33f49f75d99da78d9472935
|
3 |
+
size 18350080
|
params_shard_127.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:218acd3d945779823f6854f09e1b7bd636ff4b05c19ac44cb91cf747c662ffd4
|
3 |
+
size 31478272
|
params_shard_128.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0e29018b0d66629caa530234798087720f25bc1e68afd2d91c03fbf502935fba
|
3 |
+
size 44564480
|
params_shard_129.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e7e928af79cc4aa7a693e2329e8b09d167bbb44e7efa24f02a8c60d5981e0c21
|
3 |
+
size 89128960
|
params_shard_13.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:45000d14d5f10ce9bfb7f21968d9613077b3512df128ce920c059559ed46f98f
|
3 |
+
size 31795456
|
params_shard_130.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2e8dfea49fdcbf25995426f95a19d3748491f779e829f86edd363db06c480c53
|
3 |
+
size 22620416
|
params_shard_131.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0a59bb41a388ce2b7d3aa4ac178c42be80e00123be99ee54866d28e952326595
|
3 |
+
size 31795456
|
params_shard_132.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5cb1dbd0cb26b53675e77f0600acba2f2cfba2afefca9b3df5edbefceaf2a929
|
3 |
+
size 44564480
|
params_shard_133.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2fb270558a597fb4c26d8786db86c76a5591c926c43225a7f2da43aaa474a55f
|
3 |
+
size 89128960
|
params_shard_134.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2fe22bdb8cbf52d29502ee2f09411ea63b638044d2fb851496b08db34692b911
|
3 |
+
size 18350080
|
params_shard_135.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:aa2619466ef604a1ed9cd10a8da3848ceb0c0317bdc127bd5966c22dd02d6abf
|
3 |
+
size 31478272
|
params_shard_136.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2978165a9388fb98d5b1b7365ec1b6d4ae1975a1bc0ea9eeab333256bac9f011
|
3 |
+
size 44564480
|
params_shard_137.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:89ece6dcb7d501730a5c1c8f398eda4f46e8ec1db1a883724ad347191786768d
|
3 |
+
size 89128960
|
params_shard_138.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:405df3b0e5aad34ba09cc486488a3d9d88197d2298ca5cb332ffbd37f6dd9a7c
|
3 |
+
size 22620416
|