Upload folder using huggingface_hub
Browse files
This view is limited to 50 files because it contains too many changes.
See raw diff
- .gitattributes +1 -0
- merges.txt +0 -0
- mlc-chat-config.json +85 -0
- ndarray-cache.json +0 -0
- params_shard_0.bin +3 -0
- params_shard_1.bin +3 -0
- params_shard_10.bin +3 -0
- params_shard_11.bin +3 -0
- params_shard_12.bin +3 -0
- params_shard_13.bin +3 -0
- params_shard_14.bin +3 -0
- params_shard_15.bin +3 -0
- params_shard_16.bin +3 -0
- params_shard_17.bin +3 -0
- params_shard_18.bin +3 -0
- params_shard_19.bin +3 -0
- params_shard_2.bin +3 -0
- params_shard_20.bin +3 -0
- params_shard_21.bin +3 -0
- params_shard_22.bin +3 -0
- params_shard_23.bin +3 -0
- params_shard_24.bin +3 -0
- params_shard_25.bin +3 -0
- params_shard_26.bin +3 -0
- params_shard_27.bin +3 -0
- params_shard_28.bin +3 -0
- params_shard_29.bin +3 -0
- params_shard_3.bin +3 -0
- params_shard_30.bin +3 -0
- params_shard_31.bin +3 -0
- params_shard_32.bin +3 -0
- params_shard_33.bin +3 -0
- params_shard_34.bin +3 -0
- params_shard_35.bin +3 -0
- params_shard_36.bin +3 -0
- params_shard_37.bin +3 -0
- params_shard_38.bin +3 -0
- params_shard_39.bin +3 -0
- params_shard_4.bin +3 -0
- params_shard_40.bin +3 -0
- params_shard_41.bin +3 -0
- params_shard_42.bin +3 -0
- params_shard_43.bin +3 -0
- params_shard_44.bin +3 -0
- params_shard_45.bin +3 -0
- params_shard_46.bin +3 -0
- params_shard_47.bin +3 -0
- params_shard_48.bin +3 -0
- params_shard_49.bin +3 -0
- params_shard_5.bin +3 -0
.gitattributes
CHANGED
@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
|
|
33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
|
|
|
33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
36 |
+
tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
merges.txt
ADDED
The diff for this file is too large to render.
See raw diff
|
|
mlc-chat-config.json
ADDED
@@ -0,0 +1,85 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"version": "0.1.0",
|
3 |
+
"model_type": "qwen3",
|
4 |
+
"quantization": "q4f16_0",
|
5 |
+
"model_config": {
|
6 |
+
"hidden_act": "silu",
|
7 |
+
"hidden_size": 2560,
|
8 |
+
"intermediate_size": 9728,
|
9 |
+
"attention_bias": false,
|
10 |
+
"num_attention_heads": 32,
|
11 |
+
"num_hidden_layers": 36,
|
12 |
+
"num_key_value_heads": 8,
|
13 |
+
"rms_norm_eps": 1e-06,
|
14 |
+
"rope_theta": 1000000,
|
15 |
+
"vocab_size": 151936,
|
16 |
+
"tie_word_embeddings": true,
|
17 |
+
"context_window_size": 40960,
|
18 |
+
"prefill_chunk_size": 2048,
|
19 |
+
"tensor_parallel_shards": 1,
|
20 |
+
"head_dim": 128,
|
21 |
+
"dtype": "float32",
|
22 |
+
"max_batch_size": 128
|
23 |
+
},
|
24 |
+
"vocab_size": 151936,
|
25 |
+
"context_window_size": 40960,
|
26 |
+
"sliding_window_size": -1,
|
27 |
+
"prefill_chunk_size": 2048,
|
28 |
+
"attention_sink_size": -1,
|
29 |
+
"tensor_parallel_shards": 1,
|
30 |
+
"pipeline_parallel_stages": 1,
|
31 |
+
"temperature": 0.6,
|
32 |
+
"presence_penalty": 0.0,
|
33 |
+
"frequency_penalty": 0.0,
|
34 |
+
"repetition_penalty": 1.0,
|
35 |
+
"top_p": 0.95,
|
36 |
+
"tokenizer_files": [
|
37 |
+
"tokenizer.json",
|
38 |
+
"vocab.json",
|
39 |
+
"merges.txt",
|
40 |
+
"tokenizer_config.json"
|
41 |
+
],
|
42 |
+
"tokenizer_info": {
|
43 |
+
"token_postproc_method": "byte_level",
|
44 |
+
"prepend_space_in_encode": false,
|
45 |
+
"strip_space_in_decode": false
|
46 |
+
},
|
47 |
+
"conv_template": {
|
48 |
+
"name": "qwen2",
|
49 |
+
"system_template": "<|im_start|>system\n{system_message}<|im_end|>\n",
|
50 |
+
"system_message": "You are a helpful assistant.",
|
51 |
+
"system_prefix_token_ids": null,
|
52 |
+
"add_role_after_system_message": true,
|
53 |
+
"roles": {
|
54 |
+
"user": "<|im_start|>user",
|
55 |
+
"assistant": "<|im_start|>assistant"
|
56 |
+
},
|
57 |
+
"role_templates": {
|
58 |
+
"user": "{user_message}",
|
59 |
+
"assistant": "{assistant_message}",
|
60 |
+
"tool": "{tool_message}"
|
61 |
+
},
|
62 |
+
"messages": [],
|
63 |
+
"seps": [
|
64 |
+
"<|im_end|>\n"
|
65 |
+
],
|
66 |
+
"role_content_sep": "\n",
|
67 |
+
"role_empty_sep": "\n",
|
68 |
+
"stop_str": [
|
69 |
+
"<|endoftext|>",
|
70 |
+
"<|im_end|>"
|
71 |
+
],
|
72 |
+
"stop_token_ids": [
|
73 |
+
151643,
|
74 |
+
151645
|
75 |
+
],
|
76 |
+
"function_string": "",
|
77 |
+
"use_function_calling": false
|
78 |
+
},
|
79 |
+
"pad_token_id": 151643,
|
80 |
+
"bos_token_id": 151643,
|
81 |
+
"eos_token_id": [
|
82 |
+
151645,
|
83 |
+
151643
|
84 |
+
]
|
85 |
+
}
|
ndarray-cache.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
params_shard_0.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:961be4c2aa04bdbe0d7e75ac393765a6c5fa81369c6c0b7c270ee439dafce206
|
3 |
+
size 194478080
|
params_shard_1.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:687cd132c9045469b3936a40c458ab1db313d89298d533030091677a81eb9501
|
3 |
+
size 24314880
|
params_shard_10.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a4e261a802228310d2af46ff193aaf0faed4434388901f8df07c13e0c83d76f7
|
3 |
+
size 24903680
|
params_shard_11.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7940d58a99fadd862cbffed3db9aad5b0863a3fac7df3a696df487f82c92b7ff
|
3 |
+
size 31877632
|
params_shard_12.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1a14e4147db5d6ddbd708f05fb6058690d219c18d6f57e6e531f91229d3d7321
|
3 |
+
size 24903680
|
params_shard_13.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c4427dfb98663a91ce89bb53d235e64c8141936016466ecfe1d2ebfb2add6255
|
3 |
+
size 31877632
|
params_shard_14.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d1f9ef46e8948eb7e5774e6967e999ce25ddd17499f6bb82e7d332ee5cc51cfc
|
3 |
+
size 24903680
|
params_shard_15.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:74cd2d450183ccc4c8ee2f682c2a6cd5d346da3ecf186ba0724adfb1237ab38b
|
3 |
+
size 24903680
|
params_shard_16.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fd5abb04284936e53bfbf33f5d99dcc5c86dfb0a8e3d714f202c22625d930ce5
|
3 |
+
size 31872512
|
params_shard_17.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:adb5dbd39dc43815c0087871e514510394bacaf581fdaf4d968b8643e0e72af2
|
3 |
+
size 24903680
|
params_shard_18.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:41beb584ff34309518988349b3ad24a2714bf20756ae0f42e016c970ba6b88e6
|
3 |
+
size 31872512
|
params_shard_19.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:613a37d309a6cd284e30b974d50fc320d3ddeb5b555289574686078966d87b67
|
3 |
+
size 24903680
|
params_shard_2.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:194c34bcca50f869b8939153bf7d4e027bcff741334ddc3185262aae58a560db
|
3 |
+
size 24903680
|
params_shard_20.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:642da43f9f2bece90f8912aa79ae66bb137c6cd279a709dc5b3b332354732026
|
3 |
+
size 31877632
|
params_shard_21.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9fd2c2ce91c14d28379cbee3d5f4353096ea9366557cbb97a21e7dea7d482bfe
|
3 |
+
size 24903680
|
params_shard_22.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:717947765471fd78fbcc6dcb657c8da50fcdce20492cea847437cd210d289b6a
|
3 |
+
size 31877632
|
params_shard_23.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2fda7bb84ed0c00a507e5bb59afe79998485f2efa83a5d60f29b35f508de2405
|
3 |
+
size 24903680
|
params_shard_24.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c92925b9d1154730e82738569dd1022c658a8267c353cb305a6912adfc1f885c
|
3 |
+
size 31877632
|
params_shard_25.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c8be2812717e752a50a14fc26c5d4ab0b925371c16ae74f5119c8a4b3fbe8cb5
|
3 |
+
size 24903680
|
params_shard_26.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ea297d5255aec243430de6190f2a0de6cb993ed7e272ba3d988ebfcfb40ba49a
|
3 |
+
size 31877632
|
params_shard_27.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:99e23a5564168ca6fd4f1ccbca7000df9d07f3bed81ee512b5d3bef4ffe46b5c
|
3 |
+
size 24903680
|
params_shard_28.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b3603909089ac65cae7118508d66c558000fbe3948a8ceb3a40112ef04de230a
|
3 |
+
size 31877632
|
params_shard_29.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:efccc8176b556e299624306d87fe0ae70cbb588379d7df7b9fba6724cd4fec41
|
3 |
+
size 24903680
|
params_shard_3.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d2e3e61ec6412bf5da3ad98a3538dc2db89adccfc313e0b86880d41ef47e8fdf
|
3 |
+
size 31877632
|
params_shard_30.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c228fe35aa1e91138eea239fe1b7dc4e37c9245de082c7269c6aef90b37b6d18
|
3 |
+
size 31877632
|
params_shard_31.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6c18d3b1a983a9c64757be9dc6a0fa8cb40632e677a33b990aa362f25422832f
|
3 |
+
size 24903680
|
params_shard_32.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4e581671852ee376a1c4aaa33b42bfd1a9cb2a24aac82ec71b1bc7ebd9668d8a
|
3 |
+
size 31877632
|
params_shard_33.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fcc476c5f9230c5b22dbef48ca03d7b3b2c60c7a1b27e4ea8bd3e53ffbebe55a
|
3 |
+
size 31887872
|
params_shard_34.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1255f5f04169031f925dc91dee90e305e964a61e40ba35eefcd7004bcb59cc98
|
3 |
+
size 24903680
|
params_shard_35.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2f969088ba8a71d89a6fe2cac059343de0e33a3f4d360a630803b3b2fb9db7bd
|
3 |
+
size 31877632
|
params_shard_36.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ee8c5c02b6057f004b61d46a8b29a797fdc1c88d5ba6d1a63076ecfa62ef04e9
|
3 |
+
size 24903680
|
params_shard_37.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f34f79a2606edce3916d7be0584b48af4b8606250d239fed2726d2a26ab1952c
|
3 |
+
size 31877632
|
params_shard_38.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:12c9b198bd8f4ba08b52d0f1e9134c7576d6a17d5c9fe669f1b2872a54127ae9
|
3 |
+
size 24903680
|
params_shard_39.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:86825ace7d47c3de4bd0004040f97f99e16c997d9e49f7d8f92502efecaf9864
|
3 |
+
size 31877632
|
params_shard_4.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7d57412abead5c557b7300c26ba2ae4b946ac9e8a7739b320d06acd459897f62
|
3 |
+
size 24903680
|
params_shard_40.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:dd9b70b9477fbd435b6b1759ff179fb024cd4ccc0b68fbf87bd734da9a5bd020
|
3 |
+
size 24903680
|
params_shard_41.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:81643615e63c25cd27e389ff9a819c8f295e6a012b37196b95d408157cd97d33
|
3 |
+
size 31877632
|
params_shard_42.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:79c63300829bb82b12e9bd876d89aec169b2bdeb82256d1013da30fb489e8540
|
3 |
+
size 24903680
|
params_shard_43.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:54f5e245aa1053e6967a0df7f87d4d8157016052935c2af59730a1eef265949f
|
3 |
+
size 31877632
|
params_shard_44.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9dac0d37b55a22c9a53cd065e59b09623bad09a3550d812baebe545562f9a858
|
3 |
+
size 24903680
|
params_shard_45.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:64966462e6b9a78b6ed065749f45b7c2b07f737a8722c40a866a4583d1f4d37e
|
3 |
+
size 31877632
|
params_shard_46.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:adf04abc6f78b3a3c15fa6ee6db535495d2858c20c94f28b3ffc11f60d489711
|
3 |
+
size 24903680
|
params_shard_47.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9d56bfc80cfe23547bd56b22f419cc57aeab3b96590681b060874b883e95a355
|
3 |
+
size 31877632
|
params_shard_48.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:83fc0dc44e1764d2610f47a6fad1b2c1d35e01c2403a60df04891ef976f9cd08
|
3 |
+
size 24903680
|
params_shard_49.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cda0ff337cbea1ad693b9d532782bda9254c9f44282e94215172ef562fd89b66
|
3 |
+
size 31877632
|
params_shard_5.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c76890c56e213ada6b77a3f7940b55c7d488d6084b934452423db31ed7c053ef
|
3 |
+
size 31877632
|