Upload folder using huggingface_hub
Browse files
This view is limited to 50 files because it contains too many changes.
See raw diff
- .gitattributes +1 -0
- added_tokens.json +3 -0
- mlc-chat-config.json +99 -0
- ndarray-cache-b16.json +0 -0
- ndarray-cache.json +0 -0
- params_shard_0.bin +3 -0
- params_shard_1.bin +3 -0
- params_shard_10.bin +3 -0
- params_shard_100.bin +3 -0
- params_shard_101.bin +3 -0
- params_shard_102.bin +3 -0
- params_shard_103.bin +3 -0
- params_shard_104.bin +3 -0
- params_shard_105.bin +3 -0
- params_shard_106.bin +3 -0
- params_shard_107.bin +3 -0
- params_shard_108.bin +3 -0
- params_shard_109.bin +3 -0
- params_shard_11.bin +3 -0
- params_shard_110.bin +3 -0
- params_shard_111.bin +3 -0
- params_shard_112.bin +3 -0
- params_shard_113.bin +3 -0
- params_shard_114.bin +3 -0
- params_shard_115.bin +3 -0
- params_shard_116.bin +3 -0
- params_shard_117.bin +3 -0
- params_shard_118.bin +3 -0
- params_shard_119.bin +3 -0
- params_shard_12.bin +3 -0
- params_shard_120.bin +3 -0
- params_shard_121.bin +3 -0
- params_shard_122.bin +3 -0
- params_shard_123.bin +3 -0
- params_shard_124.bin +3 -0
- params_shard_125.bin +3 -0
- params_shard_126.bin +3 -0
- params_shard_127.bin +3 -0
- params_shard_128.bin +3 -0
- params_shard_129.bin +3 -0
- params_shard_13.bin +3 -0
- params_shard_130.bin +3 -0
- params_shard_131.bin +3 -0
- params_shard_132.bin +3 -0
- params_shard_133.bin +3 -0
- params_shard_134.bin +3 -0
- params_shard_135.bin +3 -0
- params_shard_136.bin +3 -0
- params_shard_137.bin +3 -0
- params_shard_138.bin +3 -0
.gitattributes
CHANGED
@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
|
|
33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
|
|
|
33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
36 |
+
tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
added_tokens.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"<image_soft_token>": 262144
|
3 |
+
}
|
mlc-chat-config.json
ADDED
@@ -0,0 +1,99 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"version": "0.1.0",
|
3 |
+
"model_type": "gemma3",
|
4 |
+
"quantization": "q4f32_1",
|
5 |
+
"model_config": {
|
6 |
+
"text_config": {
|
7 |
+
"hidden_size": 5376,
|
8 |
+
"intermediate_size": 21504,
|
9 |
+
"num_hidden_layers": 62,
|
10 |
+
"attention_bias": false,
|
11 |
+
"num_attention_heads": 32,
|
12 |
+
"num_key_value_heads": 16,
|
13 |
+
"head_dim": 128,
|
14 |
+
"rms_norm_eps": 1e-06,
|
15 |
+
"hidden_activation": "gelu_pytorch_tanh",
|
16 |
+
"position_embedding_base": 10000,
|
17 |
+
"context_window_size": 8192,
|
18 |
+
"prefill_chunk_size": 8192,
|
19 |
+
"query_pre_attn_scalar": 168,
|
20 |
+
"sliding_window": 1024,
|
21 |
+
"kwargs": {
|
22 |
+
"model_type": "gemma3_text",
|
23 |
+
"rope_scaling": {
|
24 |
+
"factor": 8.0,
|
25 |
+
"rope_type": "linear"
|
26 |
+
}
|
27 |
+
}
|
28 |
+
},
|
29 |
+
"vocab_size": 262208,
|
30 |
+
"tensor_parallel_shards": 1,
|
31 |
+
"max_batch_size": 128,
|
32 |
+
"context_window_size": 8192,
|
33 |
+
"sliding_window_size": -1,
|
34 |
+
"prefill_chunk_size": 8192,
|
35 |
+
"is_text_model": false
|
36 |
+
},
|
37 |
+
"vocab_size": 262208,
|
38 |
+
"context_window_size": 8192,
|
39 |
+
"sliding_window_size": -1,
|
40 |
+
"prefill_chunk_size": 8192,
|
41 |
+
"attention_sink_size": -1,
|
42 |
+
"tensor_parallel_shards": 1,
|
43 |
+
"pipeline_parallel_stages": 1,
|
44 |
+
"temperature": 1.0,
|
45 |
+
"presence_penalty": 0.0,
|
46 |
+
"frequency_penalty": 0.0,
|
47 |
+
"repetition_penalty": 1.0,
|
48 |
+
"top_p": 0.95,
|
49 |
+
"tokenizer_files": [
|
50 |
+
"tokenizer.model",
|
51 |
+
"tokenizer.json",
|
52 |
+
"added_tokens.json",
|
53 |
+
"tokenizer_config.json"
|
54 |
+
],
|
55 |
+
"tokenizer_info": {
|
56 |
+
"token_postproc_method": "byte_fallback",
|
57 |
+
"prepend_space_in_encode": false,
|
58 |
+
"strip_space_in_decode": false
|
59 |
+
},
|
60 |
+
"conv_template": {
|
61 |
+
"name": "gemma_instruction",
|
62 |
+
"system_template": "{system_message}",
|
63 |
+
"system_message": "",
|
64 |
+
"system_prefix_token_ids": [
|
65 |
+
2
|
66 |
+
],
|
67 |
+
"add_role_after_system_message": true,
|
68 |
+
"roles": {
|
69 |
+
"user": "<start_of_turn>user",
|
70 |
+
"assistant": "<start_of_turn>model"
|
71 |
+
},
|
72 |
+
"role_templates": {
|
73 |
+
"user": "{user_message}",
|
74 |
+
"assistant": "{assistant_message}",
|
75 |
+
"tool": "{tool_message}"
|
76 |
+
},
|
77 |
+
"messages": [],
|
78 |
+
"seps": [
|
79 |
+
"<end_of_turn>\n"
|
80 |
+
],
|
81 |
+
"role_content_sep": "\n",
|
82 |
+
"role_empty_sep": "\n",
|
83 |
+
"stop_str": [
|
84 |
+
"<end_of_turn>"
|
85 |
+
],
|
86 |
+
"stop_token_ids": [
|
87 |
+
1,
|
88 |
+
107
|
89 |
+
],
|
90 |
+
"function_string": "",
|
91 |
+
"use_function_calling": false
|
92 |
+
},
|
93 |
+
"pad_token_id": 0,
|
94 |
+
"bos_token_id": 2,
|
95 |
+
"eos_token_id": [
|
96 |
+
1,
|
97 |
+
106
|
98 |
+
]
|
99 |
+
}
|
ndarray-cache-b16.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
ndarray-cache.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
params_shard_0.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1baee0573ad861622f16f1511a3a832f64b6f06daaa8606205bb0ac4f31104dc
|
3 |
+
size 704815104
|
params_shard_1.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:18123265c4e613e721f7ec214ddd128fd6524cf0f2ee2ea033a8c0d58a442720
|
3 |
+
size 88101888
|
params_shard_10.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:07aa81b35a08a718d168572569c9bd22fe1fae6d9f2361b70ae2923bf1ac811a
|
3 |
+
size 115605504
|
params_shard_100.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:80159080c38a19638afa76f6b8c469cac396b997ebcf7aeaf4781ed02d54cb08
|
3 |
+
size 115605504
|
params_shard_101.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9ef5c44a6579ccbdb031137e0cea20c3a8e484121f1ade811e05ba41b5242411
|
3 |
+
size 33030400
|
params_shard_102.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1b8a2c953472c4e90727aa119cb1815762e844b3effeb19544242d1e782b1b1b
|
3 |
+
size 30966016
|
params_shard_103.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6ba2dbe0d12ae36e61d68617944af05bf50dc8bc93c84e5d579fbd83e23d941e
|
3 |
+
size 57802752
|
params_shard_104.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3c998073dcd66392c67f09478b30b94ac8cad2bce39926551b94f5dd3ff8721
|
3 |
+
size 57802752
|
params_shard_105.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3fa666a379ab045f0bed61627d71e735d784aff708c6e6e8b9e8f6b36de5e3c1
|
3 |
+
size 115605504
|
params_shard_106.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b80ed171521576fc9460d02d2a2b4b37832cc3da741737851d617a9c86c2278c
|
3 |
+
size 20697600
|
params_shard_107.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:03f1575ee9f8321862c336c95c328a95831069351f254df0aebdd33024c7fee3
|
3 |
+
size 33062912
|
params_shard_108.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:82c553b62d7316f2d93ea22a964fc32a03fa77872d28868b0c60f49879a3248a
|
3 |
+
size 57802752
|
params_shard_109.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e59eb9b85f29d64f89dec4ee989e86b3b272590a630d62b1ba63add5fbe6f62f
|
3 |
+
size 115605504
|
params_shard_11.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a294cde95565dfa2dea489b23e98d99a23eab245a92b404444ef34d2b1a4e236
|
3 |
+
size 33083904
|
params_shard_110.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b3a013f12af746751ddcf4f0eac318e7c5b0e82823444cd7bfc1041e6e5ad18f
|
3 |
+
size 25815552
|
params_shard_111.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:60159195f1d4b07202feeaf5c5fa0eb0a0c825f23d409aebf0d2a5efe9b984b6
|
3 |
+
size 33062912
|
params_shard_112.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:557f0d3a9aff8e23d1882d09ef923c2e13cae3cc4704ceb001b848597427aac1
|
3 |
+
size 57802752
|
params_shard_113.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:69e5c87abe3c4a1315b3a02e10c8ff35965849ee4914129732803b4622cf550f
|
3 |
+
size 115605504
|
params_shard_114.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0ad5ff8dd37b8ac56fb92392543bdf251890eb030b7af7b66faca227238ad4ed
|
3 |
+
size 25815552
|
params_shard_115.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0118dda7b2d878baf28cc9753e307d128008b3e6470e32e9cfebb4b9f90ec38b
|
3 |
+
size 33062912
|
params_shard_116.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:92d5f4ad687eb70910dc5aea94faada78aed95b4bfc3ba53c137320b030b6dbb
|
3 |
+
size 57802752
|
params_shard_117.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6a479708896efaf846a23ad555948bd3d7e76c4862b60d121bac748d35af038e
|
3 |
+
size 115605504
|
params_shard_118.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0df56a225e14f8a7822cb1f098bf69ae202b1a80e34dd2c3222c501b227b7a1d
|
3 |
+
size 25815552
|
params_shard_119.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4f975d84328ec8d80254929214f9896a26e842ce8d3f349d0cbf99f8d6e78541
|
3 |
+
size 33062912
|
params_shard_12.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ceb166b0da490ce1327906f399c888c26c8076b540c29114c07d4487a8cbc85d
|
3 |
+
size 33062912
|
params_shard_120.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f944874a3dd69a325b278516b1b991b2fb811fd800fa5352ae0ce55b975344da
|
3 |
+
size 57802752
|
params_shard_121.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e7cda5094f639263a1da3fd0d0755fb34a55d5daa442788cd9bd61f793d166bd
|
3 |
+
size 115605504
|
params_shard_122.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:818fadd17d2fe78af437a68409b708b13bf7f55fae5defd1068aaef747da8ecf
|
3 |
+
size 25815552
|
params_shard_123.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:45c2bc896da95a3c6c7546b1f21863eb3bbbddbc37fd66a893b5508ea1fc6dd8
|
3 |
+
size 33062912
|
params_shard_124.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e5af118e1a04963a250e86fea3627cde1a5dafaa604d2afe9248705f33e95684
|
3 |
+
size 115605504
|
params_shard_125.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:497abcd66b4c944f423e97b2585c3d3164fede0ebfa5bc9cc8099a28f0c3cafb
|
3 |
+
size 33030400
|
params_shard_126.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f6dcc796a2579711e842b37455ef734865a5d253f75bc8fd98d837c3c87351db
|
3 |
+
size 30966016
|
params_shard_127.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4334c87023707a2f347e7cf80bdd3e761978499cc28d702a7438a3af14868b2a
|
3 |
+
size 57802752
|
params_shard_128.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0322b960d91d180bc80513d09333523f84f8b5157e22a1e5a9c73b663b9534c0
|
3 |
+
size 57802752
|
params_shard_129.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5cf279529f1d67aa92e372f0403cb3749cb64de7d7ef73b407c117496228ffcb
|
3 |
+
size 115605504
|
params_shard_13.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0ab8ae6bc37498f335384a0334bf49609862103320e5dd49e9377dc938c8cc28
|
3 |
+
size 57802752
|
params_shard_130.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:babeb91bf2ccc7e115146f247281f874fe5c51b5f7fe9a09d75847c1c8c45412
|
3 |
+
size 20697600
|
params_shard_131.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b842ee4cea5fcf2b58d727000c12e5b5c7160fbba73d4a5881ec1405f65a1df8
|
3 |
+
size 33062912
|
params_shard_132.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5025117a53891b2dcef690b80c85f97c9c71f3dc6a8ca288e87d9d8d3e7657b8
|
3 |
+
size 57802752
|
params_shard_133.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a4addceed45b76a3d6be88935aa735cb179b05bd1f99acd6abed6011f416eecd
|
3 |
+
size 115605504
|
params_shard_134.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:67f7e80632f97ad985fdc21205ac4bf8a32dc7e85eb5002597a2fdce037fc86c
|
3 |
+
size 25815552
|
params_shard_135.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:dd3e34b863fe1bbfbe1f47ff384141be19662c942472bb2fd735a8498dfa0130
|
3 |
+
size 33062912
|
params_shard_136.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b54f7c762e682913a848d43fce5d5982fa51676882dc4b7a4082b1146dbb9a0b
|
3 |
+
size 57802752
|
params_shard_137.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:62ee81ebb1851e39976174c87d26cfb08252f4e0a82b40bc507a1936af072b60
|
3 |
+
size 115605504
|
params_shard_138.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:65cf66a36375c1c9ba281c7ea771bc2547a155086b004badea118933744d83c9
|
3 |
+
size 25815552
|