riczhou committed on
Commit
32356c5
·
verified ·
1 Parent(s): dc31d16

Upload folder using huggingface_hub

Browse files
This view is limited to 50 files because it contains too many changes.   See raw diff
.gitattributes CHANGED
@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ tokenizer.json filter=lfs diff=lfs merge=lfs -text
added_tokens.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ {
2
+ "<image_soft_token>": 262144
3
+ }
mlc-chat-config.json ADDED
@@ -0,0 +1,116 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "version": "0.1.0",
3
+ "model_type": "gemma3_text",
4
+ "quantization": "q0f16",
5
+ "model_config": {
6
+ "text_config": {
7
+ "hidden_size": 1152,
8
+ "intermediate_size": 6912,
9
+ "num_hidden_layers": 26,
10
+ "attention_bias": false,
11
+ "num_attention_heads": 4,
12
+ "num_key_value_heads": 1,
13
+ "head_dim": 256,
14
+ "rms_norm_eps": 1e-06,
15
+ "hidden_activation": "gelu_pytorch_tanh",
16
+ "position_embedding_base": 1000000,
17
+ "context_window_size": 8192,
18
+ "prefill_chunk_size": 8192,
19
+ "query_pre_attn_scalar": 256,
20
+ "sliding_window": 512,
21
+ "kwargs": {
22
+ "architectures": [
23
+ "Gemma3ForCausalLM"
24
+ ],
25
+ "attention_dropout": 0.0,
26
+ "attn_logit_softcapping": null,
27
+ "bos_token_id": 2,
28
+ "cache_implementation": "hybrid",
29
+ "eos_token_id": [
30
+ 1,
31
+ 106
32
+ ],
33
+ "final_logit_softcapping": null,
34
+ "initializer_range": 0.02,
35
+ "max_position_embeddings": 32768,
36
+ "model_type": "gemma3_text",
37
+ "pad_token_id": 0,
38
+ "rope_local_base_freq": 10000,
39
+ "rope_scaling": null,
40
+ "sliding_window_pattern": 6,
41
+ "torch_dtype": "bfloat16",
42
+ "transformers_version": "4.50.0.dev0",
43
+ "use_cache": true
44
+ }
45
+ },
46
+ "vocab_size": 262144,
47
+ "tensor_parallel_shards": 1,
48
+ "max_batch_size": 128,
49
+ "context_window_size": 8192,
50
+ "sliding_window_size": -1,
51
+ "prefill_chunk_size": 8192,
52
+ "is_text_model": true
53
+ },
54
+ "vocab_size": 262144,
55
+ "context_window_size": 8192,
56
+ "sliding_window_size": -1,
57
+ "prefill_chunk_size": 8192,
58
+ "attention_sink_size": -1,
59
+ "tensor_parallel_shards": 1,
60
+ "pipeline_parallel_stages": 1,
61
+ "temperature": 1.0,
62
+ "presence_penalty": 0.0,
63
+ "frequency_penalty": 0.0,
64
+ "repetition_penalty": 1.0,
65
+ "top_p": 0.95,
66
+ "tokenizer_files": [
67
+ "tokenizer.model",
68
+ "tokenizer.json",
69
+ "added_tokens.json",
70
+ "tokenizer_config.json"
71
+ ],
72
+ "tokenizer_info": {
73
+ "token_postproc_method": "byte_fallback",
74
+ "prepend_space_in_encode": false,
75
+ "strip_space_in_decode": false
76
+ },
77
+ "conv_template": {
78
+ "name": "gemma_instruction",
79
+ "system_template": "{system_message}",
80
+ "system_message": "",
81
+ "system_prefix_token_ids": [
82
+ 2
83
+ ],
84
+ "add_role_after_system_message": true,
85
+ "roles": {
86
+ "user": "<start_of_turn>user",
87
+ "assistant": "<start_of_turn>model"
88
+ },
89
+ "role_templates": {
90
+ "user": "{user_message}",
91
+ "assistant": "{assistant_message}",
92
+ "tool": "{tool_message}"
93
+ },
94
+ "messages": [],
95
+ "seps": [
96
+ "<end_of_turn>\n"
97
+ ],
98
+ "role_content_sep": "\n",
99
+ "role_empty_sep": "\n",
100
+ "stop_str": [
101
+ "<end_of_turn>"
102
+ ],
103
+ "stop_token_ids": [
104
+ 1,
105
+ 106
106
+ ],
107
+ "function_string": "",
108
+ "use_function_calling": false
109
+ },
110
+ "pad_token_id": 0,
111
+ "bos_token_id": 2,
112
+ "eos_token_id": [
113
+ 1,
114
+ 106
115
+ ]
116
+ }
ndarray-cache.json ADDED
The diff for this file is too large to render. See raw diff
 
params_shard_0.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4917a670473e45b676f9d6a1e2789ad4d66e4bd23bacbd5f0a10d06194995ae5
3
+ size 603979776
params_shard_1.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5907744924478281f8fd791f062d2a6acc41f6183db8c00e25047d783b4ed57c
3
+ size 31850496
params_shard_10.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8e1496898a17d146205e9a2e4858644c54079b915328471b28179b481f9f73ec
3
+ size 21833728
params_shard_11.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0d33b4c24bab565b1568888c83d3294f3c1989bb4b56d0b4cd73acc285e26623
3
+ size 31850496
params_shard_12.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1521eecca1eb8ba038ed7e447afca104146758445d765514426279840c708193
3
+ size 21833728
params_shard_13.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:94fee4e0b0f160875869fb13b5f27936dce3841d9fc3d5fc754b986b19446862
3
+ size 31850496
params_shard_14.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:30a6df5435a07d97374f6380f069ab104a225b0bcce1278d63e059e3ca4d532c
3
+ size 21833728
params_shard_15.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5276bcc26350d6546e93896671112e7657573a5b187779328f6d9c58e1afe09b
3
+ size 31850496
params_shard_16.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:58d800b892b4d547b584654747bdadf57b7168fda1d1d158e3a2d7d7c61f98b9
3
+ size 21833728
params_shard_17.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c75925f879dbcd76003bcd59d6fcdc3f7857546f09af926d24e4148ac0b65985
3
+ size 31850496
params_shard_18.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:955db852dae46a197e791dd91030931664bad9f43c6e42f9dbc6aaeba0d505f1
3
+ size 21833728
params_shard_19.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6a2e2fb8de161b52ab8cf25e624790c24e92c06dfacbabc4aa6efee07e29bd94
3
+ size 31850496
params_shard_2.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6a6e97a38806a38b60ec61ff2d02b851760240839c68af8e1141d23089ac1101
3
+ size 21836032
params_shard_20.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a58d854ec0a375e6d5f9229eebbdeb34ecc3e18dc22f770d2603df32aab828ef
3
+ size 21833728
params_shard_21.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ffe4ad86818ad6f4d8c8f4f8a566a76059d0ba55b955fc2a5af3b47cefd724e9
3
+ size 31850496
params_shard_22.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c751a09a5832e03c9b542d559c371b3479b793065ca89d5cce0f07bdbea49bb5
3
+ size 21833728
params_shard_23.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a8505b89e891f0858dfff51233190df882e381a619a935f251ebb6aa4d95b570
3
+ size 31850496
params_shard_24.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5194cd64d0e08e5fcf93d08c1d22740ae6e4505d024e664919a221a480ac5619
3
+ size 21833728
params_shard_25.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:912d4fdbcfc37ae5cb00ef5d2506074c759be1f63ad984f44a32a8172c4cc7ac
3
+ size 31850496
params_shard_26.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b8c278887b8003f22c07620f32c5b3801de66e895e7c0b819c96b812c37a854b
3
+ size 21833728
params_shard_27.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cf9eadc03277c7d849a2c904fdc85f4797446aad9aff7c0392a0d32fd24e22dd
3
+ size 31850496
params_shard_28.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0a6806fd4999d1cd16d02a1c1913d4865ae7d0a4209f6253984d71fe3ce7a36e
3
+ size 21833728
params_shard_29.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ad97b7c04257f8f161c63e37570b65c9acfbb858a5d82ca44bea39c990f444d6
3
+ size 31850496
params_shard_3.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6d6ec1d4860fbc2ff729650382caa0d2f4e45853a538541f32ccf8b889d63625
3
+ size 31850496
params_shard_30.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b3f078ac2b500a955136f04ef3a6e223a55625173168a4684216bfba2ad4a9c3
3
+ size 21833728
params_shard_31.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b010a676019a63812d40b7f70d0f663dbe546eda0536c53e043706590ab205e0
3
+ size 31850496
params_shard_32.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0a6cd2997a20781cba73738b027c4f7c000f8613f02bc90d13b9dff070a79131
3
+ size 21833728
params_shard_33.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5bdbb71700bb4c254b43fce17ea8351bf965e151d07a3c23eb6c73af02bab28b
3
+ size 31850496
params_shard_34.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a448fb405e7b47ed81e1343b7cedcc05851eec885e3c466a52b17ea6c5d218b7
3
+ size 21833728
params_shard_35.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6a9ff196369726c90f88f3e56f438af718ecc5f37889dc518e4eff4d1c0a4b8e
3
+ size 31850496
params_shard_36.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:01a29574fbb8631b87ca108073e1caf90e868101bba945fa75ffa5dd975baf64
3
+ size 21833728
params_shard_37.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:571de45f55ccfb58dc7737aba7816508666e1741bab44bd150dce21f521d13a3
3
+ size 31850496
params_shard_38.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a478e7f64f4db442e4295eee13ba428802249e3c0f1eb4b4fa371752ad4676e0
3
+ size 21833728
params_shard_39.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cfde9f9c332d9368c3ec685f3460f5bbdea8b01f3f34440f9937e51be4d69516
3
+ size 31850496
params_shard_4.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:db4c6e9e12f0487c7bfc12c8bb4e37b8cd5a665a0d2b3845c967763b0b7190b7
3
+ size 21833728
params_shard_40.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f113fe349bb6b38102033e8bf21d8a6dc3d80a8ca1247820d294f59c2d175bb1
3
+ size 21833728
params_shard_41.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:16433310070ee5ee752f1882ee7b0615ca01172d7f73fb1d72ab0c862678f7b0
3
+ size 31850496
params_shard_42.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ace9ba966d93738d04d997342697d46ffd592f695e1fe1a8b731ca2b01a24baa
3
+ size 21833728
params_shard_43.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:29ada429e15074ce946bf4c7f957299fab609b7cc3fa70358169d84f22adc912
3
+ size 31850496
params_shard_44.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a9133a1980e72278e10eb5766870d41217096ae10d23a7316885ef70fd568ef3
3
+ size 21833728
params_shard_45.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0bbf52ea507228d1e4f5808a62a03b0fd0cd118af11084019d599c5d1d59a5cf
3
+ size 31850496
params_shard_46.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8a51b4ae96a97e9975553f625a716a6eb134c179a9b4a64e92d388da0b99937a
3
+ size 21833728
params_shard_47.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fcfb4b1221faf67668dae1f7242af76422e5206b3274a25178147f027fe9f280
3
+ size 31850496
params_shard_48.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d8cfe2fc5558bfd0b1ba8d9fb683ed28cf75a9a95f6f38761b2961c5f7d0a416
3
+ size 21833728
params_shard_49.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1bf29028380a6a1d2cd0306a9cbec04b2472742d191fc5d5371802bba7541e14
3
+ size 31850496
params_shard_5.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4549bf7a87a6c8ec601ef051ee92d283588db7c53b2e74052f0a69645d30d573
3
+ size 31850496