Initial commit
Browse files
This view is limited to 50 files because it contains too many changes.
See raw diff
- logs.txt +0 -0
- merges.txt +0 -0
- mlc-chat-config.json +72 -0
- ndarray-cache-b16.json +0 -0
- ndarray-cache.json +0 -0
- params_shard_0.bin +3 -0
- params_shard_1.bin +3 -0
- params_shard_10.bin +3 -0
- params_shard_11.bin +3 -0
- params_shard_12.bin +3 -0
- params_shard_13.bin +3 -0
- params_shard_14.bin +3 -0
- params_shard_15.bin +3 -0
- params_shard_16.bin +3 -0
- params_shard_17.bin +3 -0
- params_shard_18.bin +3 -0
- params_shard_19.bin +3 -0
- params_shard_2.bin +3 -0
- params_shard_20.bin +3 -0
- params_shard_21.bin +3 -0
- params_shard_22.bin +3 -0
- params_shard_23.bin +3 -0
- params_shard_24.bin +3 -0
- params_shard_25.bin +3 -0
- params_shard_26.bin +3 -0
- params_shard_27.bin +3 -0
- params_shard_28.bin +3 -0
- params_shard_29.bin +3 -0
- params_shard_3.bin +3 -0
- params_shard_30.bin +3 -0
- params_shard_31.bin +3 -0
- params_shard_32.bin +3 -0
- params_shard_33.bin +3 -0
- params_shard_34.bin +3 -0
- params_shard_35.bin +3 -0
- params_shard_36.bin +3 -0
- params_shard_37.bin +3 -0
- params_shard_38.bin +3 -0
- params_shard_39.bin +3 -0
- params_shard_4.bin +3 -0
- params_shard_40.bin +3 -0
- params_shard_41.bin +3 -0
- params_shard_42.bin +3 -0
- params_shard_43.bin +3 -0
- params_shard_44.bin +3 -0
- params_shard_45.bin +3 -0
- params_shard_46.bin +3 -0
- params_shard_47.bin +3 -0
- params_shard_48.bin +3 -0
- params_shard_49.bin +3 -0
logs.txt
ADDED
The diff for this file is too large to render.
See raw diff
|
|
merges.txt
ADDED
The diff for this file is too large to render.
See raw diff
|
|
mlc-chat-config.json
ADDED
@@ -0,0 +1,72 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"model_type": "qwen2",
|
3 |
+
"quantization": "q4f32_1",
|
4 |
+
"model_config": {
|
5 |
+
"hidden_act": "silu",
|
6 |
+
"hidden_size": 2560,
|
7 |
+
"intermediate_size": 6912,
|
8 |
+
"num_attention_heads": 20,
|
9 |
+
"num_hidden_layers": 40,
|
10 |
+
"num_key_value_heads": 20,
|
11 |
+
"rms_norm_eps": 1e-06,
|
12 |
+
"rope_theta": 5000000.0,
|
13 |
+
"vocab_size": 151936,
|
14 |
+
"context_window_size": 32768,
|
15 |
+
"prefill_chunk_size": 32768,
|
16 |
+
"tensor_parallel_shards": 1,
|
17 |
+
"dtype": "float32"
|
18 |
+
},
|
19 |
+
"vocab_size": 151936,
|
20 |
+
"context_window_size": 32768,
|
21 |
+
"sliding_window_size": -1,
|
22 |
+
"prefill_chunk_size": 32768,
|
23 |
+
"attention_sink_size": -1,
|
24 |
+
"tensor_parallel_shards": 1,
|
25 |
+
"mean_gen_len": 128,
|
26 |
+
"max_gen_len": 512,
|
27 |
+
"shift_fill_factor": 0.3,
|
28 |
+
"temperature": 0.7,
|
29 |
+
"presence_penalty": 0.0,
|
30 |
+
"frequency_penalty": 0.0,
|
31 |
+
"repetition_penalty": 1.0,
|
32 |
+
"top_p": 0.95,
|
33 |
+
"conv_template": {
|
34 |
+
"name": "chatml",
|
35 |
+
"system_template": "<|im_start|>{system_message}<|im_end|> ",
|
36 |
+
"system_message": "system A conversation between a user and an LLM-based AI assistant. The assistant gives helpful and honest answers.",
|
37 |
+
"roles": {
|
38 |
+
"user": "<|im_start|>user",
|
39 |
+
"assistant": "<|im_start|>assistant",
|
40 |
+
"tool": "<|im_start|>user"
|
41 |
+
},
|
42 |
+
"role_templates": {
|
43 |
+
"user": "{user_message}",
|
44 |
+
"assistant": "{assistant_message}",
|
45 |
+
"tool": "{tool_message}"
|
46 |
+
},
|
47 |
+
"messages": [],
|
48 |
+
"seps": [
|
49 |
+
"<|im_end|>\n"
|
50 |
+
],
|
51 |
+
"role_content_sep": "\n",
|
52 |
+
"role_empty_sep": "\n",
|
53 |
+
"stop_str": [
|
54 |
+
"<|im_end|>"
|
55 |
+
],
|
56 |
+
"stop_token_ids": [
|
57 |
+
2
|
58 |
+
],
|
59 |
+
"function_string": "",
|
60 |
+
"use_function_calling": false
|
61 |
+
},
|
62 |
+
"pad_token_id": 0,
|
63 |
+
"bos_token_id": 151643,
|
64 |
+
"eos_token_id": 151643,
|
65 |
+
"tokenizer_files": [
|
66 |
+
"tokenizer.json",
|
67 |
+
"vocab.json",
|
68 |
+
"merges.txt",
|
69 |
+
"tokenizer_config.json"
|
70 |
+
],
|
71 |
+
"version": "0.1.0"
|
72 |
+
}
|
ndarray-cache-b16.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
ndarray-cache.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
params_shard_0.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b5054f71204822249b00bd4795141b482d480235f164b027cf4e6464cff03826
|
3 |
+
size 194478080
|
params_shard_1.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:07df9d18b57eae80485e4f71a90d74cf8bf9000beb738269c2ad4a9268504905
|
3 |
+
size 17694720
|
params_shard_10.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c2a2ee5cd9a54e57ab35136daf16d2bc837b262dde127881e0226033fb388374
|
3 |
+
size 17694720
|
params_shard_11.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:04735cfa263192b6276572d5928ceb7d3d11e026c06c1cb532768e63030415db
|
3 |
+
size 25956352
|
params_shard_12.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:55c703a4a4040052ac32c3ca2903c5aabb38d7670b76072c910cffc07d88fab6
|
3 |
+
size 17694720
|
params_shard_13.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c852a5d75f0e59068a3b584b8b23a089ed84e86e33b38fe4e1aac8ea9513822a
|
3 |
+
size 25956352
|
params_shard_14.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6d1aece6821182ac7ed12b0c13f148c692ed112458ad7377e0d87ce09c1981ca
|
3 |
+
size 17694720
|
params_shard_15.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d5faea17dc7d024fd3a14f51e1acc33cea745f5e2655b3172f5eb955796dedea
|
3 |
+
size 25956352
|
params_shard_16.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:caa588f102f838b43f41532a5ca22b9eab53f47a17be4c299751d81bf07c597f
|
3 |
+
size 17694720
|
params_shard_17.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:07588d624e6217e1f5e893bcf7a8cb30ae59f0f5fe22a0e8f3367cea833dfbe6
|
3 |
+
size 25956352
|
params_shard_18.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8ecf59390be03d3fc9bd7b7685b01286cf55d25106f211a62019f8d55a688aca
|
3 |
+
size 17694720
|
params_shard_19.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5acccb61da93b09ddf383eceedade2c1a718ef4e83951a4289ad856612bfb828
|
3 |
+
size 25956352
|
params_shard_2.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:89ab79148c17b16a45b77009716876a6fc4ee5ca7e45566c09a30e0f7b496928
|
3 |
+
size 30970880
|
params_shard_20.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:76207d95f1eb7b73a62f53427d32a6bae959d57c0a52f62e1a46b84417d30b69
|
3 |
+
size 17694720
|
params_shard_21.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a31b16304ac506150d1bf0258d235ff8a57bf2852054fe7dd48292e33867d1a2
|
3 |
+
size 25956352
|
params_shard_22.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4a4695611335ab54244ca3f22c265781628a4e5b5c99c2a055bf66326bca3233
|
3 |
+
size 17694720
|
params_shard_23.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f72dfaa4f07af63caf54390d1b5473d5fd7ff35733bb870c2bc73ecfa713507d
|
3 |
+
size 25956352
|
params_shard_24.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:782989aa50f27319e3a4df654c8df6428f3181b2ec17afd2a7a49d8ae15b89de
|
3 |
+
size 17694720
|
params_shard_25.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b49be62f5a8ff63ddbad15966d1482b8cecf34d17c1a6538747a29db51f03a31
|
3 |
+
size 25956352
|
params_shard_26.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4a91c2a770a72837268651aecac7ef7ef6b0ad7403544b833c12a97126705a73
|
3 |
+
size 17694720
|
params_shard_27.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b7574197dd7a8f44c1f2d2e681d2de02f19986a23d250fe919c1b5f3a2f520a5
|
3 |
+
size 25956352
|
params_shard_28.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:529bf64b8a7082fd571cb06eea78bc938dee13bcf717d80a716651473d03c711
|
3 |
+
size 17694720
|
params_shard_29.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c326908607b3329dac8b6ce05aae2b9ec1190a101832ed4dd14478d4a86fe0d5
|
3 |
+
size 25956352
|
params_shard_3.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e5ee1d4408cf3bc8ac5061fac16c3e4ab1f6c51a7e52a7741d15662608643745
|
3 |
+
size 32837632
|
params_shard_30.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:aba9bf849e1d8c93b01dd81f4c958f935956437da87d9ae290d5144af917936e
|
3 |
+
size 17694720
|
params_shard_31.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5dcaaa11e0748738d2104eb75b2dd2162e8b625edf68820cf6ee3ba613e984df
|
3 |
+
size 25956352
|
params_shard_32.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8817963ae1bb2be36dac335b80039ff5860f32c06c40ad5423ec4948d1eb5d92
|
3 |
+
size 17694720
|
params_shard_33.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:19ee0dad98636bd74e2a2edfb7a3d73fec38854ff540f528385c5aa1cfbb5346
|
3 |
+
size 25956352
|
params_shard_34.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6095cf141423ebf32a7912ac31a8ee91f451cf5f6838068c30a39ae9c3c39df3
|
3 |
+
size 17694720
|
params_shard_35.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:26fa3ffee2e77b8407aae149946a3bc2810bddf1a6fa8ace11a58949d7a0ff41
|
3 |
+
size 25956352
|
params_shard_36.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:68f23aaa6d78a88b0f1e133f5d657ace329a3055f0a71bffded6ab40b5c29bcc
|
3 |
+
size 17694720
|
params_shard_37.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a327653084442e8d951640aa0233933d09b2e6066684bd2c5ef21713a4e2c342
|
3 |
+
size 25956352
|
params_shard_38.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7bdf92ba789fcee33d5f5f0c59c706a807fa700f57761be3344a59d5f90621b6
|
3 |
+
size 17694720
|
params_shard_39.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b0a6147df11b218a3f1152410b24760bc275e1c78d9b3171498cfc1f76303979
|
3 |
+
size 25956352
|
params_shard_4.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a9aa5077d77516d51fabbccca96cffc13fde75c874e51a058f3fc2ae0ca8f942
|
3 |
+
size 17694720
|
params_shard_40.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:adc254053a2f5d7f49b14bd36ca6ed710beb80d0bc63f3a93f9e40e44a086714
|
3 |
+
size 194478080
|
params_shard_41.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4a9f59221a28fa3c8d2f404920e615f50ee9e517830c0db18a021747b0629273
|
3 |
+
size 19447808
|
params_shard_42.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:83db61185c5ba856c4137d93ef8e5f44c327f6a9e7f14aef7ce62cbcf8c5ad47
|
3 |
+
size 17694720
|
params_shard_43.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:23a7347558213b0ceb6fe7b670f1c3bbf5aaa38cbf653a0713ac23d5fa7e8d82
|
3 |
+
size 25961472
|
params_shard_44.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8d4f19ed1128ca36c93a0eb63a1e3013c6aa69b7b9d1037dd2cb3d561a513b08
|
3 |
+
size 17694720
|
params_shard_45.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5a6827a244c2b85b800d9cc58d8ec063cfbaf584be758db7ee5d34b0e13e53e4
|
3 |
+
size 25956352
|
params_shard_46.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fd8d837104f08edec9c762ea756e09dcb0033cd74a9f5e57c101a399b4aa95c2
|
3 |
+
size 17694720
|
params_shard_47.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6417602116e5f6fd0654247581ec1d3d0724680b4d8e79327a515bddb63ade2a
|
3 |
+
size 25956352
|
params_shard_48.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c50519893e3a22372c5a6db31774ab3c55a0b59bf931f87bf14627b054a03457
|
3 |
+
size 17694720
|
params_shard_49.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d46d5a7a563e6eeb1904982ed27ea24627c3c88c1ecab4b321228c7bb4eab615
|
3 |
+
size 25956352
|