davidgortega committed on
Commit
9b2b582
·
1 Parent(s): 292a2a6
This view is limited to 50 files because it contains too many changes.   See raw diff
Q4/added_tokens.json ADDED
@@ -0,0 +1,42 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "\t\t": 50294,
3
+ "\t\t\t": 50293,
4
+ "\t\t\t\t": 50292,
5
+ "\t\t\t\t\t": 50291,
6
+ "\t\t\t\t\t\t": 50290,
7
+ "\t\t\t\t\t\t\t": 50289,
8
+ "\t\t\t\t\t\t\t\t": 50288,
9
+ "\t\t\t\t\t\t\t\t\t": 50287,
10
+ "  ": 50286,
11
+ "   ": 50285,
12
+ "    ": 50284,
13
+ "     ": 50283,
14
+ "      ": 50282,
15
+ "       ": 50281,
16
+ "        ": 50280,
17
+ "         ": 50279,
18
+ "          ": 50278,
19
+ "           ": 50277,
20
+ "            ": 50276,
21
+ "             ": 50275,
22
+ "              ": 50274,
23
+ "               ": 50273,
24
+ "                ": 50272,
25
+ "                 ": 50271,
26
+ "                  ": 50270,
27
+ "                   ": 50269,
28
+ "                    ": 50268,
29
+ "                     ": 50267,
30
+ "                      ": 50266,
31
+ "                       ": 50265,
32
+ "                        ": 50264,
33
+ "                         ": 50263,
34
+ "                          ": 50262,
35
+ "                           ": 50261,
36
+ "                            ": 50260,
37
+ "                             ": 50259,
38
+ "                              ": 50258,
39
+ "                               ": 50257,
40
+ "<|im_end|>": 50295,
41
+ "<|im_start|>": 50296
42
+ }
Q4/merges.txt ADDED
The diff for this file is too large to render. See raw diff
 
Q4/mlc-chat-config.json ADDED
@@ -0,0 +1,75 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "model_type": "phi-msft",
3
+ "quantization": "q4f32_1",
4
+ "model_config": {
5
+ "model_type": "phi-msft",
6
+ "vocab_size": 51200,
7
+ "n_positions": 2048,
8
+ "n_embd": 2560,
9
+ "n_layer": 32,
10
+ "n_inner": 10240,
11
+ "n_head": 32,
12
+ "rotary_dim": 32,
13
+ "position_embedding_base": 10000,
14
+ "layer_norm_epsilon": 1e-05,
15
+ "context_window_size": 2048,
16
+ "prefill_chunk_size": 2048,
17
+ "n_head_kv": 32,
18
+ "head_dim": 80,
19
+ "tensor_parallel_shards": 1
20
+ },
21
+ "vocab_size": 51200,
22
+ "context_window_size": 2048,
23
+ "sliding_window_size": -1,
24
+ "prefill_chunk_size": 2048,
25
+ "attention_sink_size": -1,
26
+ "tensor_parallel_shards": 1,
27
+ "mean_gen_len": 128,
28
+ "max_gen_len": 512,
29
+ "shift_fill_factor": 0.3,
30
+ "temperature": 0.7,
31
+ "presence_penalty": 0.0,
32
+ "frequency_penalty": 0.0,
33
+ "repetition_penalty": 1.0,
34
+ "top_p": 0.95,
35
+ "conv_template": {
36
+ "name": "chatml",
37
+ "system_template": "<|im_start|>system\n{system_message}",
38
+ "system_message": "A conversation between a user and an LLM-based AI assistant. The assistant gives helpful and honest answers.",
39
+ "add_role_after_system_message": true,
40
+ "roles": {
41
+ "user": "<|im_start|>user",
42
+ "assistant": "<|im_start|>assistant"
43
+ },
44
+ "role_templates": {
45
+ "user": "{user_message}",
46
+ "assistant": "{assistant_message}",
47
+ "tool": "{tool_message}"
48
+ },
49
+ "messages": [],
50
+ "seps": [
51
+ "<|im_end|>\n"
52
+ ],
53
+ "role_content_sep": "\n",
54
+ "role_empty_sep": "\n",
55
+ "stop_str": [
56
+ "<|im_end|>"
57
+ ],
58
+ "stop_token_ids": [
59
+ 2
60
+ ],
61
+ "function_string": "",
62
+ "use_function_calling": false
63
+ },
64
+ "pad_token_id": 0,
65
+ "bos_token_id": 1,
66
+ "eos_token_id": 2,
67
+ "tokenizer_files": [
68
+ "tokenizer.json",
69
+ "vocab.json",
70
+ "merges.txt",
71
+ "added_tokens.json",
72
+ "tokenizer_config.json"
73
+ ],
74
+ "version": "0.1.0"
75
+ }
Q4/ndarray-cache-b16.json ADDED
The diff for this file is too large to render. See raw diff
 
Q4/ndarray-cache.json ADDED
The diff for this file is too large to render. See raw diff
 
Q4/params_shard_0.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e4b95e1f45739e2328f291d359f1c96274954e547467cb34cf1c97e6dae2840e
3
+ size 65536000
Q4/params_shard_1.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ccef00b8d4f3b660ce29c555710532a6ab198f50591f643905b25a20621c8821
3
+ size 23091200
Q4/params_shard_10.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:df5b7d8c5f1accd5a6636b1e86d8b9f4733b384d1d7951a03f2e7f3a26a74054
3
+ size 29521920
Q4/params_shard_11.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3d55e06b1a2d4af3b75dbf30874c1c1ba04dd7082ba3a72fcf7bfe24ea1aded8
3
+ size 29542400
Q4/params_shard_12.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e436782faf7c1192cce4a6d5c82030b345a9315d89f2f82554b233aa42fa277f
3
+ size 29521920
Q4/params_shard_13.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:de09f2311dc9f5074c626b72244328aea0332a6848cc8c3bfab22772d14f7145
3
+ size 29521920
Q4/params_shard_14.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0753154b5ee4680e7f9f7e15c5d870c262d3b4e28d1c175da65fe12fcbac7ece
3
+ size 29542400
Q4/params_shard_15.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b8e6ed6f3b45d5d5a598a163272d47087f5f617033ef6860a49c360162afbb86
3
+ size 29521920
Q4/params_shard_16.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2cac09098f916b0381169e17fb1196ed034b8d90c2dedf769568403e20da37ce
3
+ size 29521920
Q4/params_shard_17.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8a19ae63e4dd75006db9a053736fa204014b88a6498491a116a4ba3ccd71a0b5
3
+ size 29542400
Q4/params_shard_18.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a267eba85412b74344d3efd7a37ed93117eca91a8265986e6fea2f3025ce160e
3
+ size 29521920
Q4/params_shard_19.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5651d41313946a9b440c26e8afc44193de112321ba1a9ead35e153538f3a921c
3
+ size 29521920
Q4/params_shard_2.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ec6bffa22123aec682470d5c8cfe252c44bb2a7bc013683eb930022086e89c53
3
+ size 29521920
Q4/params_shard_20.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1301faab07797091d8b6350f6d4ce1a8735cdf8d1f85afd2cbce5080e2bcbbef
3
+ size 29542400
Q4/params_shard_21.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:953a7bc687d5710400f5c6c2f7b53fd3609d6b329c7daae3607e69401c6909bf
3
+ size 29521920
Q4/params_shard_22.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e749447891d675ea00200df12ddfd3998775f17ccd331ff1a053133c7db5b1c7
3
+ size 29521920
Q4/params_shard_23.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4801702e8e2e2e1f42a1c57ae8ffccad2afcfea9172f4724f8f11bde464c8022
3
+ size 29542400
Q4/params_shard_24.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b0c251282f583f6648d4447fa348cd3c03e6a00584b24c087271f2c21b0f5f6b
3
+ size 29521920
Q4/params_shard_25.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6f0c8e54cdceedf53b4ff1bcbafe98238b42d69a10476c79799c2f301a6b74a3
3
+ size 29521920
Q4/params_shard_26.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:079ed7a03daa12ec52538a64032b00b1498446fbd6637b5dfbee0280123b1e80
3
+ size 29542400
Q4/params_shard_27.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f41c63de2204ba1f1615edef6b9c0ae850f5e3ca9ce0047ceda10c677de617e3
3
+ size 29521920
Q4/params_shard_28.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fc88e212060764796598ca13c6ee1393951504c92212318b5d7018912ea7676e
3
+ size 29521920
Q4/params_shard_29.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cba076c80c0cbdbd56b04f56188fa9eadfac41d1578fbf88e8793aa03ab840ad
3
+ size 29542400
Q4/params_shard_3.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d489696fa8dd1f461e7c15dd66d22def80395b0c1bf1bad30874f4d1c01b30c5
3
+ size 29521920
Q4/params_shard_30.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2701bd507840e5614c4e10dbd0f1651486867951c0271b446dbd6f5182e56cb3
3
+ size 29521920
Q4/params_shard_31.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b6d8ecb026a0bf35f77a5ebd93b0b0bd947695000ae9550ac0d30d39533e32fb
3
+ size 29521920
Q4/params_shard_32.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:924638ee72c1ca3d9a84bf4ae9a4882f7d91cf7a138be5b541cab4422f7ad1af
3
+ size 29542400
Q4/params_shard_33.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1bff7d48f6f85ea0980ce6f7455c1ce9cd19bb47e1b2855fa88d6034363a4a7e
3
+ size 29521920
Q4/params_shard_34.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9689b8351036c24f100f450fee9c82f86214494e3aa67b2ab6ff017a9cf6164d
3
+ size 29521920
Q4/params_shard_35.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3afa86ec9ec160f2171d7eec890a47731a4d81458ceb9ce119a730271ce6af1d
3
+ size 29542400
Q4/params_shard_36.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:423e57402c9a796b35bc9452e86086d46203a0b8711901950302c1192cf718e7
3
+ size 29521920
Q4/params_shard_37.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dde0e5b0b18d1d8d35bd97327c466bbf2bc4ee8a5031eec3dc67f100474f148f
3
+ size 29521920
Q4/params_shard_38.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cbef37e188ba6b06e1f2ede88a332783bc87b6cd32ce4f008117ff817e6ae473
3
+ size 29542400
Q4/params_shard_39.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5e3f287dc7e2d3b9e7a8571e9564afc3c01a8f2fa87094d363a98f2a2eba181d
3
+ size 29521920
Q4/params_shard_4.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:96876669a486a16c3542f95b3ff51b3d69b712515f7a9924137a167e1a9247fb
3
+ size 65536000
Q4/params_shard_40.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:168b8ef1bddfe748e0e15b6bf7e7b132b83bb4c6b63292bb01ce3003f4134da2
3
+ size 29521920
Q4/params_shard_41.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1ef43fdf94042275615cbf39e9463a5db3d97c9047ed5bffba978171e3a7124a
3
+ size 29552640
Q4/params_shard_42.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c2f54bfae1bc0f74edbef9fbb697ac1cb7fc9b6840c8ce3c30ff0603b01e71a3
3
+ size 29521920
Q4/params_shard_43.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2faa6faf3876765c3706faa5c68a05fa812379718802e435f4560ec340cfbd32
3
+ size 29521920
Q4/params_shard_44.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:97161f17d4c837463d5fa0d7ef3a5a9ae8747ceb2d4455c5040752eb33088249
3
+ size 29542400
Q4/params_shard_45.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4420978cb2607413ebfcbce12f9141aa4edd491224eeb7150f8bfd8843ddca60
3
+ size 29521920
Q4/params_shard_46.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:683f8d750932903a226b0f1cd338e5de4d479201879c8d4f06518559a2202f1f
3
+ size 29521920
Q4/params_shard_47.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:22caa03317f257c2b1513283453b1f8b6d4aae2cc74743873a4aaed924e1a503
3
+ size 29542400
Q4/params_shard_48.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:79421d672c13266aeab402b76af4aa91945e0fd4b60a8218431556dbe78c41f0
3
+ size 29521920
Q4/params_shard_49.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ccbc1a21d0ecd77ebcb777040d9d5aa5e00d2e9acca23dc1c87ca70774458da5
3
+ size 29521920