Initial commit
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- logs.txt +0 -0
- mlc-chat-config.json +41 -0
- ndarray-cache-b16.json +0 -0
- ndarray-cache.json +0 -0
- params_shard_0.bin +3 -0
- params_shard_1.bin +3 -0
- params_shard_10.bin +3 -0
- params_shard_100.bin +3 -0
- params_shard_101.bin +3 -0
- params_shard_102.bin +3 -0
- params_shard_103.bin +3 -0
- params_shard_104.bin +3 -0
- params_shard_105.bin +3 -0
- params_shard_106.bin +3 -0
- params_shard_107.bin +3 -0
- params_shard_108.bin +3 -0
- params_shard_109.bin +3 -0
- params_shard_11.bin +3 -0
- params_shard_110.bin +3 -0
- params_shard_111.bin +3 -0
- params_shard_112.bin +3 -0
- params_shard_113.bin +3 -0
- params_shard_114.bin +3 -0
- params_shard_115.bin +3 -0
- params_shard_116.bin +3 -0
- params_shard_117.bin +3 -0
- params_shard_118.bin +3 -0
- params_shard_119.bin +3 -0
- params_shard_12.bin +3 -0
- params_shard_120.bin +3 -0
- params_shard_121.bin +3 -0
- params_shard_122.bin +3 -0
- params_shard_123.bin +3 -0
- params_shard_124.bin +3 -0
- params_shard_125.bin +3 -0
- params_shard_126.bin +3 -0
- params_shard_127.bin +3 -0
- params_shard_128.bin +3 -0
- params_shard_129.bin +3 -0
- params_shard_13.bin +3 -0
- params_shard_130.bin +3 -0
- params_shard_131.bin +3 -0
- params_shard_132.bin +3 -0
- params_shard_133.bin +3 -0
- params_shard_134.bin +3 -0
- params_shard_135.bin +3 -0
- params_shard_136.bin +3 -0
- params_shard_137.bin +3 -0
- params_shard_138.bin +3 -0
- params_shard_139.bin +3 -0
logs.txt
ADDED
The diff for this file is too large to render.
See raw diff
|
|
mlc-chat-config.json
ADDED
@@ -0,0 +1,41 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"model_type": "gpt_neox",
|
3 |
+
"quantization": "q4f32_1",
|
4 |
+
"model_config": {
|
5 |
+
"use_parallel_residual": true,
|
6 |
+
"hidden_size": 5120,
|
7 |
+
"intermediate_size": 20480,
|
8 |
+
"num_attention_heads": 40,
|
9 |
+
"num_hidden_layers": 36,
|
10 |
+
"layer_norm_eps": 1e-05,
|
11 |
+
"vocab_size": 50280,
|
12 |
+
"rotary_pct": 0.25,
|
13 |
+
"position_embedding_base": 10000,
|
14 |
+
"context_window_size": 2048,
|
15 |
+
"head_dim": 128,
|
16 |
+
"prefill_chunk_size": 2048,
|
17 |
+
"tensor_parallel_shards": 1,
|
18 |
+
"ffn_out_dtype": "float32"
|
19 |
+
},
|
20 |
+
"vocab_size": 50280,
|
21 |
+
"context_window_size": 2048,
|
22 |
+
"sliding_window_size": -1,
|
23 |
+
"prefill_chunk_size": 2048,
|
24 |
+
"attention_sink_size": -1,
|
25 |
+
"tensor_parallel_shards": 1,
|
26 |
+
"mean_gen_len": 128,
|
27 |
+
"max_gen_len": 512,
|
28 |
+
"shift_fill_factor": 0.3,
|
29 |
+
"temperature": 0.7,
|
30 |
+
"repetition_penalty": 1.0,
|
31 |
+
"top_p": 0.95,
|
32 |
+
"conv_template": "dolly",
|
33 |
+
"pad_token_id": 0,
|
34 |
+
"bos_token_id": 0,
|
35 |
+
"eos_token_id": 0,
|
36 |
+
"tokenizer_files": [
|
37 |
+
"tokenizer.json",
|
38 |
+
"tokenizer_config.json"
|
39 |
+
],
|
40 |
+
"version": "0.1.0"
|
41 |
+
}
|
ndarray-cache-b16.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
ndarray-cache.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
params_shard_0.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9976b806ae9108ef3be3ba927140c7b404b894b4f9b3ce03d5b9470953596ebb
|
3 |
+
size 128716800
|
params_shard_1.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b98ddda72590be02f3c8bda213aebe578bcbba289327c4c9ed3a936b5ec6a0ed
|
3 |
+
size 39321600
|
params_shard_10.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:76dfe73daae47e483f7d21725677f920e964a4f7c5c217c7f2fe25078821a4af
|
3 |
+
size 32901120
|
params_shard_100.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1b05c6f7c8ef154813112e1303f7666abd10eaf724734d9bc5866fe1c3de7630
|
3 |
+
size 52428800
|
params_shard_101.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:032863019d275bc9b52cdff8e0afaaa9e6ef4d18bc86fdc1324f3fe72b7f3c69
|
3 |
+
size 39321600
|
params_shard_102.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:00913192f532777a024810394d9026fad4869a71b78fc621a21732321194fbd8
|
3 |
+
size 32901120
|
params_shard_103.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:790629a23b9f5ee426a33c2fa36bbfe8787510de3173d6f70d0dea87527667d3
|
3 |
+
size 52428800
|
params_shard_104.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a1d2d376a1ff5ae04cd92ce2d40be9c91e6cc721b2468b425101069652e79c01
|
3 |
+
size 52428800
|
params_shard_105.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e55b8f9839e854a042d77b467128ea797b1db5d8efb1557346006ca7c1cee33e
|
3 |
+
size 39321600
|
params_shard_106.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c035055e176671a9096067825549babfeda5fff9db8a7d0d213ed4939925fcd9
|
3 |
+
size 32901120
|
params_shard_107.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:38cfd6b7514997bb6c4157b853f0c2972f3cb99a647f94b97cd183eefdf5c13e
|
3 |
+
size 52428800
|
params_shard_108.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:80d24ab890bb230412c06b6c2c7508c861cf62245c7c611dc0eb740b8c5be8b6
|
3 |
+
size 52428800
|
params_shard_109.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bdf225d650e3eb8d32fc4e47d0db7bdb87694b4d0432c7d95ae5394347174e87
|
3 |
+
size 39321600
|
params_shard_11.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3ba85159738dbe0f54bc48b7d77fa484f6100ee513c07f438f20842fa490d104
|
3 |
+
size 52428800
|
params_shard_110.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1759973358629fba694c68af30d5d4dbcc4ef4da8495d955b99ea3334b1ce1a1
|
3 |
+
size 32901120
|
params_shard_111.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0df6f94290a4fcfc1ae989bad38a90f85dd8fd7964df1d1b8ef49a1f107b9af7
|
3 |
+
size 52428800
|
params_shard_112.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:47deda44de0f8a655ce5dfbdfe08ccada0ac2fbe146408aac6daf68088133d5a
|
3 |
+
size 52428800
|
params_shard_113.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5c5c182f1bb32d7f78119621ddb16931ef5824d76e66b4fce77926e60edfbb54
|
3 |
+
size 39321600
|
params_shard_114.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b43945f3c9ee21bdfbdc4327345cdfa3a4e67c6b9fe5ba8a5cc5ce853cf09fa1
|
3 |
+
size 32901120
|
params_shard_115.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:56bee70f8c09478c5c4ce5c7e8c39b009c55f8f2202e60b3515f64e4f06f84d5
|
3 |
+
size 52428800
|
params_shard_116.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2eb51b011481ddd990b9a382556be68855165155443fff3e9087bd4961231d9e
|
3 |
+
size 52428800
|
params_shard_117.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:318da5af7f9e0cc0813cfd63f86cd4d85c82d1c0ea086dbafae5180d9b0edae3
|
3 |
+
size 39321600
|
params_shard_118.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0c06b92c7c421afa79fec4119cccec1f341ccecffa42c176b366bbbae5adece3
|
3 |
+
size 32901120
|
params_shard_119.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1c2774faa261dc4a86ee92959ac646a5eb2f272182d2f66aa19a90d4e44b36c1
|
3 |
+
size 52428800
|
params_shard_12.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a5cc20b136854a19e193cce36be69861bc0e4f978ef2cba6ed1857b5b65bd0af
|
3 |
+
size 52428800
|
params_shard_120.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ee442c1fd97fd869ec6b23d77fa78b792347f89add6c13e649ae426441f72811
|
3 |
+
size 52428800
|
params_shard_121.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cc0563e73e623e62e1e454a12cdfe4f26a97ca2f668cec619bd64722d29b4e12
|
3 |
+
size 39321600
|
params_shard_122.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e8beb135d1d8f2ca98b17a9749052d3a8c32a7eeb56618a3af9a4459f8937b89
|
3 |
+
size 32901120
|
params_shard_123.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:447b588232a02c02c19b9cf905a2c6636a3789ec130897b741fb98e578cb180f
|
3 |
+
size 52428800
|
params_shard_124.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:21ceb71b41ba714453f9bd2b7a8330d0a4da119e71b94fac6763eff82d3f0be0
|
3 |
+
size 52428800
|
params_shard_125.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b9705444134f42c981351a2e1e14265d5f5e4cdd1dd670e92ecc3e5e71b0569b
|
3 |
+
size 39321600
|
params_shard_126.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f99196434e3be2c9ea7249301fe170bf4d2cda5a46d4c108476ff98a2cca79c3
|
3 |
+
size 32901120
|
params_shard_127.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1d7fb00c29760d3d2e38292b1ef8173eb13ecf4e04343218c3771e70273e8557
|
3 |
+
size 52428800
|
params_shard_128.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e5f51007bfa801da002a47ef5065b2931cec21f7c1673763fbf138e789a18f5e
|
3 |
+
size 52428800
|
params_shard_129.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b791400e017d307f01e0ffbc2cdadb4161cc6a1ad23b96b9ff44519a9dfc0201
|
3 |
+
size 39321600
|
params_shard_13.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:56842fbc430608687bed499c23316e519d0b69bc125a4379edd47adc0c346401
|
3 |
+
size 39321600
|
params_shard_130.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:59f9e7fb402889ad2f5291a5b9efbbf661167a2afd13fb08e1e41a0ed546d83a
|
3 |
+
size 32901120
|
params_shard_131.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c621beac8fe1938e8e131e1cc0f2fca34304860c029d5caf6ee4c7ec3f3e42b7
|
3 |
+
size 52428800
|
params_shard_132.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9d701f3c97e4cc3a42723e638b0c7882b68afe253cec919afdf18602426b2eba
|
3 |
+
size 52428800
|
params_shard_133.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2d972ebe8c817acd3d601df7987a6f0f33c3ed64cb0c941a7daddcc0bd25f37a
|
3 |
+
size 39321600
|
params_shard_134.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6ce647982e689b905cb01d288bcbfc8e3a955cbb48f6c5d5494d8c32e1a1d5b8
|
3 |
+
size 32901120
|
params_shard_135.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b4373d3db0bf37fd21a4371f0c1c6a4d07fa7e427f48d5550c70bceaebeb1bf9
|
3 |
+
size 52428800
|
params_shard_136.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f533ca207a4efa162c5331274659a53b0a003f9db33011d9e0d4982fc4708880
|
3 |
+
size 52428800
|
params_shard_137.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:82d7968ee1952f066a80e16233e611b97d096c54169d59a7dcbd3f32bc6b5e7a
|
3 |
+
size 39321600
|
params_shard_138.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:323ed26e6afd714e117ba1b747d37f74305cf647af43f908966e32bcfe0f50a6
|
3 |
+
size 32901120
|
params_shard_139.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:15b1ef3dacea137ed264e2a34e1ef842c9af41b294ddbaf7d6fbf9c5f705b8cd
|
3 |
+
size 52428800
|