junrushao committed on
Commit
1a7b90d
·
1 Parent(s): a79b64d

Initial commit

Browse files
logs.txt ADDED
The diff for this file is too large to render. See raw diff
 
mlc-chat-config.json ADDED
@@ -0,0 +1,41 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "model_type": "gpt_neox",
3
+ "quantization": "q3f16_1",
4
+ "model_config": {
5
+ "use_parallel_residual": true,
6
+ "hidden_size": 2048,
7
+ "intermediate_size": 8192,
8
+ "num_attention_heads": 16,
9
+ "num_hidden_layers": 24,
10
+ "layer_norm_eps": 1e-05,
11
+ "vocab_size": 50304,
12
+ "rotary_pct": 0.25,
13
+ "position_embedding_base": 10000,
14
+ "context_window_size": 2048,
15
+ "head_dim": 128,
16
+ "prefill_chunk_size": 2048,
17
+ "tensor_parallel_shards": 1,
18
+ "ffn_out_dtype": "float32"
19
+ },
20
+ "vocab_size": 50304,
21
+ "context_window_size": 2048,
22
+ "sliding_window_size": -1,
23
+ "prefill_chunk_size": 2048,
24
+ "attention_sink_size": -1,
25
+ "tensor_parallel_shards": 1,
26
+ "mean_gen_len": 128,
27
+ "max_gen_len": 512,
28
+ "shift_fill_factor": 0.3,
29
+ "temperature": 0.7,
30
+ "repetition_penalty": 1.0,
31
+ "top_p": 0.95,
32
+ "conv_template": "LM",
33
+ "pad_token_id": 0,
34
+ "bos_token_id": 0,
35
+ "eos_token_id": 0,
36
+ "tokenizer_files": [
37
+ "tokenizer.json",
38
+ "tokenizer_config.json"
39
+ ],
40
+ "version": "0.1.0"
41
+ }
ndarray-cache-b16.json ADDED
The diff for this file is too large to render. See raw diff
 
ndarray-cache.json ADDED
The diff for this file is too large to render. See raw diff
 
params_shard_0.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9b36c8099f0833ec3a2f8bcd703a383162340c7fb040d43b69f8f21f09621e6f
3
+ size 41852928
params_shard_1.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cd62744e450fa66e74135795edeeeedb07ccd006adf6b7b1b853b2b3606554b8
3
+ size 33305600
params_shard_10.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:54f63837628f33883bdb638a8b615f16a99bcfbd3f62214cc0bca86390aa52c4
3
+ size 30629888
params_shard_11.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6c30a347bd21d22e8cc295ec0cfd5d4936bd7e6f0e907a7bace4b967a56b2bfe
3
+ size 30629888
params_shard_12.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5d7987bc39743f3e902380e5709394e0d9b6af25b643f73bdf6aa25d5f30e4bd
3
+ size 30523392
params_shard_13.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:420be6b550b92218e68d806833aaa0274f1b5c9ae3b00a8eac173c462a4f4eb6
3
+ size 30629888
params_shard_14.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:682c96e4fe877b6d4a4fbfee2c8879a24fe2f86d04d32c461f158d81343daf5d
3
+ size 30629888
params_shard_15.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7373943b052609e0a1ff3142b0e2e36c42fa6a6ba05ff7a63f938187ce8cf2bc
3
+ size 30523392
params_shard_16.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3271cd5026068e6c97a5d4600ddeb774a3708a6fddc1493eb8f992fb4af13a90
3
+ size 30629888
params_shard_17.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e9b9feea27aaa3078bc9cf4582317c5c26c1dba9385ba58e7c6a89c6299a0a8a
3
+ size 30629888
params_shard_18.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:02a7deba87c6fb2c5b4859889586b296b78d07acb4c05d7f2dbf9874f9a3b9b8
3
+ size 41852928
params_shard_19.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5b74a5870510d6bafdbcd759ded63caf641d42b6d55fc5b9714a45a96d0bd59f
3
+ size 30515200
params_shard_2.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8075a7d1f6667c65ae8f87088821cde53c8f6a0e79fb2c21a547ad7528217b97
3
+ size 33202176
params_shard_20.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:948e96888f3d5831314229b8d87590532402634e3824a5432e565e8744fdac7e
3
+ size 5231616
params_shard_3.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ca1e0e23f8847e65a5be9273e121d2d693616f70e3f8381c942792e387fd24dd
3
+ size 30523392
params_shard_4.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f316896b60496b7cf0547862df4f09e150b6ba86dcbc2d92f04a5353f8f70aaa
3
+ size 30629888
params_shard_5.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:873d47d37df390bfdf732a15d0e1a6baa141efc7ef469a224ee26d955bc15d2e
3
+ size 30629888
params_shard_6.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:eb085ade9c0c055c0f6540d351e1a82d52881982443fee9773901ebfd7e086de
3
+ size 30523392
params_shard_7.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:be4a29860865b809c330006252d900499aae4a942902bd73f8c9ec4abce9b709
3
+ size 30629888
params_shard_8.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ba4d8c2aa6bc6da00ac021598e4a40d4983b7b2a62bba7988f716b3600e809d9
3
+ size 30629888
params_shard_9.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7ffa12f6c547ee69854662816bdccd5fef0ec3287aa6c3c3b24d10600fb8698e
3
+ size 30523392
tokenizer.json ADDED
The diff for this file is too large to render. See raw diff
 
tokenizer_config.json ADDED
@@ -0,0 +1,9 @@
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "add_prefix_space": false,
3
+ "bos_token": "<|endoftext|>",
4
+ "eos_token": "<|endoftext|>",
5
+ "name_or_path": "EleutherAI/gpt-neox-20b",
6
+ "special_tokens_map_file": "/admin/home-hailey/.cache/huggingface/hub/models--EleutherAI--gpt-neox-20b/snapshots/4e49eadb5d14bd22f314ec3f45b69a87b88c7691/special_tokens_map.json",
7
+ "tokenizer_class": "GPTNeoXTokenizer",
8
+ "unk_token": "<|endoftext|>"
9
+ }