oyxy2019 committed on
Commit
dd39764
·
1 Parent(s): 4b0084c

Training in progress, step 500

Browse files
.gitignore ADDED
@@ -0,0 +1 @@
 
 
1
+ checkpoint-*/
added_tokens.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ {
2
+ "[PAD]": 50257
3
+ }
config.json ADDED
@@ -0,0 +1,34 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "IDEA-CCNL/Wenzhong-GPT2-110M",
3
+ "activation_function": "gelu_fast",
4
+ "architectures": [
5
+ "GPT2LMHeadModel"
6
+ ],
7
+ "attn_pdrop": 0.1,
8
+ "bos_token_id": 50256,
9
+ "embd_pdrop": 0.1,
10
+ "eos_token_id": 50256,
11
+ "initializer_range": 0.02,
12
+ "layer_norm_epsilon": 1e-05,
13
+ "model_type": "gpt2",
14
+ "n_ctx": 1024,
15
+ "n_embd": 768,
16
+ "n_head": 12,
17
+ "n_inner": 3072,
18
+ "n_layer": 12,
19
+ "n_positions": 1024,
20
+ "reorder_and_upcast_attn": false,
21
+ "resid_pdrop": 0.1,
22
+ "scale_attn_by_inverse_layer_idx": false,
23
+ "scale_attn_weights": true,
24
+ "summary_activation": null,
25
+ "summary_first_dropout": 0.1,
26
+ "summary_proj_to_labels": true,
27
+ "summary_type": "cls_index",
28
+ "summary_use_proj": true,
29
+ "tokenizer_class": "GPT2TokenizerFast",
30
+ "torch_dtype": "float32",
31
+ "transformers_version": "4.28.1",
32
+ "use_cache": true,
33
+ "vocab_size": 50258
34
+ }
merges.txt ADDED
The diff for this file is too large to render. See raw diff
 
pytorch_model.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ea569aa7c27a94afa2509340ebab964e23b21c8d1f3ba48f898db665e12a1aa8
3
+ size 510401085
runs/May01_08-47-25_node13/1682930853.3170443/events.out.tfevents.1682930853.node13 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4d91559f279e2cbe966e1b55e1c1cae68d04761d79f3c42b0a7f6269df1e3384
3
+ size 5603
runs/May01_08-47-25_node13/events.out.tfevents.1682930853.node13 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f73a5e58c224e10d582126fa8e71179f1030df88a8ca59bf3b81eb9606b2bcac
3
+ size 4172
runs/May01_08-50-18_node13/1682931023.6832337/events.out.tfevents.1682931023.node13 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e70c19f1f363272770b289160495b7738d611a9d2feb13f76b6806f532aa9ea8
3
+ size 5603
runs/May01_08-50-18_node13/events.out.tfevents.1682931023.node13 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bebb955edc812b0cf2962ffcb381d2d82c24d218fb9b309914950f2f8e5f2511
3
+ size 4172
runs/May01_12-41-55_node13/1682944920.765208/events.out.tfevents.1682944920.node13 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4b52f199db2842989370e1e60ca9003ed5cadae3af525467f3bc3d8ac517a1bd
3
+ size 5603
runs/May01_12-41-55_node13/events.out.tfevents.1682944920.node13 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b4740683686d1b09e753046dbd1eb01aaad3a7b3ccf2bd46015b09810c4d7e1d
3
+ size 4172
runs/May01_15-10-20_node13/1682953825.8277748/events.out.tfevents.1682953825.node13 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8366b6372a0f977a48065a974c629b447b19b6d9c75a63797af36e31123ef6b6
3
+ size 5603
runs/May01_15-10-20_node13/events.out.tfevents.1682953825.node13 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:abd99b2be241a4d7d5463b3eb7ad5264d2a21d2e788f2cd7a7c7f4b9e941f554
3
+ size 4172
runs/May01_15-14-22_node13/1682954067.9161758/events.out.tfevents.1682954067.node13 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d70adfbbd93a583500febfc367943f0a0fb369473ab02ef625f71a392cd11b1b
3
+ size 5603
runs/May01_15-14-22_node13/events.out.tfevents.1682954067.node13 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9eac22c5bfba65b8cef8a56e07fcb05a73dee9ed737ad2df5caf5e25e3d80bdb
3
+ size 4172
special_tokens_map.json ADDED
@@ -0,0 +1,6 @@
 
 
 
 
 
 
 
1
+ {
2
+ "bos_token": "<|endoftext|>",
3
+ "eos_token": "<|endoftext|>",
4
+ "pad_token": "<|endoftext|>",
5
+ "unk_token": "<|endoftext|>"
6
+ }
tokenizer_config.json ADDED
@@ -0,0 +1,33 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "add_bos_token": false,
3
+ "add_prefix_space": false,
4
+ "bos_token": {
5
+ "__type": "AddedToken",
6
+ "content": "<|endoftext|>",
7
+ "lstrip": false,
8
+ "normalized": true,
9
+ "rstrip": false,
10
+ "single_word": false
11
+ },
12
+ "clean_up_tokenization_spaces": true,
13
+ "eos_token": {
14
+ "__type": "AddedToken",
15
+ "content": "<|endoftext|>",
16
+ "lstrip": false,
17
+ "normalized": true,
18
+ "rstrip": false,
19
+ "single_word": false
20
+ },
21
+ "errors": "replace",
22
+ "model_max_length": 1024,
23
+ "pad_token": null,
24
+ "tokenizer_class": "GPT2Tokenizer",
25
+ "unk_token": {
26
+ "__type": "AddedToken",
27
+ "content": "<|endoftext|>",
28
+ "lstrip": false,
29
+ "normalized": true,
30
+ "rstrip": false,
31
+ "single_word": false
32
+ }
33
+ }
training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:394085eb8bbcb95faddad939ecad0528ea2408cb361f7b47a48cb0eaba8a0e0c
3
+ size 3643
vocab.json ADDED
The diff for this file is too large to render. See raw diff