yusuke111 committed on
Commit
762593d
·
verified ·
1 Parent(s): 4716f87

Training in progress, step 500

Browse files
Files changed (4) hide show
  1. config.json +1 -0
  2. model.safetensors +1 -1
  3. tokenizer.json +1 -1
  4. training_args.bin +1 -1
config.json CHANGED
@@ -23,6 +23,7 @@
23
  "num_attention_heads": 12,
24
  "num_hidden_layers": 12,
25
  "num_key_value_heads": 4,
 
26
  "pretraining_tp": 1,
27
  "rms_norm_eps": 1e-06,
28
  "rope_scaling": null,
 
23
  "num_attention_heads": 12,
24
  "num_hidden_layers": 12,
25
  "num_key_value_heads": 4,
26
+ "pad_token_id": 2,
27
  "pretraining_tp": 1,
28
  "rms_norm_eps": 1e-06,
29
  "rope_scaling": null,
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4e65f89b740d5fc1b17053bf10bfb5697b88c99ebfd1329f7f7f5dba48bf3469
3
  size 510960712
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:41b316cc55e9b2f3fd19820073b08e5091e6463c68fd1a56d5195d9a7a126a19
3
  size 510960712
tokenizer.json CHANGED
@@ -2,7 +2,7 @@
2
  "version": "1.0",
3
  "truncation": {
4
  "direction": "Right",
5
- "max_length": 1024,
6
  "strategy": "LongestFirst",
7
  "stride": 0
8
  },
 
2
  "version": "1.0",
3
  "truncation": {
4
  "direction": "Right",
5
+ "max_length": 2048,
6
  "strategy": "LongestFirst",
7
  "stride": 0
8
  },
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7841616dbb9991b2dfa72fc8aac885c7593967eddb16a303c8a222ad3a62f58d
3
  size 5368
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1165650bfd7557316d9924523f2b62c931aee2703a1455def4018ce87a6b423d
3
  size 5368