yosefw committed on
Commit
c8c9b11
·
verified ·
1 Parent(s): 0f19ddc

Training in progress, step 500

Browse files
config.json CHANGED
@@ -25,7 +25,7 @@
25
  "rope_theta": 10000.0,
26
  "tie_word_embeddings": true,
27
  "torch_dtype": "float32",
28
- "transformers_version": "4.49.0",
29
  "use_cache": true,
30
  "vocab_size": 32002
31
  }
 
25
  "rope_theta": 10000.0,
26
  "tie_word_embeddings": true,
27
  "torch_dtype": "float32",
28
+ "transformers_version": "4.45.0",
29
  "use_cache": true,
30
  "vocab_size": 32002
31
  }
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c177e501c14664d07d484f37f6b1ce28486c3ab71b98078b7d00b34235a115ae
3
  size 1650139320
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:22bcd59ed7a5f00c77add3504bc711437d4a2ffa1655fe6290f44f26f3de6a02
3
  size 1650139320
runs/Mar01_11-18-35_8a02e0a9a63c/events.out.tfevents.1740827938.8a02e0a9a63c.21.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ca0b15a46a15cabbe7eac2a9968aba4ac9357faf93bdd36ae56f0d94a91e5d53
3
+ size 6251
special_tokens_map.json CHANGED
@@ -17,5 +17,5 @@
17
  ],
18
  "bos_token": "<|im_start|>",
19
  "eos_token": "<|im_end|>",
20
- "pad_token": "<|im_end|>"
21
  }
 
17
  ],
18
  "bos_token": "<|im_start|>",
19
  "eos_token": "<|im_end|>",
20
+ "pad_token": "<|end_of_text|>"
21
  }
tokenizer.json CHANGED
@@ -1,6 +1,11 @@
1
  {
2
  "version": "1.0",
3
- "truncation": null,
 
 
 
 
 
4
  "padding": null,
5
  "added_tokens": [
6
  {
 
1
  {
2
  "version": "1.0",
3
+ "truncation": {
4
+ "direction": "Right",
5
+ "max_length": 256,
6
+ "strategy": "LongestFirst",
7
+ "stride": 0
8
+ },
9
  "padding": null,
10
  "added_tokens": [
11
  {
tokenizer_config.json CHANGED
@@ -2079,6 +2079,6 @@
2079
  "attention_mask"
2080
  ],
2081
  "model_max_length": 131072,
2082
- "pad_token": "<|im_end|>",
2083
- "tokenizer_class": "PreTrainedTokenizer"
2084
  }
 
2079
  "attention_mask"
2080
  ],
2081
  "model_max_length": 131072,
2082
+ "pad_token": "<|end_of_text|>",
2083
+ "tokenizer_class": "PreTrainedTokenizerFast"
2084
  }
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4bd00b62f35c925fb0005c897a90a061271d9ec160ff4f7dc68613345ff3bd70
3
- size 5624
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9efd98ef46ff56db0f8221aea744a03ebc708faa2d971e3ee13380034461705c
3
+ size 5496