upload model
Browse files- .gitattributes +18 -0
- added_tokens.json +3 -0
- chat_template.jinja +3 -0
- config.json +3 -0
- generation_config.json +3 -0
- global_step16000/.gitattributes +8 -0
- global_step16000/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt +3 -0
- global_step16000/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt +3 -0
- global_step16000/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt +3 -0
- global_step16000/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt +3 -0
- global_step16000/zero_pp_rank_0_mp_rank_00_model_states.pt +3 -0
- global_step16000/zero_pp_rank_1_mp_rank_00_model_states.pt +3 -0
- global_step16000/zero_pp_rank_2_mp_rank_00_model_states.pt +3 -0
- global_step16000/zero_pp_rank_3_mp_rank_00_model_states.pt +3 -0
- latest +3 -0
- merges.txt +3 -0
- rng_state_0.pth +3 -0
- rng_state_1.pth +3 -0
- rng_state_2.pth +3 -0
- rng_state_3.pth +3 -0
- scheduler.pt +3 -0
- special_tokens_map.json +3 -0
- tokenizer_config.json +3 -0
- trainer_state.json +3 -0
- training_args.bin +3 -0
- vocab.json +3 -0
- zero_to_fp32.py +3 -0
.gitattributes
CHANGED
|
@@ -33,3 +33,21 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
|
|
| 33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
| 34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
| 35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
| 34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
| 35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
| 36 |
+
rng_state_3.pth filter=lfs diff=lfs merge=lfs -text
|
| 37 |
+
latest filter=lfs diff=lfs merge=lfs -text
|
| 38 |
+
rng_state_0.pth filter=lfs diff=lfs merge=lfs -text
|
| 39 |
+
rng_state_2.pth filter=lfs diff=lfs merge=lfs -text
|
| 40 |
+
rng_state_1.pth filter=lfs diff=lfs merge=lfs -text
|
| 41 |
+
scheduler.pt filter=lfs diff=lfs merge=lfs -text
|
| 42 |
+
special_tokens_map.json filter=lfs diff=lfs merge=lfs -text
|
| 43 |
+
tokenizer_config.json filter=lfs diff=lfs merge=lfs -text
|
| 44 |
+
vocab.json filter=lfs diff=lfs merge=lfs -text
|
| 45 |
+
chat_template.jinja filter=lfs diff=lfs merge=lfs -text
|
| 46 |
+
generation_config.json filter=lfs diff=lfs merge=lfs -text
|
| 47 |
+
merges.txt filter=lfs diff=lfs merge=lfs -text
|
| 48 |
+
zero_to_fp32.py filter=lfs diff=lfs merge=lfs -text
|
| 49 |
+
training_args.bin filter=lfs diff=lfs merge=lfs -text
|
| 50 |
+
added_tokens.json filter=lfs diff=lfs merge=lfs -text
|
| 51 |
+
config.json filter=lfs diff=lfs merge=lfs -text
|
| 52 |
+
trainer_state.json filter=lfs diff=lfs merge=lfs -text
|
| 53 |
+
global_step16000 filter=lfs diff=lfs merge=lfs -text
|
added_tokens.json
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:58b54bbe36fc752f79a24a271ef66a0a0830054b4dfad94bde757d851968060b
|
| 3 |
+
size 605
|
chat_template.jinja
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:cd8e9439f0570856fd70470bf8889ebd8b5d1107207f67a5efb46e342330527f
|
| 3 |
+
size 2507
|
config.json
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ebeb2c8c5b579645b34f43a9192d77e869763cc4a71f16515a0d6661b6a6fc6e
|
| 3 |
+
size 1325
|
generation_config.json
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ca471b4abe1283087b4f5b260b9512e084b88c106b984db639302ca07fb823ea
|
| 3 |
+
size 143
|
global_step16000/.gitattributes
ADDED
|
@@ -0,0 +1,8 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt filter=lfs diff=lfs merge=lfs -text
|
| 2 |
+
bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt filter=lfs diff=lfs merge=lfs -text
|
| 3 |
+
zero_pp_rank_0_mp_rank_00_model_states.pt filter=lfs diff=lfs merge=lfs -text
|
| 4 |
+
zero_pp_rank_1_mp_rank_00_model_states.pt filter=lfs diff=lfs merge=lfs -text
|
| 5 |
+
zero_pp_rank_2_mp_rank_00_model_states.pt filter=lfs diff=lfs merge=lfs -text
|
| 6 |
+
zero_pp_rank_3_mp_rank_00_model_states.pt filter=lfs diff=lfs merge=lfs -text
|
| 7 |
+
bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt filter=lfs diff=lfs merge=lfs -text
|
| 8 |
+
bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt filter=lfs diff=lfs merge=lfs -text
|
global_step16000/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ce683f404edb1c197836049f66aedf573963dccf3bb79bf1a94af689dec94b6d
|
| 3 |
+
size 22846856147
|
global_step16000/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:6f7c79133560d1dfb77f3ce4f0e527c3a4cbd5dc5c93808d4e2889b426ee0264
|
| 3 |
+
size 22846856147
|
global_step16000/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f9fc863c14b18a2ac2ed85dba99490da98df69058b1832d2053620d32e6ac9de
|
| 3 |
+
size 22846856147
|
global_step16000/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f9b7aa7fd926f46d569a35beadf07ec898de93bdeb7f892406be830f4e78442a
|
| 3 |
+
size 22846856147
|
global_step16000/zero_pp_rank_0_mp_rank_00_model_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:cf57470c7cba6bba7d2050bee5414fb25808faee9e8d71a201c71fac5044c9cf
|
| 3 |
+
size 174112
|
global_step16000/zero_pp_rank_1_mp_rank_00_model_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:668783ded16f8cc0ac6821d74e81ee53ba96f5fa88850f4dbc7e46d31091f4e6
|
| 3 |
+
size 174112
|
global_step16000/zero_pp_rank_2_mp_rank_00_model_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:104ebe1ac3531dc2f86a61246f236c70ab610a3c5836e00d7ef2ae26ab28a7c2
|
| 3 |
+
size 174112
|
global_step16000/zero_pp_rank_3_mp_rank_00_model_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:33592e333f6b3e834c9846cdca59b0fdc9f97a4178f54b0634d83ee9188b47f5
|
| 3 |
+
size 174112
|
latest
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:244601971f0ff5b49377c4ed77323417c7b021b830a87cbfe82331a031d8e6d3
|
| 3 |
+
size 16
|
merges.txt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:8831e4f1a044471340f7c0a83d7bd71306a5b867e95fd870f74d0c5308a904d5
|
| 3 |
+
size 1671853
|
rng_state_0.pth
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:2fe6b873f1da64bb980afe982fc1c6b6bc461ad8c33073d856804323f64b26d9
|
| 3 |
+
size 15429
|
rng_state_1.pth
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:13db4dd10b22b5464f5ef0b539152b46390eae6a827b355108cb54b1af2eb830
|
| 3 |
+
size 15429
|
rng_state_2.pth
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:06e293f13fb6e873e8081636b6b07115410b397c55f1ed08b8772b059c8eb74e
|
| 3 |
+
size 15429
|
rng_state_3.pth
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c595c077664f94b7f91088561951be20e39483e01865774a83bc46f3971a3152
|
| 3 |
+
size 15429
|
scheduler.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:bd4678f15aaba367ef8b645c445105c6d4d7feab0cb33e2ce7651846307aca90
|
| 3 |
+
size 1401
|
special_tokens_map.json
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:76862e765266b85aa9459767e33cbaf13970f327a0e88d1c65846c2ddd3a1ecd
|
| 3 |
+
size 613
|
tokenizer_config.json
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f06d54777a4c59c23ed608b2529c49f6a66853df9bc8a254d52eeb3b99d7c827
|
| 3 |
+
size 4712
|
trainer_state.json
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:2666c0489b52b9234d7ebb53a946b4c9ded033a3adad639c87ae4c9be8a38c27
|
| 3 |
+
size 280292
|
training_args.bin
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b218b9da0a7ad738f3bbfe41d4654d531f153b9dae589558b832df6c05948f56
|
| 3 |
+
size 6161
|
vocab.json
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:87a257b04b17642a0688c98cd1df89c398bda4fee532d6f88b38a659ecb4ac8d
|
| 3 |
+
size 3383407
|
zero_to_fp32.py
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:46497565ccf2b4a8b1f6f18c8341042f3749605a94335c81f69df1bd268af64f
|
| 3 |
+
size 33272
|