AnzeXie committed on
Commit
4feb7f1
·
verified ·
1 Parent(s): 63c8ab9

Upload folder using huggingface_hub

Browse files
This view is limited to 50 files because it contains too many changes. See raw diff
Files changed (50) hide show
  1. .gitattributes +1 -0
  2. added_tokens.json +24 -0
  3. config.json +28 -0
  4. generation_config.json +15 -0
  5. global_step80/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt +3 -0
  6. global_step80/bf16_zero_pp_rank_100_mp_rank_00_optim_states.pt +3 -0
  7. global_step80/bf16_zero_pp_rank_101_mp_rank_00_optim_states.pt +3 -0
  8. global_step80/bf16_zero_pp_rank_102_mp_rank_00_optim_states.pt +3 -0
  9. global_step80/bf16_zero_pp_rank_103_mp_rank_00_optim_states.pt +3 -0
  10. global_step80/bf16_zero_pp_rank_104_mp_rank_00_optim_states.pt +3 -0
  11. global_step80/bf16_zero_pp_rank_105_mp_rank_00_optim_states.pt +3 -0
  12. global_step80/bf16_zero_pp_rank_106_mp_rank_00_optim_states.pt +3 -0
  13. global_step80/bf16_zero_pp_rank_107_mp_rank_00_optim_states.pt +3 -0
  14. global_step80/bf16_zero_pp_rank_108_mp_rank_00_optim_states.pt +3 -0
  15. global_step80/bf16_zero_pp_rank_109_mp_rank_00_optim_states.pt +3 -0
  16. global_step80/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt +3 -0
  17. global_step80/bf16_zero_pp_rank_110_mp_rank_00_optim_states.pt +3 -0
  18. global_step80/bf16_zero_pp_rank_111_mp_rank_00_optim_states.pt +3 -0
  19. global_step80/bf16_zero_pp_rank_112_mp_rank_00_optim_states.pt +3 -0
  20. global_step80/bf16_zero_pp_rank_113_mp_rank_00_optim_states.pt +3 -0
  21. global_step80/bf16_zero_pp_rank_114_mp_rank_00_optim_states.pt +3 -0
  22. global_step80/bf16_zero_pp_rank_115_mp_rank_00_optim_states.pt +3 -0
  23. global_step80/bf16_zero_pp_rank_116_mp_rank_00_optim_states.pt +3 -0
  24. global_step80/bf16_zero_pp_rank_117_mp_rank_00_optim_states.pt +3 -0
  25. global_step80/bf16_zero_pp_rank_118_mp_rank_00_optim_states.pt +3 -0
  26. global_step80/bf16_zero_pp_rank_119_mp_rank_00_optim_states.pt +3 -0
  27. global_step80/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt +3 -0
  28. global_step80/bf16_zero_pp_rank_120_mp_rank_00_optim_states.pt +3 -0
  29. global_step80/bf16_zero_pp_rank_121_mp_rank_00_optim_states.pt +3 -0
  30. global_step80/bf16_zero_pp_rank_122_mp_rank_00_optim_states.pt +3 -0
  31. global_step80/bf16_zero_pp_rank_123_mp_rank_00_optim_states.pt +3 -0
  32. global_step80/bf16_zero_pp_rank_124_mp_rank_00_optim_states.pt +3 -0
  33. global_step80/bf16_zero_pp_rank_125_mp_rank_00_optim_states.pt +3 -0
  34. global_step80/bf16_zero_pp_rank_126_mp_rank_00_optim_states.pt +3 -0
  35. global_step80/bf16_zero_pp_rank_127_mp_rank_00_optim_states.pt +3 -0
  36. global_step80/bf16_zero_pp_rank_128_mp_rank_00_optim_states.pt +3 -0
  37. global_step80/bf16_zero_pp_rank_129_mp_rank_00_optim_states.pt +3 -0
  38. global_step80/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt +3 -0
  39. global_step80/bf16_zero_pp_rank_130_mp_rank_00_optim_states.pt +3 -0
  40. global_step80/bf16_zero_pp_rank_131_mp_rank_00_optim_states.pt +3 -0
  41. global_step80/bf16_zero_pp_rank_132_mp_rank_00_optim_states.pt +3 -0
  42. global_step80/bf16_zero_pp_rank_133_mp_rank_00_optim_states.pt +3 -0
  43. global_step80/bf16_zero_pp_rank_134_mp_rank_00_optim_states.pt +3 -0
  44. global_step80/bf16_zero_pp_rank_135_mp_rank_00_optim_states.pt +3 -0
  45. global_step80/bf16_zero_pp_rank_136_mp_rank_00_optim_states.pt +3 -0
  46. global_step80/bf16_zero_pp_rank_137_mp_rank_00_optim_states.pt +3 -0
  47. global_step80/bf16_zero_pp_rank_138_mp_rank_00_optim_states.pt +3 -0
  48. global_step80/bf16_zero_pp_rank_139_mp_rank_00_optim_states.pt +3 -0
  49. global_step80/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt +3 -0
  50. global_step80/bf16_zero_pp_rank_140_mp_rank_00_optim_states.pt +3 -0
.gitattributes CHANGED
@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ tokenizer.json filter=lfs diff=lfs merge=lfs -text
added_tokens.json ADDED
@@ -0,0 +1,24 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "</tool_call>": 151658,
3
+ "<tool_call>": 151657,
4
+ "<|box_end|>": 151649,
5
+ "<|box_start|>": 151648,
6
+ "<|endoftext|>": 151643,
7
+ "<|file_sep|>": 151664,
8
+ "<|fim_middle|>": 151660,
9
+ "<|fim_pad|>": 151662,
10
+ "<|fim_prefix|>": 151659,
11
+ "<|fim_suffix|>": 151661,
12
+ "<|im_end|>": 151645,
13
+ "<|im_start|>": 151644,
14
+ "<|image_pad|>": 151655,
15
+ "<|object_ref_end|>": 151647,
16
+ "<|object_ref_start|>": 151646,
17
+ "<|quad_end|>": 151651,
18
+ "<|quad_start|>": 151650,
19
+ "<|repo_name|>": 151663,
20
+ "<|video_pad|>": 151656,
21
+ "<|vision_end|>": 151653,
22
+ "<|vision_pad|>": 151654,
23
+ "<|vision_start|>": 151652
24
+ }
config.json ADDED
@@ -0,0 +1,28 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "architectures": [
3
+ "Qwen2ForCausalLM"
4
+ ],
5
+ "attention_dropout": 0.0,
6
+ "bos_token_id": 151643,
7
+ "eos_token_id": 151645,
8
+ "hidden_act": "silu",
9
+ "hidden_size": 8192,
10
+ "initializer_range": 0.02,
11
+ "intermediate_size": 29568,
12
+ "max_position_embeddings": 32768,
13
+ "max_window_layers": 70,
14
+ "model_type": "qwen2",
15
+ "num_attention_heads": 64,
16
+ "num_hidden_layers": 80,
17
+ "num_key_value_heads": 8,
18
+ "rms_norm_eps": 1e-06,
19
+ "rope_scaling": null,
20
+ "rope_theta": 1000000.0,
21
+ "sliding_window": 131072,
22
+ "tie_word_embeddings": false,
23
+ "torch_dtype": "bfloat16",
24
+ "transformers_version": "4.51.3",
25
+ "use_cache": false,
26
+ "use_sliding_window": false,
27
+ "vocab_size": 152064
28
+ }
generation_config.json ADDED
@@ -0,0 +1,15 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "bos_token_id": 151643,
3
+ "do_sample": true,
4
+ "eos_token_id": [
5
+ 151645,
6
+ 151643
7
+ ],
8
+ "max_new_tokens": 32768,
9
+ "pad_token_id": 151643,
10
+ "repetition_penalty": 1.05,
11
+ "temperature": 0.7,
12
+ "top_k": 20,
13
+ "top_p": 0.8,
14
+ "transformers_version": "4.51.3"
15
+ }
global_step80/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e4ae143a17349aec4001bf9805fb661581098265562d4153376b647b73f0b944
3
+ size 1704056752
global_step80/bf16_zero_pp_rank_100_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:33791f8bcc5b7ba843d4a71a129c32c7937b74b62c95f8c79287aea47855698e
3
+ size 1704056776
global_step80/bf16_zero_pp_rank_101_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:92df70dbc7835ba55e730e988a5025e8f3ab531456705d34ca50f322ea36b2c8
3
+ size 1704056776
global_step80/bf16_zero_pp_rank_102_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c414d166e484a5e303b01c4b2b86acafda89c1cdf933b5f35b0ab32292456b46
3
+ size 1704056776
global_step80/bf16_zero_pp_rank_103_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3487ec1d943472b6e055470a58f451973e1ca5b803da980862e5ea23d84cd47c
3
+ size 1704056776
global_step80/bf16_zero_pp_rank_104_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ccd0e91915dc94b5f3dc809d6a342bf5a137eda8c44f45ae9e450bc32360349e
3
+ size 1704056776
global_step80/bf16_zero_pp_rank_105_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:92b43c774df7ea403b2f2e5434ddcd53b40897d9dcfe287892efcc6a1ca792a8
3
+ size 1704056776
global_step80/bf16_zero_pp_rank_106_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3fb6fa076c14d3c02412cc07dcec4134b15e32832c2c80c26f610ef0df0055f5
3
+ size 1704056776
global_step80/bf16_zero_pp_rank_107_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6a43ff64d71eef91f13176b57e83e4673e9c487ab59d79c0b9105b017194d305
3
+ size 1704056776
global_step80/bf16_zero_pp_rank_108_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:239ea10e979bc072e4ea3b92009f67c903af7cd47c34505d96deeb3453315375
3
+ size 1704056776
global_step80/bf16_zero_pp_rank_109_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:39ceee2a1168bf686a11011fbb3615286dbee8de86b4cc2eb5684a6e3ff96b9a
3
+ size 1704056776
global_step80/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:29695fbcd3e5bc21cd4e543f5782022012a71222798f4b14261c3ed429b22c22
3
+ size 1704056764
global_step80/bf16_zero_pp_rank_110_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:621e52aa7cda3521f9af9a8ec444318697e7c4bd0af85988efca36868e534e89
3
+ size 1704056776
global_step80/bf16_zero_pp_rank_111_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6193e11932ddcb4ccfb8118c73cb600cbf065f01614a3418ca6c32993ff9c59a
3
+ size 1704056776
global_step80/bf16_zero_pp_rank_112_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:000169c6abb3b28d50b4069b85e5b5e54a0b2af9aacaedbe27250a0c6e03cc5b
3
+ size 1704056776
global_step80/bf16_zero_pp_rank_113_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a69239313cc031d3a9b96f4ca3088feb191dc0d5513656a2b16adabc4fb1e978
3
+ size 1704056776
global_step80/bf16_zero_pp_rank_114_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7192f44be1b8455c06f68603ae5104faf24cec9a286483e6510005b10ef9abbd
3
+ size 1704056776
global_step80/bf16_zero_pp_rank_115_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:152fa8701e57ee3cdbc120b1a672d2faa9877b246ba3ecbc665ab8a57710b09f
3
+ size 1704056776
global_step80/bf16_zero_pp_rank_116_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6ca53bc9a9020cbf12f2cf769da605668fb4c90a3b37fa8bfb4d7c32f6480ed2
3
+ size 1704056776
global_step80/bf16_zero_pp_rank_117_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0f69557aaccb00cb89cc1b0fcf15a7b5ad742342558846e7114548f89459f671
3
+ size 1704056776
global_step80/bf16_zero_pp_rank_118_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:aea1dbbd7c99c75ae4000523070125324c2a48649ae559ccf78c565ada4cb19b
3
+ size 1704056776
global_step80/bf16_zero_pp_rank_119_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1954373b458e2af404c05aac9796f97d3e973005730b3204629ce9a476e93319
3
+ size 1704056776
global_step80/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ba49f2daa2ce0e5c8ff50792829a60b06a059424ae333c7162684fd2706f5b37
3
+ size 1704056764
global_step80/bf16_zero_pp_rank_120_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2a87357293e32e3ff0ba19b88412c0477fc80572da7011f8f39fd374fcb91781
3
+ size 1704056776
global_step80/bf16_zero_pp_rank_121_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:96c772c82166f81c81edf9066a4f4b9d717c37f0c91579c3ddf87b76f5ba01a9
3
+ size 1704056776
global_step80/bf16_zero_pp_rank_122_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4f6ddd68fb42eb46b1f1c4176f4de813ae1b0232bef56c28ece592e1aaac18dd
3
+ size 1704056776
global_step80/bf16_zero_pp_rank_123_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:31bbdca04fb85777bc11b61caffce29b3dce2ee5eda944b487444d944d87ddaf
3
+ size 1704056776
global_step80/bf16_zero_pp_rank_124_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:17e483e7b7b1cdfb9f961cfda93db043b33dabdcdd98a7d9a2402903d681149f
3
+ size 1704056776
global_step80/bf16_zero_pp_rank_125_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f0ae06607480b365997033e356976e8202deb1721ccc33d17112a5c6ebab6da5
3
+ size 1704056776
global_step80/bf16_zero_pp_rank_126_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:45ca1730ac8e04bdf959183a2e010a9fba0a1ad4f03a1cb967c4604c3a73d12e
3
+ size 1704056776
global_step80/bf16_zero_pp_rank_127_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1caca6bfce645be876b06d200f175296135af7f4ec361f6f7a7c3658f1a47988
3
+ size 1704056776
global_step80/bf16_zero_pp_rank_128_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d23ae3800b37a1dd42b71f565a1029f1bb622d58540c2423b236ddffd13249a4
3
+ size 1704056776
global_step80/bf16_zero_pp_rank_129_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b55c7d279834a021d171658d2e6b5bf00538d4a767da43bd6de0d3e4d1a7a44e
3
+ size 1704056776
global_step80/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b152be49a276a03377ad8cb29bbbbb1355f88e76f4f151b30b6ffba2fc21ff06
3
+ size 1704056764
global_step80/bf16_zero_pp_rank_130_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e37dc290c4a33bbfb8b0406df1123b2a7e88f10e9a2a65e1529298a2e218ebf5
3
+ size 1704056776
global_step80/bf16_zero_pp_rank_131_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6603aade3025a15e9f3ccd9c01d9af84d8f1bf6c643e67a784df3555a4225a99
3
+ size 1704056776
global_step80/bf16_zero_pp_rank_132_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:281308d01eea8c231e91c8b6638f43b0d5e5db708f056b85a1a5f917f8cb4bf8
3
+ size 1704056776
global_step80/bf16_zero_pp_rank_133_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:500a1a498ec590c95e21f7a55a1235172043dea0a18fda43ae4118777da9c96d
3
+ size 1704056776
global_step80/bf16_zero_pp_rank_134_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9691d12641e701d7bbaa7f6277570e01c7038d9f36ae3ac1a1562d0603a6bf3e
3
+ size 1704056776
global_step80/bf16_zero_pp_rank_135_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:daf77c22dc00d6b3589b1bfc5f1c67784f6c5319cfe0a81e3c82b3555ba58b80
3
+ size 1704056776
global_step80/bf16_zero_pp_rank_136_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:beffaf00d5ab779d31d41c3c477f13cb9f2fce6a9fe1a3710a9789e65826ee1c
3
+ size 1704056776
global_step80/bf16_zero_pp_rank_137_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:745b892c34c9dedfc9c8bf4c51972295da5d6fe6f72694b4e38e5adfaeedcb32
3
+ size 1704056776
global_step80/bf16_zero_pp_rank_138_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c6545bd2f46e844f0983c163a3d8a1d10e57d89ddfece7bfac884366eec919f1
3
+ size 1704056776
global_step80/bf16_zero_pp_rank_139_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:feed46c7aebff3ae707691d4d332d9e040966d923bac452a2b3669d9a4909409
3
+ size 1704056776
global_step80/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:60a93f5af1f742072182582c9ea24b77ffd4caaddcf6fa44a2379869133598c0
3
+ size 1704056764
global_step80/bf16_zero_pp_rank_140_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:41c686f536d116c6df82572b12c6900f1f6bcdf0677170a57be1b9c8c4674c2d
3
+ size 1704056776