Upload folder using huggingface_hub
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- .gitattributes +1 -0
- added_tokens.json +24 -0
- config.json +28 -0
- generation_config.json +15 -0
- global_step80/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt +3 -0
- global_step80/bf16_zero_pp_rank_100_mp_rank_00_optim_states.pt +3 -0
- global_step80/bf16_zero_pp_rank_101_mp_rank_00_optim_states.pt +3 -0
- global_step80/bf16_zero_pp_rank_102_mp_rank_00_optim_states.pt +3 -0
- global_step80/bf16_zero_pp_rank_103_mp_rank_00_optim_states.pt +3 -0
- global_step80/bf16_zero_pp_rank_104_mp_rank_00_optim_states.pt +3 -0
- global_step80/bf16_zero_pp_rank_105_mp_rank_00_optim_states.pt +3 -0
- global_step80/bf16_zero_pp_rank_106_mp_rank_00_optim_states.pt +3 -0
- global_step80/bf16_zero_pp_rank_107_mp_rank_00_optim_states.pt +3 -0
- global_step80/bf16_zero_pp_rank_108_mp_rank_00_optim_states.pt +3 -0
- global_step80/bf16_zero_pp_rank_109_mp_rank_00_optim_states.pt +3 -0
- global_step80/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt +3 -0
- global_step80/bf16_zero_pp_rank_110_mp_rank_00_optim_states.pt +3 -0
- global_step80/bf16_zero_pp_rank_111_mp_rank_00_optim_states.pt +3 -0
- global_step80/bf16_zero_pp_rank_112_mp_rank_00_optim_states.pt +3 -0
- global_step80/bf16_zero_pp_rank_113_mp_rank_00_optim_states.pt +3 -0
- global_step80/bf16_zero_pp_rank_114_mp_rank_00_optim_states.pt +3 -0
- global_step80/bf16_zero_pp_rank_115_mp_rank_00_optim_states.pt +3 -0
- global_step80/bf16_zero_pp_rank_116_mp_rank_00_optim_states.pt +3 -0
- global_step80/bf16_zero_pp_rank_117_mp_rank_00_optim_states.pt +3 -0
- global_step80/bf16_zero_pp_rank_118_mp_rank_00_optim_states.pt +3 -0
- global_step80/bf16_zero_pp_rank_119_mp_rank_00_optim_states.pt +3 -0
- global_step80/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt +3 -0
- global_step80/bf16_zero_pp_rank_120_mp_rank_00_optim_states.pt +3 -0
- global_step80/bf16_zero_pp_rank_121_mp_rank_00_optim_states.pt +3 -0
- global_step80/bf16_zero_pp_rank_122_mp_rank_00_optim_states.pt +3 -0
- global_step80/bf16_zero_pp_rank_123_mp_rank_00_optim_states.pt +3 -0
- global_step80/bf16_zero_pp_rank_124_mp_rank_00_optim_states.pt +3 -0
- global_step80/bf16_zero_pp_rank_125_mp_rank_00_optim_states.pt +3 -0
- global_step80/bf16_zero_pp_rank_126_mp_rank_00_optim_states.pt +3 -0
- global_step80/bf16_zero_pp_rank_127_mp_rank_00_optim_states.pt +3 -0
- global_step80/bf16_zero_pp_rank_128_mp_rank_00_optim_states.pt +3 -0
- global_step80/bf16_zero_pp_rank_129_mp_rank_00_optim_states.pt +3 -0
- global_step80/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt +3 -0
- global_step80/bf16_zero_pp_rank_130_mp_rank_00_optim_states.pt +3 -0
- global_step80/bf16_zero_pp_rank_131_mp_rank_00_optim_states.pt +3 -0
- global_step80/bf16_zero_pp_rank_132_mp_rank_00_optim_states.pt +3 -0
- global_step80/bf16_zero_pp_rank_133_mp_rank_00_optim_states.pt +3 -0
- global_step80/bf16_zero_pp_rank_134_mp_rank_00_optim_states.pt +3 -0
- global_step80/bf16_zero_pp_rank_135_mp_rank_00_optim_states.pt +3 -0
- global_step80/bf16_zero_pp_rank_136_mp_rank_00_optim_states.pt +3 -0
- global_step80/bf16_zero_pp_rank_137_mp_rank_00_optim_states.pt +3 -0
- global_step80/bf16_zero_pp_rank_138_mp_rank_00_optim_states.pt +3 -0
- global_step80/bf16_zero_pp_rank_139_mp_rank_00_optim_states.pt +3 -0
- global_step80/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt +3 -0
- global_step80/bf16_zero_pp_rank_140_mp_rank_00_optim_states.pt +3 -0
.gitattributes
CHANGED
@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
|
|
33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
|
|
|
33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
36 |
+
tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
added_tokens.json
ADDED
@@ -0,0 +1,24 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"</tool_call>": 151658,
|
3 |
+
"<tool_call>": 151657,
|
4 |
+
"<|box_end|>": 151649,
|
5 |
+
"<|box_start|>": 151648,
|
6 |
+
"<|endoftext|>": 151643,
|
7 |
+
"<|file_sep|>": 151664,
|
8 |
+
"<|fim_middle|>": 151660,
|
9 |
+
"<|fim_pad|>": 151662,
|
10 |
+
"<|fim_prefix|>": 151659,
|
11 |
+
"<|fim_suffix|>": 151661,
|
12 |
+
"<|im_end|>": 151645,
|
13 |
+
"<|im_start|>": 151644,
|
14 |
+
"<|image_pad|>": 151655,
|
15 |
+
"<|object_ref_end|>": 151647,
|
16 |
+
"<|object_ref_start|>": 151646,
|
17 |
+
"<|quad_end|>": 151651,
|
18 |
+
"<|quad_start|>": 151650,
|
19 |
+
"<|repo_name|>": 151663,
|
20 |
+
"<|video_pad|>": 151656,
|
21 |
+
"<|vision_end|>": 151653,
|
22 |
+
"<|vision_pad|>": 151654,
|
23 |
+
"<|vision_start|>": 151652
|
24 |
+
}
|
config.json
ADDED
@@ -0,0 +1,28 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"architectures": [
|
3 |
+
"Qwen2ForCausalLM"
|
4 |
+
],
|
5 |
+
"attention_dropout": 0.0,
|
6 |
+
"bos_token_id": 151643,
|
7 |
+
"eos_token_id": 151645,
|
8 |
+
"hidden_act": "silu",
|
9 |
+
"hidden_size": 8192,
|
10 |
+
"initializer_range": 0.02,
|
11 |
+
"intermediate_size": 29568,
|
12 |
+
"max_position_embeddings": 32768,
|
13 |
+
"max_window_layers": 70,
|
14 |
+
"model_type": "qwen2",
|
15 |
+
"num_attention_heads": 64,
|
16 |
+
"num_hidden_layers": 80,
|
17 |
+
"num_key_value_heads": 8,
|
18 |
+
"rms_norm_eps": 1e-06,
|
19 |
+
"rope_scaling": null,
|
20 |
+
"rope_theta": 1000000.0,
|
21 |
+
"sliding_window": 131072,
|
22 |
+
"tie_word_embeddings": false,
|
23 |
+
"torch_dtype": "bfloat16",
|
24 |
+
"transformers_version": "4.51.3",
|
25 |
+
"use_cache": false,
|
26 |
+
"use_sliding_window": false,
|
27 |
+
"vocab_size": 152064
|
28 |
+
}
|
generation_config.json
ADDED
@@ -0,0 +1,15 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"bos_token_id": 151643,
|
3 |
+
"do_sample": true,
|
4 |
+
"eos_token_id": [
|
5 |
+
151645,
|
6 |
+
151643
|
7 |
+
],
|
8 |
+
"max_new_tokens": 32768,
|
9 |
+
"pad_token_id": 151643,
|
10 |
+
"repetition_penalty": 1.05,
|
11 |
+
"temperature": 0.7,
|
12 |
+
"top_k": 20,
|
13 |
+
"top_p": 0.8,
|
14 |
+
"transformers_version": "4.51.3"
|
15 |
+
}
|
global_step80/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e4ae143a17349aec4001bf9805fb661581098265562d4153376b647b73f0b944
|
3 |
+
size 1704056752
|
global_step80/bf16_zero_pp_rank_100_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:33791f8bcc5b7ba843d4a71a129c32c7937b74b62c95f8c79287aea47855698e
|
3 |
+
size 1704056776
|
global_step80/bf16_zero_pp_rank_101_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:92df70dbc7835ba55e730e988a5025e8f3ab531456705d34ca50f322ea36b2c8
|
3 |
+
size 1704056776
|
global_step80/bf16_zero_pp_rank_102_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c414d166e484a5e303b01c4b2b86acafda89c1cdf933b5f35b0ab32292456b46
|
3 |
+
size 1704056776
|
global_step80/bf16_zero_pp_rank_103_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3487ec1d943472b6e055470a58f451973e1ca5b803da980862e5ea23d84cd47c
|
3 |
+
size 1704056776
|
global_step80/bf16_zero_pp_rank_104_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ccd0e91915dc94b5f3dc809d6a342bf5a137eda8c44f45ae9e450bc32360349e
|
3 |
+
size 1704056776
|
global_step80/bf16_zero_pp_rank_105_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:92b43c774df7ea403b2f2e5434ddcd53b40897d9dcfe287892efcc6a1ca792a8
|
3 |
+
size 1704056776
|
global_step80/bf16_zero_pp_rank_106_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3fb6fa076c14d3c02412cc07dcec4134b15e32832c2c80c26f610ef0df0055f5
|
3 |
+
size 1704056776
|
global_step80/bf16_zero_pp_rank_107_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6a43ff64d71eef91f13176b57e83e4673e9c487ab59d79c0b9105b017194d305
|
3 |
+
size 1704056776
|
global_step80/bf16_zero_pp_rank_108_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:239ea10e979bc072e4ea3b92009f67c903af7cd47c34505d96deeb3453315375
|
3 |
+
size 1704056776
|
global_step80/bf16_zero_pp_rank_109_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:39ceee2a1168bf686a11011fbb3615286dbee8de86b4cc2eb5684a6e3ff96b9a
|
3 |
+
size 1704056776
|
global_step80/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:29695fbcd3e5bc21cd4e543f5782022012a71222798f4b14261c3ed429b22c22
|
3 |
+
size 1704056764
|
global_step80/bf16_zero_pp_rank_110_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:621e52aa7cda3521f9af9a8ec444318697e7c4bd0af85988efca36868e534e89
|
3 |
+
size 1704056776
|
global_step80/bf16_zero_pp_rank_111_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6193e11932ddcb4ccfb8118c73cb600cbf065f01614a3418ca6c32993ff9c59a
|
3 |
+
size 1704056776
|
global_step80/bf16_zero_pp_rank_112_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:000169c6abb3b28d50b4069b85e5b5e54a0b2af9aacaedbe27250a0c6e03cc5b
|
3 |
+
size 1704056776
|
global_step80/bf16_zero_pp_rank_113_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a69239313cc031d3a9b96f4ca3088feb191dc0d5513656a2b16adabc4fb1e978
|
3 |
+
size 1704056776
|
global_step80/bf16_zero_pp_rank_114_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7192f44be1b8455c06f68603ae5104faf24cec9a286483e6510005b10ef9abbd
|
3 |
+
size 1704056776
|
global_step80/bf16_zero_pp_rank_115_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:152fa8701e57ee3cdbc120b1a672d2faa9877b246ba3ecbc665ab8a57710b09f
|
3 |
+
size 1704056776
|
global_step80/bf16_zero_pp_rank_116_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6ca53bc9a9020cbf12f2cf769da605668fb4c90a3b37fa8bfb4d7c32f6480ed2
|
3 |
+
size 1704056776
|
global_step80/bf16_zero_pp_rank_117_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0f69557aaccb00cb89cc1b0fcf15a7b5ad742342558846e7114548f89459f671
|
3 |
+
size 1704056776
|
global_step80/bf16_zero_pp_rank_118_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:aea1dbbd7c99c75ae4000523070125324c2a48649ae559ccf78c565ada4cb19b
|
3 |
+
size 1704056776
|
global_step80/bf16_zero_pp_rank_119_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1954373b458e2af404c05aac9796f97d3e973005730b3204629ce9a476e93319
|
3 |
+
size 1704056776
|
global_step80/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ba49f2daa2ce0e5c8ff50792829a60b06a059424ae333c7162684fd2706f5b37
|
3 |
+
size 1704056764
|
global_step80/bf16_zero_pp_rank_120_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2a87357293e32e3ff0ba19b88412c0477fc80572da7011f8f39fd374fcb91781
|
3 |
+
size 1704056776
|
global_step80/bf16_zero_pp_rank_121_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:96c772c82166f81c81edf9066a4f4b9d717c37f0c91579c3ddf87b76f5ba01a9
|
3 |
+
size 1704056776
|
global_step80/bf16_zero_pp_rank_122_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4f6ddd68fb42eb46b1f1c4176f4de813ae1b0232bef56c28ece592e1aaac18dd
|
3 |
+
size 1704056776
|
global_step80/bf16_zero_pp_rank_123_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:31bbdca04fb85777bc11b61caffce29b3dce2ee5eda944b487444d944d87ddaf
|
3 |
+
size 1704056776
|
global_step80/bf16_zero_pp_rank_124_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:17e483e7b7b1cdfb9f961cfda93db043b33dabdcdd98a7d9a2402903d681149f
|
3 |
+
size 1704056776
|
global_step80/bf16_zero_pp_rank_125_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f0ae06607480b365997033e356976e8202deb1721ccc33d17112a5c6ebab6da5
|
3 |
+
size 1704056776
|
global_step80/bf16_zero_pp_rank_126_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:45ca1730ac8e04bdf959183a2e010a9fba0a1ad4f03a1cb967c4604c3a73d12e
|
3 |
+
size 1704056776
|
global_step80/bf16_zero_pp_rank_127_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1caca6bfce645be876b06d200f175296135af7f4ec361f6f7a7c3658f1a47988
|
3 |
+
size 1704056776
|
global_step80/bf16_zero_pp_rank_128_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d23ae3800b37a1dd42b71f565a1029f1bb622d58540c2423b236ddffd13249a4
|
3 |
+
size 1704056776
|
global_step80/bf16_zero_pp_rank_129_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b55c7d279834a021d171658d2e6b5bf00538d4a767da43bd6de0d3e4d1a7a44e
|
3 |
+
size 1704056776
|
global_step80/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b152be49a276a03377ad8cb29bbbbb1355f88e76f4f151b30b6ffba2fc21ff06
|
3 |
+
size 1704056764
|
global_step80/bf16_zero_pp_rank_130_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e37dc290c4a33bbfb8b0406df1123b2a7e88f10e9a2a65e1529298a2e218ebf5
|
3 |
+
size 1704056776
|
global_step80/bf16_zero_pp_rank_131_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6603aade3025a15e9f3ccd9c01d9af84d8f1bf6c643e67a784df3555a4225a99
|
3 |
+
size 1704056776
|
global_step80/bf16_zero_pp_rank_132_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:281308d01eea8c231e91c8b6638f43b0d5e5db708f056b85a1a5f917f8cb4bf8
|
3 |
+
size 1704056776
|
global_step80/bf16_zero_pp_rank_133_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:500a1a498ec590c95e21f7a55a1235172043dea0a18fda43ae4118777da9c96d
|
3 |
+
size 1704056776
|
global_step80/bf16_zero_pp_rank_134_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9691d12641e701d7bbaa7f6277570e01c7038d9f36ae3ac1a1562d0603a6bf3e
|
3 |
+
size 1704056776
|
global_step80/bf16_zero_pp_rank_135_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:daf77c22dc00d6b3589b1bfc5f1c67784f6c5319cfe0a81e3c82b3555ba58b80
|
3 |
+
size 1704056776
|
global_step80/bf16_zero_pp_rank_136_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:beffaf00d5ab779d31d41c3c477f13cb9f2fce6a9fe1a3710a9789e65826ee1c
|
3 |
+
size 1704056776
|
global_step80/bf16_zero_pp_rank_137_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:745b892c34c9dedfc9c8bf4c51972295da5d6fe6f72694b4e38e5adfaeedcb32
|
3 |
+
size 1704056776
|
global_step80/bf16_zero_pp_rank_138_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c6545bd2f46e844f0983c163a3d8a1d10e57d89ddfece7bfac884366eec919f1
|
3 |
+
size 1704056776
|
global_step80/bf16_zero_pp_rank_139_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:feed46c7aebff3ae707691d4d332d9e040966d923bac452a2b3669d9a4909409
|
3 |
+
size 1704056776
|
global_step80/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:60a93f5af1f742072182582c9ea24b77ffd4caaddcf6fa44a2379869133598c0
|
3 |
+
size 1704056764
|
global_step80/bf16_zero_pp_rank_140_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:41c686f536d116c6df82572b12c6900f1f6bcdf0677170a57be1b9c8c4674c2d
|
3 |
+
size 1704056776
|