Training in progress, step 11000
Browse files
pytorch_model.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1527847357
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4868625229d9fb4f59be3dcf4ee4d625a4c4d8f8c962c331665c42153a7110e4
|
3 |
size 1527847357
|
run.sh
CHANGED
@@ -15,8 +15,8 @@ deepspeed run-ba.py \
|
|
15 |
--torch_compile_mode="max-autotune" \
|
16 |
--logging_steps="25" \
|
17 |
--learning_rate="3e-6" \
|
18 |
-
--max_steps="
|
19 |
-
--resume_from_checkpoint="checkpoint-
|
20 |
--output_dir="./" \
|
21 |
--per_device_train_batch_size="32" \
|
22 |
--gradient_accumulation_steps="1" \
|
|
|
15 |
--torch_compile_mode="max-autotune" \
|
16 |
--logging_steps="25" \
|
17 |
--learning_rate="3e-6" \
|
18 |
+
--max_steps="11000" \
|
19 |
+
--resume_from_checkpoint="checkpoint-10000" \
|
20 |
--output_dir="./" \
|
21 |
--per_device_train_batch_size="32" \
|
22 |
--gradient_accumulation_steps="1" \
|
runs/Dec23_11-21-18_129-146-176-120/1671794528.1170628/events.out.tfevents.1671794528.129-146-176-120.862675.1
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:91183f09174edb6bca2a73cd1d787b5148ae412a33f875166e6927fe027cff39
|
3 |
+
size 5905
|
runs/Dec23_11-21-18_129-146-176-120/events.out.tfevents.1671794528.129-146-176-120.862675.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9043e8bad25dce879a345f1d50650eb203ab4c6b86c9d66afa9ce6206857057e
|
3 |
+
size 10915
|
training_args.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4795
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:86bd2dc3474b0ea4e7cee91137714d1f7f9bf74cbda3424c891422badde5ccaf
|
3 |
size 4795
|