Training in progress, step 18, checkpoint

Files changed (5) hide show

last-checkpoint/adapter_model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:c8d90ce71f70e4548f934bee353d1b76d22f88668d5dc88df6b122b99885648d
 size 41581360

 version https://git-lfs.github.com/spec/v1
+oid sha256:9679997ddbdf0aaf7627479ba9934040206c7023c174467ec71ba915828794d9
 size 41581360

last-checkpoint/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:7281aaafd558e1d7307161de63ee215d13e38d97d952cac2edcc6415584af2b9
 size 21505540

 version https://git-lfs.github.com/spec/v1
+oid sha256:9040522376779c7a31146707300519e8d7d39213046e9f2cf4bbc480fe1e61aa
 size 21505540

last-checkpoint/rng_state.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:e81704244b251f91bf02d5375a081f6de3b738df32dce1d0130102aaca80ece0
 size 14244

 version https://git-lfs.github.com/spec/v1
+oid sha256:63236f8023b6c36bd0a9ae3afc0a7c5229575e92a00da93efffa78dfd33bdc3d
 size 14244

last-checkpoint/scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:e555b1173ceea1f11ca45539c0fe5856e7571df97c436cc742ba6deb19b07e97
 size 1064

 version https://git-lfs.github.com/spec/v1
+oid sha256:fd82e2c4dd46a0c4163e78a1bb05a9e321fb40a1c884136f2f4f92fe2449cbde
 size 1064

last-checkpoint/trainer_state.json CHANGED Viewed

@@ -1,9 +1,9 @@
 {
   "best_metric": null,
   "best_model_checkpoint": null,
-  "epoch": 0.8759124087591241,
   "eval_steps": 4,
-  "global_step": 15,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
@@ -46,6 +46,14 @@
       "eval_samples_per_second": 33.624,
       "eval_steps_per_second": 4.348,
       "step": 12
     }
   ],
   "logging_steps": 10,
@@ -60,12 +68,12 @@
         "should_evaluate": false,
         "should_log": false,
         "should_save": true,
-        "should_training_stop": false
       },
       "attributes": {}
     }
   },
-  "total_flos": 1.2352404068499456e+16,
   "train_batch_size": 8,
   "trial_name": null,
   "trial_params": null

 {
   "best_metric": null,
   "best_model_checkpoint": null,
+  "epoch": 1.051094890510949,
   "eval_steps": 4,
+  "global_step": 18,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
       "eval_samples_per_second": 33.624,
       "eval_steps_per_second": 4.348,
       "step": 12
+    },
+    {
+      "epoch": 0.9343065693430657,
+      "eval_loss": 1.3059964179992676,
+      "eval_runtime": 3.4569,
+      "eval_samples_per_second": 33.556,
+      "eval_steps_per_second": 4.339,
+      "step": 16
     }
   ],
   "logging_steps": 10,
         "should_evaluate": false,
         "should_log": false,
         "should_save": true,
+        "should_training_stop": true
       },
       "attributes": {}
     }
   },
+  "total_flos": 1.4902900455112704e+16,
   "train_batch_size": 8,
   "trial_name": null,
   "trial_params": null