SystemAdmin123 commited on
Commit
c38e28b
·
verified ·
1 Parent(s): 3ae0bd2

Training in progress, step 200, checkpoint

Browse files
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2f2be77f4046d57162a2a1634e71c05173859bf5557783dfa12ea6e9468e051d
3
  size 723674912
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:39c3b834cf9097711f0f2aa3a630bfaed237e4d3c047f886943b7d264f08b96d
3
  size 723674912
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:19b0ef4a865592b1c1398462392fee5da43bb5d95cb04ee8282d992c017e215b
3
  size 735625370
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2174e639123eed1cb0a5141bbd6b84d6d9dc13c0802383f9c30c1c1f8eda9355
3
  size 735625370
last-checkpoint/rng_state_0.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5179acd504f9caefc428bad8368a9feed783597605227f04c17ed5843af96dfc
3
  size 15024
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8eccf36684d22a967cc11b19ade6c5b107783ceb47a439463ddecc8296fd8bf9
3
  size 15024
last-checkpoint/rng_state_1.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6d57da5f6b8845015897fecc79abf7ca6507809cfcf86ed0e80e8a671f77e231
3
  size 15024
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:32507bbe816cbd0427cff7ac83a89a718c120d506907cf5a125998e66e6121c4
3
  size 15024
last-checkpoint/rng_state_2.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c2f8edafee3984ce0824458e1123790dbcab896cab979f7abfa8851dd911b81b
3
  size 15024
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d9b81926aa60404a196dbb989a6c6ee8f1074bab84733386986ddfa2847703b0
3
  size 15024
last-checkpoint/rng_state_3.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:982ef26a1a303041dac26c15f97f86f53c622fcb36d57d2226e4c72f425873e3
3
  size 15024
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d5374c1c7c5169dac1e64e286b9ca7aa3607197c4f7671202eddd71042127d0a
3
  size 15024
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:723432e9081dffbc4dea9b11807f9120cba5ae794b58bf13637161ca198c867f
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ca9a25c72339c898b564e0c464a3f6fc75bbeec408008928b7ed05533156b98c
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 22.5,
5
  "eval_steps": 20,
6
- "global_step": 180,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -213,6 +213,28 @@
213
  "eval_samples_per_second": 300.65,
214
  "eval_steps_per_second": 3.405,
215
  "step": 180
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
216
  }
217
  ],
218
  "logging_steps": 10,
@@ -227,12 +249,12 @@
227
  "should_evaluate": false,
228
  "should_log": false,
229
  "should_save": true,
230
- "should_training_stop": false
231
  },
232
  "attributes": {}
233
  }
234
  },
235
- "total_flos": 6.402489065039462e+16,
236
  "train_batch_size": 23,
237
  "trial_name": null,
238
  "trial_params": null
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 25.0,
5
  "eval_steps": 20,
6
+ "global_step": 200,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
213
  "eval_samples_per_second": 300.65,
214
  "eval_steps_per_second": 3.405,
215
  "step": 180
216
+ },
217
+ {
218
+ "epoch": 23.75,
219
+ "grad_norm": 0.146484375,
220
+ "learning_rate": 1.3638696597277679e-06,
221
+ "loss": 2.0059,
222
+ "step": 190
223
+ },
224
+ {
225
+ "epoch": 25.0,
226
+ "grad_norm": 0.1318359375,
227
+ "learning_rate": 0.0,
228
+ "loss": 2.0109,
229
+ "step": 200
230
+ },
231
+ {
232
+ "epoch": 25.0,
233
+ "eval_loss": 2.0673062801361084,
234
+ "eval_runtime": 4.8758,
235
+ "eval_samples_per_second": 307.844,
236
+ "eval_steps_per_second": 3.487,
237
+ "step": 200
238
  }
239
  ],
240
  "logging_steps": 10,
 
249
  "should_evaluate": false,
250
  "should_log": false,
251
  "should_save": true,
252
+ "should_training_stop": true
253
  },
254
  "attributes": {}
255
  }
256
  },
257
+ "total_flos": 7.113876738932736e+16,
258
  "train_batch_size": 23,
259
  "trial_name": null,
260
  "trial_params": null