duyphu committed on
Commit
8278a57
·
verified ·
1 Parent(s): 5453501

Training in progress, step 11, checkpoint

Browse files
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:298134d4c8dffddc6bd0ca2789f713703e093aba625780c0df959e434b690184
3
  size 41459700
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5eae9b60084574f9331adbe4747545ca28607ee03a912dabed33af0ef030912a
3
  size 41459700
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8b138580fd1455e247dfc8e822f1b487e5eb2e008976b6c875eb6f11c4c9bc8e
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5bcc4d2409840b1b127474e2ae7677766647f6c0542890047c33ededad636de4
3
  size 14244
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1eca0ddb3ec890c90e8e6e7325bec40cdb8b59e4bebf5c0da8473b02809de875
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4968f693466c40cb971e90a0117e2a9be84fd1e9f8d5d00ed1cc54675e5c78ec
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 0.8372093023255814,
5
  "eval_steps": 3,
6
- "global_step": 9,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -46,6 +46,13 @@
46
  "eval_samples_per_second": 16.838,
47
  "eval_steps_per_second": 10.103,
48
  "step": 9
 
 
 
 
 
 
 
49
  }
50
  ],
51
  "logging_steps": 5,
@@ -60,12 +67,12 @@
60
  "should_evaluate": false,
61
  "should_log": false,
62
  "should_save": true,
63
- "should_training_stop": false
64
  },
65
  "attributes": {}
66
  }
67
  },
68
- "total_flos": 1568372441481216.0,
69
  "train_batch_size": 2,
70
  "trial_name": null,
71
  "trial_params": null
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 1.069767441860465,
5
  "eval_steps": 3,
6
+ "global_step": 11,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
46
  "eval_samples_per_second": 16.838,
47
  "eval_steps_per_second": 10.103,
48
  "step": 9
49
+ },
50
+ {
51
+ "epoch": 0.9302325581395349,
52
+ "grad_norm": NaN,
53
+ "learning_rate": 0.0001,
54
+ "loss": 0.0,
55
+ "step": 10
56
  }
57
  ],
58
  "logging_steps": 5,
 
67
  "should_evaluate": false,
68
  "should_log": false,
69
  "should_save": true,
70
+ "should_training_stop": true
71
  },
72
  "attributes": {}
73
  }
74
  },
75
+ "total_flos": 1916899650699264.0,
76
  "train_batch_size": 2,
77
  "trial_name": null,
78
  "trial_params": null