SystemAdmin123 committed on
Commit
b5b5894
·
verified ·
1 Parent(s): 18bf1e1

Training in progress, step 20, checkpoint

Browse files
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a6afd96f0a4efb226214a2f98fc2930b95faa7d2409bdbba1791318c01e36cad
3
  size 250490408
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b50fab4df0857296b826fb533679d67b419acccbace03eded5bcde6b1019ad70
3
  size 250490408
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9766749cabbd0fe5ad2cb84cb5b1e21a853eda9b1ed07a7c96fd6bf1b05d3c04
3
  size 255265850
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e5236e7bb1e866cd6476e6e3665a868ca0c865cc4d75c0b8f33b968041717090
3
  size 255265850
last-checkpoint/rng_state_0.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0676c143653a967526628bc2f1d4644cea97dd18a780321d518070502832502d
3
  size 15024
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1f0cd92d44290d6f6688c3ebd219b1a8e16a4fb3fc40ddaf684cb9273335ba6e
3
  size 15024
last-checkpoint/rng_state_1.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:465d2d2aca677e6044b1b9bb8917a886a23650c3ce9b3ee9246d24ecb5324a05
3
  size 15024
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8a20a1acb52cc6e9c17e6c90786f46e7d0ce02edfc6be15f78dd6f0e42dd5db2
3
  size 15024
last-checkpoint/rng_state_2.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c747745535681b443a3cae9777675e8f1d7f8e4fdcc2e923572fbc2e7ee62ede
3
  size 15024
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:671e391807b0ab9b289ecea768661c20458f82abb5fff2f5b02536860d7df3aa
3
  size 15024
last-checkpoint/rng_state_3.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d9410529b5a855657bd3a08b9e2887f922f2b19dd1ea9123054c798d54f882e1
3
  size 15024
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:876b48ccbca60f6ef5833275c3979dd776f668d13202dfbd3055d06dd8704ebc
3
  size 15024
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3a60c7d771c1fd156acee762fba03c724cb41829a3f71df370ecd1d20b134982
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:84f22729b765b6841bd185712dd3ab8bf338866cd8396b5dce62f9950913691a
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 16.666666666666668,
5
- "eval_steps": 200,
6
- "global_step": 100,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -11,87 +11,39 @@
11
  {
12
  "epoch": 0.16666666666666666,
13
  "eval_loss": 3.2664246559143066,
14
- "eval_runtime": 5.1158,
15
- "eval_samples_per_second": 293.406,
16
- "eval_steps_per_second": 2.346,
17
  "step": 1
18
  },
19
  {
20
  "epoch": 1.6666666666666665,
21
- "grad_norm": 3.84375,
22
  "learning_rate": 0.00019863613034027224,
23
- "loss": 6.2672,
24
  "step": 10
25
  },
26
  {
27
  "epoch": 3.3333333333333335,
28
- "grad_norm": 3.5,
29
  "learning_rate": 0.0001879473751206489,
30
- "loss": 5.5486,
31
  "step": 20
32
  },
33
  {
34
- "epoch": 5.0,
35
- "grad_norm": 2.71875,
36
- "learning_rate": 0.00016772815716257412,
37
- "loss": 5.2045,
38
- "step": 30
39
- },
40
- {
41
- "epoch": 6.666666666666667,
42
- "grad_norm": 3.03125,
43
- "learning_rate": 0.00014016954246529696,
44
- "loss": 5.0295,
45
- "step": 40
46
- },
47
- {
48
- "epoch": 8.333333333333334,
49
- "grad_norm": 4.25,
50
- "learning_rate": 0.00010825793454723325,
51
- "loss": 4.8139,
52
- "step": 50
53
- },
54
- {
55
- "epoch": 10.0,
56
- "grad_norm": 2.921875,
57
- "learning_rate": 7.54514512859201e-05,
58
- "loss": 4.6461,
59
- "step": 60
60
- },
61
- {
62
- "epoch": 11.666666666666666,
63
- "grad_norm": 2.34375,
64
- "learning_rate": 4.530518418775733e-05,
65
- "loss": 4.5564,
66
- "step": 70
67
- },
68
- {
69
- "epoch": 13.333333333333334,
70
- "grad_norm": 2.265625,
71
- "learning_rate": 2.1085949060360654e-05,
72
- "loss": 4.4932,
73
- "step": 80
74
- },
75
- {
76
- "epoch": 15.0,
77
- "grad_norm": 3.28125,
78
- "learning_rate": 5.418275829936537e-06,
79
- "loss": 4.4706,
80
- "step": 90
81
- },
82
- {
83
- "epoch": 16.666666666666668,
84
- "grad_norm": 1.953125,
85
- "learning_rate": 0.0,
86
- "loss": 4.4708,
87
- "step": 100
88
  }
89
  ],
90
  "logging_steps": 10,
91
  "max_steps": 100,
92
  "num_input_tokens_seen": 0,
93
  "num_train_epochs": 17,
94
- "save_steps": 200,
95
  "stateful_callbacks": {
96
  "TrainerControl": {
97
  "args": {
@@ -99,12 +51,12 @@
99
  "should_evaluate": false,
100
  "should_log": false,
101
  "should_save": true,
102
- "should_training_stop": true
103
  },
104
  "attributes": {}
105
  }
106
  },
107
- "total_flos": 1.2971582112661504e+16,
108
  "train_batch_size": 32,
109
  "trial_name": null,
110
  "trial_params": null
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 3.3333333333333335,
5
+ "eval_steps": 20,
6
+ "global_step": 20,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
11
  {
12
  "epoch": 0.16666666666666666,
13
  "eval_loss": 3.2664246559143066,
14
+ "eval_runtime": 5.3854,
15
+ "eval_samples_per_second": 278.716,
16
+ "eval_steps_per_second": 2.228,
17
  "step": 1
18
  },
19
  {
20
  "epoch": 1.6666666666666665,
21
+ "grad_norm": 3.59375,
22
  "learning_rate": 0.00019863613034027224,
23
+ "loss": 6.2648,
24
  "step": 10
25
  },
26
  {
27
  "epoch": 3.3333333333333335,
28
+ "grad_norm": 10.5625,
29
  "learning_rate": 0.0001879473751206489,
30
+ "loss": 5.5113,
31
  "step": 20
32
  },
33
  {
34
+ "epoch": 3.3333333333333335,
35
+ "eval_loss": 3.2161271572113037,
36
+ "eval_runtime": 5.2834,
37
+ "eval_samples_per_second": 284.095,
38
+ "eval_steps_per_second": 2.271,
39
+ "step": 20
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
40
  }
41
  ],
42
  "logging_steps": 10,
43
  "max_steps": 100,
44
  "num_input_tokens_seen": 0,
45
  "num_train_epochs": 17,
46
+ "save_steps": 20,
47
  "stateful_callbacks": {
48
  "TrainerControl": {
49
  "args": {
 
51
  "should_evaluate": false,
52
  "should_log": false,
53
  "should_save": true,
54
+ "should_training_stop": false
55
  },
56
  "attributes": {}
57
  }
58
  },
59
+ "total_flos": 2598287978790912.0,
60
  "train_batch_size": 32,
61
  "trial_name": null,
62
  "trial_params": null
last-checkpoint/training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:91e32bef4fa18f7434f34b3ab9a59a991d12d4e7c7fd850b74f33c05529273df
3
  size 6840
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b1c609712c20122320b7a03274aeaded4a729690871dc722325e534970da288f
3
  size 6840