berkayaltntas commited on
Commit
5f19b2b
·
verified ·
1 Parent(s): 4e36c0e

Training in progress, epoch 1

Browse files
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d6049f164c1f58adc56337d7065065dbec54afb91cdaafe09656ceb9f570a673
3
  size 437958648
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:323ace2db6bab1e6e929d5b595b5250337041d498d57a05f760f17c5e956f2e4
3
  size 437958648
run-0/checkpoint-156/trainer_state.json CHANGED
@@ -1,7 +1,7 @@
1
  {
2
- "best_global_step": 78,
3
- "best_metric": 0.4729241877256318,
4
- "best_model_checkpoint": "bert-base-uncased-finetuned-rte-run_3/run-0/checkpoint-78",
5
  "epoch": 2.0,
6
  "eval_steps": 500,
7
  "global_step": 156,
@@ -11,20 +11,20 @@
11
  "log_history": [
12
  {
13
  "epoch": 1.0,
14
- "eval_accuracy": 0.4729241877256318,
15
- "eval_loss": 0.7100459933280945,
16
- "eval_runtime": 0.6584,
17
- "eval_samples_per_second": 420.731,
18
- "eval_steps_per_second": 7.594,
19
  "step": 78
20
  },
21
  {
22
  "epoch": 2.0,
23
- "eval_accuracy": 0.4693140794223827,
24
- "eval_loss": 0.7023970484733582,
25
- "eval_runtime": 0.6667,
26
- "eval_samples_per_second": 415.458,
27
- "eval_steps_per_second": 7.499,
28
  "step": 156
29
  }
30
  ],
@@ -49,9 +49,9 @@
49
  "train_batch_size": 32,
50
  "trial_name": null,
51
  "trial_params": {
52
- "classifier_dropout": 0.4312273582787619,
53
- "learning_rate": 2.007242870680699e-06,
54
- "max_length": 256,
55
  "num_train_epochs": 3,
56
  "per_device_train_batch_size": 32
57
  }
 
1
  {
2
+ "best_global_step": 156,
3
+ "best_metric": 0.631768953068592,
4
+ "best_model_checkpoint": "bert-base-uncased-finetuned-rte-run_3/run-0/checkpoint-156",
5
  "epoch": 2.0,
6
  "eval_steps": 500,
7
  "global_step": 156,
 
11
  "log_history": [
12
  {
13
  "epoch": 1.0,
14
+ "eval_accuracy": 0.49097472924187724,
15
+ "eval_loss": 0.7057711482048035,
16
+ "eval_runtime": 0.6548,
17
+ "eval_samples_per_second": 423.062,
18
+ "eval_steps_per_second": 7.636,
19
  "step": 78
20
  },
21
  {
22
  "epoch": 2.0,
23
+ "eval_accuracy": 0.631768953068592,
24
+ "eval_loss": 0.6515233516693115,
25
+ "eval_runtime": 0.6593,
26
+ "eval_samples_per_second": 420.154,
27
+ "eval_steps_per_second": 7.584,
28
  "step": 156
29
  }
30
  ],
 
49
  "train_batch_size": 32,
50
  "trial_name": null,
51
  "trial_params": {
52
+ "classifier_dropout": 0.24469588923063107,
53
+ "learning_rate": 1.632929904930613e-05,
54
+ "max_length": 512,
55
  "num_train_epochs": 3,
56
  "per_device_train_batch_size": 32
57
  }
run-0/checkpoint-234/trainer_state.json CHANGED
@@ -1,7 +1,7 @@
1
  {
2
- "best_global_step": 78,
3
- "best_metric": 0.4729241877256318,
4
- "best_model_checkpoint": "bert-base-uncased-finetuned-rte-run_3/run-0/checkpoint-78",
5
  "epoch": 3.0,
6
  "eval_steps": 500,
7
  "global_step": 234,
@@ -11,29 +11,29 @@
11
  "log_history": [
12
  {
13
  "epoch": 1.0,
14
- "eval_accuracy": 0.4729241877256318,
15
- "eval_loss": 0.7100459933280945,
16
- "eval_runtime": 0.6584,
17
- "eval_samples_per_second": 420.731,
18
- "eval_steps_per_second": 7.594,
19
  "step": 78
20
  },
21
  {
22
  "epoch": 2.0,
23
- "eval_accuracy": 0.4693140794223827,
24
- "eval_loss": 0.7023970484733582,
25
- "eval_runtime": 0.6667,
26
- "eval_samples_per_second": 415.458,
27
- "eval_steps_per_second": 7.499,
28
  "step": 156
29
  },
30
  {
31
  "epoch": 3.0,
32
- "eval_accuracy": 0.4693140794223827,
33
- "eval_loss": 0.7006211876869202,
34
- "eval_runtime": 0.6634,
35
- "eval_samples_per_second": 417.544,
36
- "eval_steps_per_second": 7.537,
37
  "step": 234
38
  }
39
  ],
@@ -58,9 +58,9 @@
58
  "train_batch_size": 32,
59
  "trial_name": null,
60
  "trial_params": {
61
- "classifier_dropout": 0.4312273582787619,
62
- "learning_rate": 2.007242870680699e-06,
63
- "max_length": 256,
64
  "num_train_epochs": 3,
65
  "per_device_train_batch_size": 32
66
  }
 
1
  {
2
+ "best_global_step": 234,
3
+ "best_metric": 0.6425992779783394,
4
+ "best_model_checkpoint": "bert-base-uncased-finetuned-rte-run_3/run-0/checkpoint-234",
5
  "epoch": 3.0,
6
  "eval_steps": 500,
7
  "global_step": 234,
 
11
  "log_history": [
12
  {
13
  "epoch": 1.0,
14
+ "eval_accuracy": 0.49097472924187724,
15
+ "eval_loss": 0.7057711482048035,
16
+ "eval_runtime": 0.6548,
17
+ "eval_samples_per_second": 423.062,
18
+ "eval_steps_per_second": 7.636,
19
  "step": 78
20
  },
21
  {
22
  "epoch": 2.0,
23
+ "eval_accuracy": 0.631768953068592,
24
+ "eval_loss": 0.6515233516693115,
25
+ "eval_runtime": 0.6593,
26
+ "eval_samples_per_second": 420.154,
27
+ "eval_steps_per_second": 7.584,
28
  "step": 156
29
  },
30
  {
31
  "epoch": 3.0,
32
+ "eval_accuracy": 0.6425992779783394,
33
+ "eval_loss": 0.6529138684272766,
34
+ "eval_runtime": 0.6631,
35
+ "eval_samples_per_second": 417.743,
36
+ "eval_steps_per_second": 7.54,
37
  "step": 234
38
  }
39
  ],
 
58
  "train_batch_size": 32,
59
  "trial_name": null,
60
  "trial_params": {
61
+ "classifier_dropout": 0.24469588923063107,
62
+ "learning_rate": 1.632929904930613e-05,
63
+ "max_length": 512,
64
  "num_train_epochs": 3,
65
  "per_device_train_batch_size": 32
66
  }
run-0/checkpoint-78/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:87b50ecc41734e36153aa45d5a491b8ab4c441473c3e75910abe6431fe84eef7
3
  size 437958648
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:323ace2db6bab1e6e929d5b595b5250337041d498d57a05f760f17c5e956f2e4
3
  size 437958648
run-0/checkpoint-78/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e5b3e229c210ce1d0ad666e76892a5e35259d9d21122f18788cd8dcc65010599
3
  size 876038394
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:371c0728bdbc0eb2af5f5259fe6fb2c1afd86a146991072227290489d01c8e3c
3
  size 876038394
run-0/checkpoint-78/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e796b5f158f149ebbb5393a6a5926a9cb01ce01c4f1f213d6b293813f37644c1
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5c1af07f2874294a244b6f46adb4de7c26a7d29b7c2dc41f6701bbfa466035e7
3
  size 1064
run-0/checkpoint-78/trainer_state.json CHANGED
@@ -1,6 +1,6 @@
1
  {
2
  "best_global_step": 78,
3
- "best_metric": 0.4729241877256318,
4
  "best_model_checkpoint": "bert-base-uncased-finetuned-rte-run_3/run-0/checkpoint-78",
5
  "epoch": 1.0,
6
  "eval_steps": 500,
@@ -11,11 +11,11 @@
11
  "log_history": [
12
  {
13
  "epoch": 1.0,
14
- "eval_accuracy": 0.4729241877256318,
15
- "eval_loss": 0.7100459933280945,
16
- "eval_runtime": 0.6584,
17
- "eval_samples_per_second": 420.731,
18
- "eval_steps_per_second": 7.594,
19
  "step": 78
20
  }
21
  ],
@@ -40,9 +40,9 @@
40
  "train_batch_size": 32,
41
  "trial_name": null,
42
  "trial_params": {
43
- "classifier_dropout": 0.4312273582787619,
44
- "learning_rate": 2.007242870680699e-06,
45
- "max_length": 256,
46
  "num_train_epochs": 3,
47
  "per_device_train_batch_size": 32
48
  }
 
1
  {
2
  "best_global_step": 78,
3
+ "best_metric": 0.49097472924187724,
4
  "best_model_checkpoint": "bert-base-uncased-finetuned-rte-run_3/run-0/checkpoint-78",
5
  "epoch": 1.0,
6
  "eval_steps": 500,
 
11
  "log_history": [
12
  {
13
  "epoch": 1.0,
14
+ "eval_accuracy": 0.49097472924187724,
15
+ "eval_loss": 0.7057711482048035,
16
+ "eval_runtime": 0.6548,
17
+ "eval_samples_per_second": 423.062,
18
+ "eval_steps_per_second": 7.636,
19
  "step": 78
20
  }
21
  ],
 
40
  "train_batch_size": 32,
41
  "trial_name": null,
42
  "trial_params": {
43
+ "classifier_dropout": 0.24469588923063107,
44
+ "learning_rate": 1.632929904930613e-05,
45
+ "max_length": 512,
46
  "num_train_epochs": 3,
47
  "per_device_train_batch_size": 32
48
  }
run-0/checkpoint-78/training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4000a623a24e954176bac1dfc31b929c06df0ac83251a2e392753a57a3145fa8
3
  size 5432
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:17bcef98605aae5d137d7d5a84cac1f1e0091c73c323300da1659a9ef388f310
3
  size 5432
runs/Apr07_10-59-04_d0bdfe9fd409/events.out.tfevents.1744023700.d0bdfe9fd409.3962.2 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:407c546b1094eaeba412107ac6a0f9b0e01223d5286ca74ef7d42c5ed74f1eb1
3
+ size 5776
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:353fc9b250b05a6892f466799a9d7f0f589218dd504abd1d311575b8f27dd725
3
  size 5432
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:17bcef98605aae5d137d7d5a84cac1f1e0091c73c323300da1659a9ef388f310
3
  size 5432