Cheng98 committed on
Commit
4648129
·
verified ·
1 Parent(s): f919337

Upload folder using huggingface_hub

Browse files
README.md CHANGED
@@ -18,13 +18,11 @@ model-index:
18
  dataset:
19
  name: GLUE BOOLQ
20
  type: glue
21
- config: boolq
22
- split: validation
23
  args: boolq
24
  metrics:
25
  - name: Accuracy
26
  type: accuracy
27
- value: 0.7097859327217125
28
  ---
29
 
30
  <!-- This model card has been generated automatically according to the information the Trainer had access to. You
@@ -34,8 +32,8 @@ should probably proofread and complete it, then remove this comment. -->
34
 
35
  This model is a fine-tuned version of [bert-base-cased](https://huggingface.co/bert-base-cased) on the GLUE BOOLQ dataset.
36
  It achieves the following results on the evaluation set:
37
- - Loss: 1.1221
38
- - Accuracy: 0.7098
39
 
40
  ## Model description
41
 
 
18
  dataset:
19
  name: GLUE BOOLQ
20
  type: glue
 
 
21
  args: boolq
22
  metrics:
23
  - name: Accuracy
24
  type: accuracy
25
+ value: 0.7103975535168195
26
  ---
27
 
28
  <!-- This model card has been generated automatically according to the information the Trainer had access to. You
 
32
 
33
  This model is a fine-tuned version of [bert-base-cased](https://huggingface.co/bert-base-cased) on the GLUE BOOLQ dataset.
34
  It achieves the following results on the evaluation set:
35
+ - Loss: 1.1407
36
+ - Accuracy: 0.7104
37
 
38
  ## Model description
39
 
all_results.json CHANGED
@@ -1,14 +1,14 @@
1
  {
2
  "epoch": 5.0,
3
- "eval_accuracy": 0.7097859327217125,
4
- "eval_loss": 1.1220989227294922,
5
- "eval_runtime": 6.9032,
6
  "eval_samples": 3270,
7
- "eval_samples_per_second": 473.694,
8
- "eval_steps_per_second": 59.248,
9
- "train_loss": 0.37518319857322563,
10
- "train_runtime": 326.8151,
11
  "train_samples": 9427,
12
- "train_samples_per_second": 144.225,
13
- "train_steps_per_second": 9.027
14
  }
 
1
  {
2
  "epoch": 5.0,
3
+ "eval_accuracy": 0.7103975535168195,
4
+ "eval_loss": 1.1407246589660645,
5
+ "eval_runtime": 4.6126,
6
  "eval_samples": 3270,
7
+ "eval_samples_per_second": 708.933,
8
+ "eval_steps_per_second": 88.671,
9
+ "train_loss": 0.38077404086872685,
10
+ "train_runtime": 143.3727,
11
  "train_samples": 9427,
12
+ "train_samples_per_second": 328.759,
13
+ "train_steps_per_second": 20.576
14
  }
eval_results.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "epoch": 5.0,
3
- "eval_accuracy": 0.7097859327217125,
4
- "eval_loss": 1.1220989227294922,
5
- "eval_runtime": 6.9032,
6
  "eval_samples": 3270,
7
- "eval_samples_per_second": 473.694,
8
- "eval_steps_per_second": 59.248
9
  }
 
1
  {
2
  "epoch": 5.0,
3
+ "eval_accuracy": 0.7103975535168195,
4
+ "eval_loss": 1.1407246589660645,
5
+ "eval_runtime": 4.6126,
6
  "eval_samples": 3270,
7
+ "eval_samples_per_second": 708.933,
8
+ "eval_steps_per_second": 88.671
9
  }
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7e15e0a8f4da13c477a997731321b300c4e67e0affef277108b00b611b47c27d
3
  size 433315633
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:be7f2e36f176caecf8e31e394ebf5369e69b3674c887c05a212df130820e2b33
3
  size 433315633
train_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "epoch": 5.0,
3
- "train_loss": 0.37518319857322563,
4
- "train_runtime": 326.8151,
5
  "train_samples": 9427,
6
- "train_samples_per_second": 144.225,
7
- "train_steps_per_second": 9.027
8
  }
 
1
  {
2
  "epoch": 5.0,
3
+ "train_loss": 0.38077404086872685,
4
+ "train_runtime": 143.3727,
5
  "train_samples": 9427,
6
+ "train_samples_per_second": 328.759,
7
+ "train_steps_per_second": 20.576
8
  }
trainer_state.json CHANGED
@@ -10,41 +10,41 @@
10
  {
11
  "epoch": 0.85,
12
  "learning_rate": 1.6610169491525424e-05,
13
- "loss": 0.6634,
14
  "step": 500
15
  },
16
  {
17
  "epoch": 1.69,
18
- "learning_rate": 1.3220338983050848e-05,
19
- "loss": 0.5784,
20
  "step": 1000
21
  },
22
  {
23
  "epoch": 2.54,
24
- "learning_rate": 9.830508474576272e-06,
25
- "loss": 0.4113,
26
  "step": 1500
27
  },
28
  {
29
  "epoch": 3.39,
30
- "learning_rate": 6.440677966101695e-06,
31
- "loss": 0.2685,
32
  "step": 2000
33
  },
34
  {
35
  "epoch": 4.24,
36
- "learning_rate": 3.0508474576271192e-06,
37
- "loss": 0.1735,
38
  "step": 2500
39
  },
40
  {
41
  "epoch": 5.0,
42
  "step": 2950,
43
  "total_flos": 3100434898598400.0,
44
- "train_loss": 0.37518319857322563,
45
- "train_runtime": 326.8151,
46
- "train_samples_per_second": 144.225,
47
- "train_steps_per_second": 9.027
48
  }
49
  ],
50
  "max_steps": 2950,
 
10
  {
11
  "epoch": 0.85,
12
  "learning_rate": 1.6610169491525424e-05,
13
+ "loss": 0.6633,
14
  "step": 500
15
  },
16
  {
17
  "epoch": 1.69,
18
+ "learning_rate": 1.3227118644067798e-05,
19
+ "loss": 0.5801,
20
  "step": 1000
21
  },
22
  {
23
  "epoch": 2.54,
24
+ "learning_rate": 9.844067796610171e-06,
25
+ "loss": 0.4258,
26
  "step": 1500
27
  },
28
  {
29
  "epoch": 3.39,
30
+ "learning_rate": 6.4542372881355944e-06,
31
+ "loss": 0.2802,
32
  "step": 2000
33
  },
34
  {
35
  "epoch": 4.24,
36
+ "learning_rate": 3.0644067796610173e-06,
37
+ "loss": 0.1836,
38
  "step": 2500
39
  },
40
  {
41
  "epoch": 5.0,
42
  "step": 2950,
43
  "total_flos": 3100434898598400.0,
44
+ "train_loss": 0.38077404086872685,
45
+ "train_runtime": 143.3727,
46
+ "train_samples_per_second": 328.759,
47
+ "train_steps_per_second": 20.576
48
  }
49
  ],
50
  "max_steps": 2950,
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5c41f5615188e374b7e0a00d54c3c74e42c1c1e8ec7c5c33fbba2a9f0aef5e36
3
  size 3963
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2a7317d57843de51bc3494add8422c9807a70f1ebb84b24f1d55c54896286df4
3
  size 3963