HorcruxNo13 committed on
Commit
31284f4
1 Parent(s): e6e5df2

Training in progress, epoch 1

Browse files
all_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "epoch": 7.0,
3
  "total_flos": 1.73991922900992e+17,
4
- "train_loss": 0.5857737362384796,
5
- "train_runtime": 257.742,
6
- "train_samples_per_second": 27.159,
7
- "train_steps_per_second": 0.217
8
  }
 
1
  {
2
  "epoch": 7.0,
3
  "total_flos": 1.73991922900992e+17,
4
+ "train_loss": 0.5527358267988477,
5
+ "train_runtime": 138.7489,
6
+ "train_samples_per_second": 50.451,
7
+ "train_steps_per_second": 0.404
8
  }
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5b547a75b48f9d72a3e5efcc75583ec98f616f639143ccea478167058a79af3e
3
  size 110394865
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b0a20659b3ad9192cfbe75a1ac3cab84dd5423b7ef52b01beafb000977e0e963
3
  size 110394865
train_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "epoch": 7.0,
3
  "total_flos": 1.73991922900992e+17,
4
- "train_loss": 0.5857737362384796,
5
- "train_runtime": 257.742,
6
- "train_samples_per_second": 27.159,
7
- "train_steps_per_second": 0.217
8
  }
 
1
  {
2
  "epoch": 7.0,
3
  "total_flos": 1.73991922900992e+17,
4
+ "train_loss": 0.5527358267988477,
5
+ "train_runtime": 138.7489,
6
+ "train_samples_per_second": 50.451,
7
+ "train_steps_per_second": 0.404
8
  }
trainer_state.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "best_metric": 0.7416666666666667,
3
  "best_model_checkpoint": "swin-tiny-patch4-window7-224/checkpoint-48",
4
  "epoch": 7.0,
5
  "eval_steps": 500,
@@ -12,135 +12,135 @@
12
  "epoch": 1.0,
13
  "eval_accuracy": 0.7333333333333333,
14
  "eval_f1_score": 0.6205128205128204,
15
- "eval_loss": 0.5834997296333313,
16
  "eval_precision": 0.5377777777777778,
17
  "eval_recall": 0.7333333333333333,
18
- "eval_runtime": 33.1193,
19
- "eval_samples_per_second": 7.247,
20
- "eval_steps_per_second": 0.242,
21
  "step": 8
22
  },
23
  {
24
  "epoch": 1.25,
25
  "learning_rate": 4.600000000000001e-05,
26
- "loss": 0.6395,
27
  "step": 10
28
  },
29
  {
30
  "epoch": 2.0,
31
  "eval_accuracy": 0.7333333333333333,
32
  "eval_f1_score": 0.6205128205128204,
33
- "eval_loss": 0.5735692381858826,
34
  "eval_precision": 0.5377777777777778,
35
  "eval_recall": 0.7333333333333333,
36
- "eval_runtime": 2.0727,
37
- "eval_samples_per_second": 115.793,
38
- "eval_steps_per_second": 3.86,
39
  "step": 16
40
  },
41
  {
42
  "epoch": 2.5,
43
  "learning_rate": 3.6e-05,
44
- "loss": 0.5789,
45
  "step": 20
46
  },
47
  {
48
  "epoch": 3.0,
49
  "eval_accuracy": 0.7333333333333333,
50
  "eval_f1_score": 0.6205128205128204,
51
- "eval_loss": 0.5942796468734741,
52
  "eval_precision": 0.5377777777777778,
53
  "eval_recall": 0.7333333333333333,
54
- "eval_runtime": 2.0683,
55
- "eval_samples_per_second": 116.035,
56
- "eval_steps_per_second": 3.868,
57
  "step": 24
58
  },
59
  {
60
  "epoch": 3.75,
61
  "learning_rate": 2.6000000000000002e-05,
62
- "loss": 0.5887,
63
  "step": 30
64
  },
65
  {
66
  "epoch": 4.0,
67
  "eval_accuracy": 0.7333333333333333,
68
  "eval_f1_score": 0.6205128205128204,
69
- "eval_loss": 0.5613328218460083,
70
  "eval_precision": 0.5377777777777778,
71
  "eval_recall": 0.7333333333333333,
72
- "eval_runtime": 2.0585,
73
- "eval_samples_per_second": 116.592,
74
- "eval_steps_per_second": 3.886,
75
  "step": 32
76
  },
77
  {
78
  "epoch": 5.0,
79
  "learning_rate": 1.6000000000000003e-05,
80
- "loss": 0.5791,
81
  "step": 40
82
  },
83
  {
84
  "epoch": 5.0,
85
- "eval_accuracy": 0.7333333333333333,
86
- "eval_f1_score": 0.6205128205128204,
87
- "eval_loss": 0.5557453036308289,
88
- "eval_precision": 0.5377777777777778,
89
- "eval_recall": 0.7333333333333333,
90
- "eval_runtime": 2.0897,
91
- "eval_samples_per_second": 114.847,
92
- "eval_steps_per_second": 3.828,
93
  "step": 40
94
  },
95
  {
96
  "epoch": 6.0,
97
- "eval_accuracy": 0.7416666666666667,
98
- "eval_f1_score": 0.6396720831503441,
99
- "eval_loss": 0.5535091161727905,
100
- "eval_precision": 0.8089635854341737,
101
- "eval_recall": 0.7416666666666667,
102
- "eval_runtime": 1.9813,
103
- "eval_samples_per_second": 121.134,
104
- "eval_steps_per_second": 4.038,
105
  "step": 48
106
  },
107
  {
108
  "epoch": 6.25,
109
  "learning_rate": 6e-06,
110
- "loss": 0.5717,
111
  "step": 50
112
  },
113
  {
114
  "epoch": 7.0,
115
- "eval_accuracy": 0.7333333333333333,
116
- "eval_f1_score": 0.6205128205128204,
117
- "eval_loss": 0.5456091165542603,
118
- "eval_precision": 0.5377777777777778,
119
- "eval_recall": 0.7333333333333333,
120
- "eval_runtime": 2.0655,
121
- "eval_samples_per_second": 116.197,
122
- "eval_steps_per_second": 3.873,
123
  "step": 56
124
  },
125
  {
126
  "epoch": 7.0,
127
  "step": 56,
128
  "total_flos": 1.73991922900992e+17,
129
- "train_loss": 0.5857737362384796,
130
- "train_runtime": 257.742,
131
- "train_samples_per_second": 27.159,
132
- "train_steps_per_second": 0.217
133
  },
134
  {
135
  "epoch": 7.0,
136
- "eval_accuracy": 0.7366666666666667,
137
- "eval_f1_score": 0.6314646594113398,
138
- "eval_loss": 0.5486770868301392,
139
- "eval_precision": 0.8064765100671142,
140
- "eval_recall": 0.7366666666666667,
141
- "eval_runtime": 109.0657,
142
- "eval_samples_per_second": 2.751,
143
- "eval_steps_per_second": 0.092,
144
  "step": 56
145
  }
146
  ],
 
1
  {
2
+ "best_metric": 0.7625,
3
  "best_model_checkpoint": "swin-tiny-patch4-window7-224/checkpoint-48",
4
  "epoch": 7.0,
5
  "eval_steps": 500,
 
12
  "epoch": 1.0,
13
  "eval_accuracy": 0.7333333333333333,
14
  "eval_f1_score": 0.6205128205128204,
15
+ "eval_loss": 0.5696213841438293,
16
  "eval_precision": 0.5377777777777778,
17
  "eval_recall": 0.7333333333333333,
18
+ "eval_runtime": 1.8813,
19
+ "eval_samples_per_second": 127.574,
20
+ "eval_steps_per_second": 4.252,
21
  "step": 8
22
  },
23
  {
24
  "epoch": 1.25,
25
  "learning_rate": 4.600000000000001e-05,
26
+ "loss": 0.6683,
27
  "step": 10
28
  },
29
  {
30
  "epoch": 2.0,
31
  "eval_accuracy": 0.7333333333333333,
32
  "eval_f1_score": 0.6205128205128204,
33
+ "eval_loss": 0.5635157227516174,
34
  "eval_precision": 0.5377777777777778,
35
  "eval_recall": 0.7333333333333333,
36
+ "eval_runtime": 1.8341,
37
+ "eval_samples_per_second": 130.853,
38
+ "eval_steps_per_second": 4.362,
39
  "step": 16
40
  },
41
  {
42
  "epoch": 2.5,
43
  "learning_rate": 3.6e-05,
44
+ "loss": 0.5797,
45
  "step": 20
46
  },
47
  {
48
  "epoch": 3.0,
49
  "eval_accuracy": 0.7333333333333333,
50
  "eval_f1_score": 0.6205128205128204,
51
+ "eval_loss": 0.55841064453125,
52
  "eval_precision": 0.5377777777777778,
53
  "eval_recall": 0.7333333333333333,
54
+ "eval_runtime": 2.0336,
55
+ "eval_samples_per_second": 118.017,
56
+ "eval_steps_per_second": 3.934,
57
  "step": 24
58
  },
59
  {
60
  "epoch": 3.75,
61
  "learning_rate": 2.6000000000000002e-05,
62
+ "loss": 0.5547,
63
  "step": 30
64
  },
65
  {
66
  "epoch": 4.0,
67
  "eval_accuracy": 0.7333333333333333,
68
  "eval_f1_score": 0.6205128205128204,
69
+ "eval_loss": 0.5731536746025085,
70
  "eval_precision": 0.5377777777777778,
71
  "eval_recall": 0.7333333333333333,
72
+ "eval_runtime": 1.8352,
73
+ "eval_samples_per_second": 130.778,
74
+ "eval_steps_per_second": 4.359,
75
  "step": 32
76
  },
77
  {
78
  "epoch": 5.0,
79
  "learning_rate": 1.6000000000000003e-05,
80
+ "loss": 0.5165,
81
  "step": 40
82
  },
83
  {
84
  "epoch": 5.0,
85
+ "eval_accuracy": 0.7583333333333333,
86
+ "eval_f1_score": 0.6959050899349406,
87
+ "eval_loss": 0.5416003465652466,
88
+ "eval_precision": 0.7485882848714707,
89
+ "eval_recall": 0.7583333333333333,
90
+ "eval_runtime": 2.091,
91
+ "eval_samples_per_second": 114.78,
92
+ "eval_steps_per_second": 3.826,
93
  "step": 40
94
  },
95
  {
96
  "epoch": 6.0,
97
+ "eval_accuracy": 0.7625,
98
+ "eval_f1_score": 0.7033555352126014,
99
+ "eval_loss": 0.5488410592079163,
100
+ "eval_precision": 0.7561481481481481,
101
+ "eval_recall": 0.7625,
102
+ "eval_runtime": 2.0904,
103
+ "eval_samples_per_second": 114.812,
104
+ "eval_steps_per_second": 3.827,
105
  "step": 48
106
  },
107
  {
108
  "epoch": 6.25,
109
  "learning_rate": 6e-06,
110
+ "loss": 0.4893,
111
  "step": 50
112
  },
113
  {
114
  "epoch": 7.0,
115
+ "eval_accuracy": 0.7583333333333333,
116
+ "eval_f1_score": 0.7003333333333333,
117
+ "eval_loss": 0.5511656403541565,
118
+ "eval_precision": 0.7431547619047619,
119
+ "eval_recall": 0.7583333333333333,
120
+ "eval_runtime": 1.9003,
121
+ "eval_samples_per_second": 126.293,
122
+ "eval_steps_per_second": 4.21,
123
  "step": 56
124
  },
125
  {
126
  "epoch": 7.0,
127
  "step": 56,
128
  "total_flos": 1.73991922900992e+17,
129
+ "train_loss": 0.5527358267988477,
130
+ "train_runtime": 138.7489,
131
+ "train_samples_per_second": 50.451,
132
+ "train_steps_per_second": 0.404
133
  },
134
  {
135
  "epoch": 7.0,
136
+ "eval_accuracy": 0.78,
137
+ "eval_f1_score": 0.7315167493796526,
138
+ "eval_loss": 0.5118212699890137,
139
+ "eval_precision": 0.7896499764558155,
140
+ "eval_recall": 0.78,
141
+ "eval_runtime": 2.3258,
142
+ "eval_samples_per_second": 128.99,
143
+ "eval_steps_per_second": 4.3,
144
  "step": 56
145
  }
146
  ],
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:fb7e8116dbe569fb96ff854b905cb0bc3ae5795528e7afede2c8328a68bddc7d
3
  size 4091
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8eba1d171a372a5066ba1cf45c0e4bcb11be97010d86e34d8bc234c36402be07
3
  size 4091