bmedeiros committed on
Commit
539d368
·
verified ·
1 Parent(s): 98c6da6

End of training

Browse files
README.md CHANGED
@@ -23,7 +23,7 @@ model-index:
23
  metrics:
24
  - name: Accuracy
25
  type: accuracy
26
- value: 0.8705882352941177
27
  ---
28
 
29
  <!-- This model card has been generated automatically according to the information the Trainer had access to. You
@@ -33,8 +33,8 @@ should probably proofread and complete it, then remove this comment. -->
33
 
34
  This model is a fine-tuned version of [facebook/vit-msn-small](https://huggingface.co/facebook/vit-msn-small) on the imagefolder dataset.
35
  It achieves the following results on the evaluation set:
36
- - Loss: 0.3307
37
- - Accuracy: 0.8706
38
 
39
  ## Model description
40
 
 
23
  metrics:
24
  - name: Accuracy
25
  type: accuracy
26
+ value: 0.9235294117647059
27
  ---
28
 
29
  <!-- This model card has been generated automatically according to the information the Trainer had access to. You
 
33
 
34
  This model is a fine-tuned version of [facebook/vit-msn-small](https://huggingface.co/facebook/vit-msn-small) on the imagefolder dataset.
35
  It achieves the following results on the evaluation set:
36
+ - Loss: 0.1866
37
+ - Accuracy: 0.9235
38
 
39
  ## Model description
40
 
all_results.json ADDED
@@ -0,0 +1,13 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 20.0,
3
+ "eval_accuracy": 0.9235294117647059,
4
+ "eval_loss": 0.18661858141422272,
5
+ "eval_runtime": 0.574,
6
+ "eval_samples_per_second": 296.153,
7
+ "eval_steps_per_second": 10.452,
8
+ "total_flos": 2.9117823636013056e+17,
9
+ "train_loss": 0.28690393567085265,
10
+ "train_runtime": 133.8542,
11
+ "train_samples_per_second": 111.166,
12
+ "train_steps_per_second": 0.896
13
+ }
eval_results.json ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 20.0,
3
+ "eval_accuracy": 0.9235294117647059,
4
+ "eval_loss": 0.18661858141422272,
5
+ "eval_runtime": 0.574,
6
+ "eval_samples_per_second": 296.153,
7
+ "eval_steps_per_second": 10.452
8
+ }
runs/Feb21_15-54-52_3abf47ac437f/events.out.tfevents.1740153459.3abf47ac437f.209.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5d545e38339fe97c9c4a0b7b2f31e0c654ccdcbdbe59d70f68edfa5c5fc776b2
3
+ size 405
train_results.json ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 20.0,
3
+ "total_flos": 2.9117823636013056e+17,
4
+ "train_loss": 0.28690393567085265,
5
+ "train_runtime": 133.8542,
6
+ "train_samples_per_second": 111.166,
7
+ "train_steps_per_second": 0.896
8
+ }
trainer_state.json ADDED
@@ -0,0 +1,306 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_metric": 0.9235294117647059,
3
+ "best_model_checkpoint": "vit-msn-small-lipid-invalidation-nobg/checkpoint-84",
4
+ "epoch": 20.0,
5
+ "eval_steps": 500,
6
+ "global_step": 120,
7
+ "is_hyper_param_search": false,
8
+ "is_local_process_zero": true,
9
+ "is_world_process_zero": true,
10
+ "log_history": [
11
+ {
12
+ "epoch": 1.0,
13
+ "eval_accuracy": 0.7058823529411765,
14
+ "eval_loss": 0.5867760181427002,
15
+ "eval_runtime": 0.536,
16
+ "eval_samples_per_second": 317.18,
17
+ "eval_steps_per_second": 11.195,
18
+ "step": 6
19
+ },
20
+ {
21
+ "epoch": 1.6666666666666665,
22
+ "grad_norm": 7.053527355194092,
23
+ "learning_rate": 4.166666666666667e-05,
24
+ "loss": 0.583,
25
+ "step": 10
26
+ },
27
+ {
28
+ "epoch": 2.0,
29
+ "eval_accuracy": 0.8705882352941177,
30
+ "eval_loss": 0.28499943017959595,
31
+ "eval_runtime": 0.5262,
32
+ "eval_samples_per_second": 323.046,
33
+ "eval_steps_per_second": 11.402,
34
+ "step": 12
35
+ },
36
+ {
37
+ "epoch": 3.0,
38
+ "eval_accuracy": 0.8647058823529412,
39
+ "eval_loss": 0.31667008996009827,
40
+ "eval_runtime": 0.5367,
41
+ "eval_samples_per_second": 316.749,
42
+ "eval_steps_per_second": 11.179,
43
+ "step": 18
44
+ },
45
+ {
46
+ "epoch": 3.3333333333333335,
47
+ "grad_norm": 8.924991607666016,
48
+ "learning_rate": 4.62962962962963e-05,
49
+ "loss": 0.4996,
50
+ "step": 20
51
+ },
52
+ {
53
+ "epoch": 4.0,
54
+ "eval_accuracy": 0.8294117647058824,
55
+ "eval_loss": 0.37376630306243896,
56
+ "eval_runtime": 0.5648,
57
+ "eval_samples_per_second": 301.01,
58
+ "eval_steps_per_second": 10.624,
59
+ "step": 24
60
+ },
61
+ {
62
+ "epoch": 5.0,
63
+ "grad_norm": 9.494657516479492,
64
+ "learning_rate": 4.166666666666667e-05,
65
+ "loss": 0.3097,
66
+ "step": 30
67
+ },
68
+ {
69
+ "epoch": 5.0,
70
+ "eval_accuracy": 0.9176470588235294,
71
+ "eval_loss": 0.21050500869750977,
72
+ "eval_runtime": 0.5568,
73
+ "eval_samples_per_second": 305.341,
74
+ "eval_steps_per_second": 10.777,
75
+ "step": 30
76
+ },
77
+ {
78
+ "epoch": 6.0,
79
+ "eval_accuracy": 0.8823529411764706,
80
+ "eval_loss": 0.26954787969589233,
81
+ "eval_runtime": 0.539,
82
+ "eval_samples_per_second": 315.42,
83
+ "eval_steps_per_second": 11.132,
84
+ "step": 36
85
+ },
86
+ {
87
+ "epoch": 6.666666666666667,
88
+ "grad_norm": 10.003211975097656,
89
+ "learning_rate": 3.7037037037037037e-05,
90
+ "loss": 0.2893,
91
+ "step": 40
92
+ },
93
+ {
94
+ "epoch": 7.0,
95
+ "eval_accuracy": 0.8941176470588236,
96
+ "eval_loss": 0.23035354912281036,
97
+ "eval_runtime": 0.5649,
98
+ "eval_samples_per_second": 300.957,
99
+ "eval_steps_per_second": 10.622,
100
+ "step": 42
101
+ },
102
+ {
103
+ "epoch": 8.0,
104
+ "eval_accuracy": 0.8529411764705882,
105
+ "eval_loss": 0.297798752784729,
106
+ "eval_runtime": 0.5553,
107
+ "eval_samples_per_second": 306.117,
108
+ "eval_steps_per_second": 10.804,
109
+ "step": 48
110
+ },
111
+ {
112
+ "epoch": 8.333333333333334,
113
+ "grad_norm": 5.467005252838135,
114
+ "learning_rate": 3.240740740740741e-05,
115
+ "loss": 0.3305,
116
+ "step": 50
117
+ },
118
+ {
119
+ "epoch": 9.0,
120
+ "eval_accuracy": 0.888235294117647,
121
+ "eval_loss": 0.2952236533164978,
122
+ "eval_runtime": 0.5508,
123
+ "eval_samples_per_second": 308.654,
124
+ "eval_steps_per_second": 10.894,
125
+ "step": 54
126
+ },
127
+ {
128
+ "epoch": 10.0,
129
+ "grad_norm": 13.88063907623291,
130
+ "learning_rate": 2.777777777777778e-05,
131
+ "loss": 0.2775,
132
+ "step": 60
133
+ },
134
+ {
135
+ "epoch": 10.0,
136
+ "eval_accuracy": 0.888235294117647,
137
+ "eval_loss": 0.2661350965499878,
138
+ "eval_runtime": 0.5605,
139
+ "eval_samples_per_second": 303.291,
140
+ "eval_steps_per_second": 10.704,
141
+ "step": 60
142
+ },
143
+ {
144
+ "epoch": 11.0,
145
+ "eval_accuracy": 0.8823529411764706,
146
+ "eval_loss": 0.25326403975486755,
147
+ "eval_runtime": 0.5723,
148
+ "eval_samples_per_second": 297.046,
149
+ "eval_steps_per_second": 10.484,
150
+ "step": 66
151
+ },
152
+ {
153
+ "epoch": 11.666666666666666,
154
+ "grad_norm": 7.95721960067749,
155
+ "learning_rate": 2.314814814814815e-05,
156
+ "loss": 0.223,
157
+ "step": 70
158
+ },
159
+ {
160
+ "epoch": 12.0,
161
+ "eval_accuracy": 0.888235294117647,
162
+ "eval_loss": 0.2585911154747009,
163
+ "eval_runtime": 0.5681,
164
+ "eval_samples_per_second": 299.222,
165
+ "eval_steps_per_second": 10.561,
166
+ "step": 72
167
+ },
168
+ {
169
+ "epoch": 13.0,
170
+ "eval_accuracy": 0.9176470588235294,
171
+ "eval_loss": 0.2033568024635315,
172
+ "eval_runtime": 0.5439,
173
+ "eval_samples_per_second": 312.563,
174
+ "eval_steps_per_second": 11.032,
175
+ "step": 78
176
+ },
177
+ {
178
+ "epoch": 13.333333333333334,
179
+ "grad_norm": 10.242790222167969,
180
+ "learning_rate": 1.8518518518518518e-05,
181
+ "loss": 0.216,
182
+ "step": 80
183
+ },
184
+ {
185
+ "epoch": 14.0,
186
+ "eval_accuracy": 0.9235294117647059,
187
+ "eval_loss": 0.18661858141422272,
188
+ "eval_runtime": 0.5426,
189
+ "eval_samples_per_second": 313.32,
190
+ "eval_steps_per_second": 11.058,
191
+ "step": 84
192
+ },
193
+ {
194
+ "epoch": 15.0,
195
+ "grad_norm": 5.154911518096924,
196
+ "learning_rate": 1.388888888888889e-05,
197
+ "loss": 0.1858,
198
+ "step": 90
199
+ },
200
+ {
201
+ "epoch": 15.0,
202
+ "eval_accuracy": 0.888235294117647,
203
+ "eval_loss": 0.2631073296070099,
204
+ "eval_runtime": 0.5262,
205
+ "eval_samples_per_second": 323.067,
206
+ "eval_steps_per_second": 11.402,
207
+ "step": 90
208
+ },
209
+ {
210
+ "epoch": 16.0,
211
+ "eval_accuracy": 0.888235294117647,
212
+ "eval_loss": 0.2439642697572708,
213
+ "eval_runtime": 0.5331,
214
+ "eval_samples_per_second": 318.919,
215
+ "eval_steps_per_second": 11.256,
216
+ "step": 96
217
+ },
218
+ {
219
+ "epoch": 16.666666666666668,
220
+ "grad_norm": 3.7305550575256348,
221
+ "learning_rate": 9.259259259259259e-06,
222
+ "loss": 0.1866,
223
+ "step": 100
224
+ },
225
+ {
226
+ "epoch": 17.0,
227
+ "eval_accuracy": 0.8941176470588236,
228
+ "eval_loss": 0.2479913830757141,
229
+ "eval_runtime": 0.6023,
230
+ "eval_samples_per_second": 282.236,
231
+ "eval_steps_per_second": 9.961,
232
+ "step": 102
233
+ },
234
+ {
235
+ "epoch": 18.0,
236
+ "eval_accuracy": 0.8647058823529412,
237
+ "eval_loss": 0.38971054553985596,
238
+ "eval_runtime": 0.5781,
239
+ "eval_samples_per_second": 294.055,
240
+ "eval_steps_per_second": 10.378,
241
+ "step": 108
242
+ },
243
+ {
244
+ "epoch": 18.333333333333332,
245
+ "grad_norm": 16.46074676513672,
246
+ "learning_rate": 4.6296296296296296e-06,
247
+ "loss": 0.1701,
248
+ "step": 110
249
+ },
250
+ {
251
+ "epoch": 19.0,
252
+ "eval_accuracy": 0.8647058823529412,
253
+ "eval_loss": 0.3998810350894928,
254
+ "eval_runtime": 0.5376,
255
+ "eval_samples_per_second": 316.242,
256
+ "eval_steps_per_second": 11.161,
257
+ "step": 114
258
+ },
259
+ {
260
+ "epoch": 20.0,
261
+ "grad_norm": 5.165961265563965,
262
+ "learning_rate": 0.0,
263
+ "loss": 0.1717,
264
+ "step": 120
265
+ },
266
+ {
267
+ "epoch": 20.0,
268
+ "eval_accuracy": 0.8705882352941177,
269
+ "eval_loss": 0.33069366216659546,
270
+ "eval_runtime": 0.5592,
271
+ "eval_samples_per_second": 304.018,
272
+ "eval_steps_per_second": 10.73,
273
+ "step": 120
274
+ },
275
+ {
276
+ "epoch": 20.0,
277
+ "step": 120,
278
+ "total_flos": 2.9117823636013056e+17,
279
+ "train_loss": 0.28690393567085265,
280
+ "train_runtime": 133.8542,
281
+ "train_samples_per_second": 111.166,
282
+ "train_steps_per_second": 0.896
283
+ }
284
+ ],
285
+ "logging_steps": 10,
286
+ "max_steps": 120,
287
+ "num_input_tokens_seen": 0,
288
+ "num_train_epochs": 20,
289
+ "save_steps": 500,
290
+ "stateful_callbacks": {
291
+ "TrainerControl": {
292
+ "args": {
293
+ "should_epoch_stop": false,
294
+ "should_evaluate": false,
295
+ "should_log": false,
296
+ "should_save": true,
297
+ "should_training_stop": true
298
+ },
299
+ "attributes": {}
300
+ }
301
+ },
302
+ "total_flos": 2.9117823636013056e+17,
303
+ "train_batch_size": 32,
304
+ "trial_name": null,
305
+ "trial_params": null
306
+ }