alyzbane committed on
Commit
bc1108e
·
verified ·
1 Parent(s): fbc2003

End of training

Browse files
README.md CHANGED
@@ -45,7 +45,7 @@ should probably proofread and complete it, then remove this comment. -->
45
 
46
  This model is a fine-tuned version of [facebook/convnext-tiny-224](https://huggingface.co/facebook/convnext-tiny-224) on the imagefolder dataset.
47
  It achieves the following results on the evaluation set:
48
- - Loss: 0.0794
49
  - Precision: 0.9936
50
  - Recall: 0.9934
51
  - F1: 0.9934
@@ -82,21 +82,24 @@ The following hyperparameters were used during training:
82
 
83
  ### Training results
84
 
85
- | Training Loss | Epoch | Step | Validation Loss | Precision | Recall | F1 | Accuracy | Top1 Accuracy | Error Rate |
86
- |:-------------:|:-----:|:----:|:---------------:|:---------:|:------:|:------:|:--------:|:-------------:|:----------:|
87
- | 1.576 | 1.0 | 38 | 1.5660 | 0.3007 | 0.3684 | 0.2952 | 0.3479 | 0.3684 | 0.6521 |
88
- | 1.5469 | 2.0 | 76 | 1.5353 | 0.3141 | 0.4079 | 0.3215 | 0.3854 | 0.4079 | 0.6146 |
89
- | 1.5081 | 3.0 | 114 | 1.4782 | 0.5684 | 0.4671 | 0.3961 | 0.4436 | 0.4671 | 0.5564 |
90
- | 1.4278 | 4.0 | 152 | 1.3718 | 0.7088 | 0.6053 | 0.5840 | 0.5866 | 0.6053 | 0.4134 |
91
- | 1.2938 | 5.0 | 190 | 1.1909 | 0.8582 | 0.8355 | 0.8378 | 0.8290 | 0.8355 | 0.1710 |
92
- | 1.0696 | 6.0 | 228 | 0.9353 | 0.9243 | 0.9211 | 0.9215 | 0.9205 | 0.9211 | 0.0795 |
93
- | 0.789 | 7.0 | 266 | 0.6347 | 0.9680 | 0.9671 | 0.9673 | 0.9691 | 0.9671 | 0.0309 |
94
- | 0.506 | 8.0 | 304 | 0.3910 | 0.9750 | 0.9737 | 0.9739 | 0.9752 | 0.9737 | 0.0248 |
95
- | 0.2876 | 9.0 | 342 | 0.2126 | 0.9808 | 0.9803 | 0.9802 | 0.9814 | 0.9803 | 0.0186 |
96
- | 0.1722 | 10.0 | 380 | 0.1409 | 0.9809 | 0.9803 | 0.9799 | 0.9818 | 0.9803 | 0.0182 |
97
- | 0.1082 | 11.0 | 418 | 0.0794 | 0.9936 | 0.9934 | 0.9934 | 0.9939 | 0.9934 | 0.0061 |
98
- | 0.0715 | 12.0 | 456 | 0.0577 | 0.9936 | 0.9934 | 0.9934 | 0.9939 | 0.9934 | 0.0061 |
99
- | 0.0492 | 13.0 | 494 | 0.0440 | 0.9872 | 0.9868 | 0.9867 | 0.9879 | 0.9868 | 0.0121 |
 
 
 
100
 
101
 
102
  ### Framework versions
 
45
 
46
  This model is a fine-tuned version of [facebook/convnext-tiny-224](https://huggingface.co/facebook/convnext-tiny-224) on the imagefolder dataset.
47
  It achieves the following results on the evaluation set:
48
+ - Loss: 0.0266
49
  - Precision: 0.9936
50
  - Recall: 0.9934
51
  - F1: 0.9934
 
82
 
83
  ### Training results
84
 
85
+ | Training Loss | Epoch | Step | Accuracy | Error Rate | F1 | Validation Loss | Precision | Recall | Top1 Accuracy |
86
+ |:-------------:|:-----:|:----:|:--------:|:----------:|:------:|:---------------:|:---------:|:------:|:-------------:|
87
+ | 1.576 | 1.0 | 38 | 0.3479 | 0.6521 | 0.2952 | 1.5660 | 0.3007 | 0.3684 | 0.3684 |
88
+ | 1.5469 | 2.0 | 76 | 0.3854 | 0.6146 | 0.3215 | 1.5353 | 0.3141 | 0.4079 | 0.4079 |
89
+ | 1.5081 | 3.0 | 114 | 0.4436 | 0.5564 | 0.3961 | 1.4782 | 0.5684 | 0.4671 | 0.4671 |
90
+ | 1.4278 | 4.0 | 152 | 0.5866 | 0.4134 | 0.5840 | 1.3718 | 0.7088 | 0.6053 | 0.6053 |
91
+ | 1.2938 | 5.0 | 190 | 0.8290 | 0.1710 | 0.8378 | 1.1909 | 0.8582 | 0.8355 | 0.8355 |
92
+ | 1.0696 | 6.0 | 228 | 0.9205 | 0.0795 | 0.9215 | 0.9353 | 0.9243 | 0.9211 | 0.9211 |
93
+ | 0.789 | 7.0 | 266 | 0.9691 | 0.0309 | 0.9673 | 0.6347 | 0.9680 | 0.9671 | 0.9671 |
94
+ | 0.506 | 8.0 | 304 | 0.9752 | 0.0248 | 0.9739 | 0.3910 | 0.9750 | 0.9737 | 0.9737 |
95
+ | 0.2876 | 9.0 | 342 | 0.9814 | 0.0186 | 0.9802 | 0.2126 | 0.9808 | 0.9803 | 0.9803 |
96
+ | 0.1722 | 10.0 | 380 | 0.9818 | 0.0182 | 0.9799 | 0.1409 | 0.9809 | 0.9803 | 0.9803 |
97
+ | 0.1082 | 11.0 | 418 | 0.9939 | 0.0061 | 0.9934 | 0.0794 | 0.9936 | 0.9934 | 0.9934 |
98
+ | 0.0715 | 12.0 | 456 | 0.9939 | 0.0061 | 0.9934 | 0.0577 | 0.9936 | 0.9934 | 0.9934 |
99
+ | 0.0492 | 13.0 | 494 | 0.9879 | 0.0121 | 0.9867 | 0.0440 | 0.9872 | 0.9868 | 0.9868 |
100
+ | 0.0375 | 14.0 | 532 | 0.9939 | 0.0061 | 0.9934 | 0.0266 | 0.9936 | 0.9934 | 0.9934 |
101
+ | 0.029 | 15.0 | 570 | 0.9939 | 0.0061 | 0.9934 | 0.0313 | 0.9936 | 0.9934 | 0.9934 |
102
+ | 0.0158 | 16.0 | 608 | 0.9879 | 0.0121 | 0.9867 | 0.0408 | 0.9872 | 0.9868 | 0.9868 |
103
 
104
 
105
  ### Framework versions
all_results.json CHANGED
@@ -1,18 +1,18 @@
1
  {
2
- "epoch": 13.0,
3
  "eval_accuracy": 0.9939393939393939,
4
  "eval_error_rate": 0.0060606060606061,
5
  "eval_f1": 0.993419541966282,
6
- "eval_loss": 0.0794038251042366,
7
  "eval_precision": 0.9936145510835913,
8
  "eval_recall": 0.993421052631579,
9
- "eval_runtime": 51.0106,
10
- "eval_samples_per_second": 2.98,
11
- "eval_steps_per_second": 0.098,
12
  "eval_top1_accuracy": 0.993421052631579,
13
- "total_flos": 3.972506461105029e+17,
14
- "train_loss": 0.8004542765347099,
15
- "train_runtime": 7158.591,
16
- "train_samples_per_second": 5.096,
17
- "train_steps_per_second": 0.159
18
  }
 
1
  {
2
+ "epoch": 16.0,
3
  "eval_accuracy": 0.9939393939393939,
4
  "eval_error_rate": 0.0060606060606061,
5
  "eval_f1": 0.993419541966282,
6
+ "eval_loss": 0.02658209018409252,
7
  "eval_precision": 0.9936145510835913,
8
  "eval_recall": 0.993421052631579,
9
+ "eval_runtime": 48.6228,
10
+ "eval_samples_per_second": 3.126,
11
+ "eval_steps_per_second": 0.103,
12
  "eval_top1_accuracy": 0.993421052631579,
13
+ "total_flos": 4.889238721360036e+17,
14
+ "train_loss": 0.005142551405649436,
15
+ "train_runtime": 1686.6977,
16
+ "train_samples_per_second": 21.628,
17
+ "train_steps_per_second": 0.676
18
  }
classification_report.png ADDED
confusion_matrix.png ADDED
eval_results.json CHANGED
@@ -1,13 +1,13 @@
1
  {
2
- "epoch": 13.0,
3
  "eval_accuracy": 0.9939393939393939,
4
  "eval_error_rate": 0.0060606060606061,
5
  "eval_f1": 0.993419541966282,
6
- "eval_loss": 0.0794038251042366,
7
  "eval_precision": 0.9936145510835913,
8
  "eval_recall": 0.993421052631579,
9
- "eval_runtime": 51.0106,
10
- "eval_samples_per_second": 2.98,
11
- "eval_steps_per_second": 0.098,
12
  "eval_top1_accuracy": 0.993421052631579
13
  }
 
1
  {
2
+ "epoch": 16.0,
3
  "eval_accuracy": 0.9939393939393939,
4
  "eval_error_rate": 0.0060606060606061,
5
  "eval_f1": 0.993419541966282,
6
+ "eval_loss": 0.02658209018409252,
7
  "eval_precision": 0.9936145510835913,
8
  "eval_recall": 0.993421052631579,
9
+ "eval_runtime": 48.6228,
10
+ "eval_samples_per_second": 3.126,
11
+ "eval_steps_per_second": 0.103,
12
  "eval_top1_accuracy": 0.993421052631579
13
  }
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0799eed45249c597bd5706cd54239ba58459cb5916a27dddda3eccc89547767d
3
  size 111317164
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:62798162e3f57ffa189d6ee7c57129c330720ace9dcf029005622f20bf4eb7dd
3
  size 111317164
train_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
- "epoch": 13.0,
3
- "total_flos": 3.972506461105029e+17,
4
- "train_loss": 0.8004542765347099,
5
- "train_runtime": 7158.591,
6
- "train_samples_per_second": 5.096,
7
- "train_steps_per_second": 0.159
8
  }
 
1
  {
2
+ "epoch": 16.0,
3
+ "total_flos": 4.889238721360036e+17,
4
+ "train_loss": 0.005142551405649436,
5
+ "train_runtime": 1686.6977,
6
+ "train_samples_per_second": 21.628,
7
+ "train_steps_per_second": 0.676
8
  }
trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
- "best_metric": 0.9939393939393939,
3
- "best_model_checkpoint": "convnext-tiny-224-finetuned-barkley\\checkpoint-418",
4
- "epoch": 13.0,
5
  "eval_steps": 500,
6
- "global_step": 494,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -334,13 +334,88 @@
334
  "step": 494
335
  },
336
  {
337
- "epoch": 13.0,
338
- "step": 494,
339
- "total_flos": 3.972506461105029e+17,
340
- "train_loss": 0.8004542765347099,
341
- "train_runtime": 7158.591,
342
- "train_samples_per_second": 5.096,
343
- "train_steps_per_second": 0.159
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
344
  }
345
  ],
346
  "logging_steps": 500,
@@ -369,7 +444,7 @@
369
  "attributes": {}
370
  }
371
  },
372
- "total_flos": 3.972506461105029e+17,
373
  "train_batch_size": 32,
374
  "trial_name": null,
375
  "trial_params": null
 
1
  {
2
+ "best_metric": 0.02658209018409252,
3
+ "best_model_checkpoint": "convnext-tiny-224-finetuned-barkley\\checkpoint-532",
4
+ "epoch": 16.0,
5
  "eval_steps": 500,
6
+ "global_step": 608,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
334
  "step": 494
335
  },
336
  {
337
+ "epoch": 14.0,
338
+ "train_accuracy": 0.9950657894736842
339
+ },
340
+ {
341
+ "epoch": 14.0,
342
+ "grad_norm": 0.6904532313346863,
343
+ "learning_rate": 1.9527753116224055e-05,
344
+ "loss": 0.0375,
345
+ "step": 532
346
+ },
347
+ {
348
+ "epoch": 14.0,
349
+ "eval_accuracy": 0.9939393939393939,
350
+ "eval_error_rate": 0.0060606060606061,
351
+ "eval_f1": 0.993419541966282,
352
+ "eval_loss": 0.02658209018409252,
353
+ "eval_precision": 0.9936145510835913,
354
+ "eval_recall": 0.993421052631579,
355
+ "eval_runtime": 52.868,
356
+ "eval_samples_per_second": 2.875,
357
+ "eval_steps_per_second": 0.095,
358
+ "eval_top1_accuracy": 0.993421052631579,
359
+ "step": 532
360
+ },
361
+ {
362
+ "epoch": 15.0,
363
+ "train_accuracy": 0.993421052631579
364
+ },
365
+ {
366
+ "epoch": 15.0,
367
+ "grad_norm": 1.3837875127792358,
368
+ "learning_rate": 1.911506206288264e-05,
369
+ "loss": 0.029,
370
+ "step": 570
371
+ },
372
+ {
373
+ "epoch": 15.0,
374
+ "eval_accuracy": 0.9939393939393939,
375
+ "eval_error_rate": 0.0060606060606061,
376
+ "eval_f1": 0.993419541966282,
377
+ "eval_loss": 0.03128606453537941,
378
+ "eval_precision": 0.9936145510835913,
379
+ "eval_recall": 0.993421052631579,
380
+ "eval_runtime": 52.6477,
381
+ "eval_samples_per_second": 2.887,
382
+ "eval_steps_per_second": 0.095,
383
+ "eval_top1_accuracy": 0.993421052631579,
384
+ "step": 570
385
+ },
386
+ {
387
+ "epoch": 16.0,
388
+ "train_accuracy": 0.9985380116959064
389
+ },
390
+ {
391
+ "epoch": 16.0,
392
+ "grad_norm": 2.590073823928833,
393
+ "learning_rate": 1.8565251293796298e-05,
394
+ "loss": 0.0158,
395
+ "step": 608
396
+ },
397
+ {
398
+ "epoch": 16.0,
399
+ "eval_accuracy": 0.9878787878787879,
400
+ "eval_error_rate": 0.012121212121212088,
401
+ "eval_f1": 0.9867362170674966,
402
+ "eval_loss": 0.04083804041147232,
403
+ "eval_precision": 0.9872349657566376,
404
+ "eval_recall": 0.9868421052631579,
405
+ "eval_runtime": 52.9598,
406
+ "eval_samples_per_second": 2.87,
407
+ "eval_steps_per_second": 0.094,
408
+ "eval_top1_accuracy": 0.9868421052631579,
409
+ "step": 608
410
+ },
411
+ {
412
+ "epoch": 16.0,
413
+ "step": 608,
414
+ "total_flos": 4.889238721360036e+17,
415
+ "train_loss": 0.005142551405649436,
416
+ "train_runtime": 1686.6977,
417
+ "train_samples_per_second": 21.628,
418
+ "train_steps_per_second": 0.676
419
  }
420
  ],
421
  "logging_steps": 500,
 
444
  "attributes": {}
445
  }
446
  },
447
+ "total_flos": 4.889238721360036e+17,
448
  "train_batch_size": 32,
449
  "trial_name": null,
450
  "trial_params": null
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b32c9a024fd0fe5d70f0247b1ad721619779776bf233e0e5351cdb8332e17696
3
  size 5176
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d1b57bacbaaf9003431d769cf77cb4ade538a6e4c81615d2dad23b4a752322a3
3
  size 5176