Melo1512 committed on
Commit
c8e29ba
·
verified ·
1 Parent(s): d8f0901

End of training

Browse files
README.md CHANGED
@@ -23,7 +23,7 @@ model-index:
23
  metrics:
24
  - name: Accuracy
25
  type: accuracy
26
- value: 0.7304832713754646
27
  ---
28
 
29
  <!-- This model card has been generated automatically according to the information the Trainer had access to. You
@@ -33,8 +33,8 @@ should probably proofread and complete it, then remove this comment. -->
33
 
34
  This model is a fine-tuned version of [facebook/vit-msn-small](https://huggingface.co/facebook/vit-msn-small) on the imagefolder dataset.
35
  It achieves the following results on the evaluation set:
36
- - Loss: 0.5725
37
- - Accuracy: 0.7305
38
 
39
  ## Model description
40
 
 
23
  metrics:
24
  - name: Accuracy
25
  type: accuracy
26
+ value: 0.8810408921933085
27
  ---
28
 
29
  <!-- This model card has been generated automatically according to the information the Trainer had access to. You
 
33
 
34
  This model is a fine-tuned version of [facebook/vit-msn-small](https://huggingface.co/facebook/vit-msn-small) on the imagefolder dataset.
35
  It achieves the following results on the evaluation set:
36
+ - Loss: 0.2823
37
+ - Accuracy: 0.8810
38
 
39
  ## Model description
40
 
all_results.json ADDED
@@ -0,0 +1,13 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 9.23076923076923,
3
+ "eval_accuracy": 0.8810408921933085,
4
+ "eval_loss": 0.28232070803642273,
5
+ "eval_runtime": 2.2781,
6
+ "eval_samples_per_second": 236.157,
7
+ "eval_steps_per_second": 3.951,
8
+ "total_flos": 2.915891733872517e+17,
9
+ "train_loss": 0.38718650341033933,
10
+ "train_runtime": 154.7877,
11
+ "train_samples_per_second": 104.207,
12
+ "train_steps_per_second": 0.388
13
+ }
eval_results.json ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 9.23076923076923,
3
+ "eval_accuracy": 0.8810408921933085,
4
+ "eval_loss": 0.28232070803642273,
5
+ "eval_runtime": 2.2781,
6
+ "eval_samples_per_second": 236.157,
7
+ "eval_steps_per_second": 3.951
8
+ }
runs/Jan15_17-47-09_c583982b4f3d/events.out.tfevents.1736963429.c583982b4f3d.215.14 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:306b2a042f385622c45a533a1583b001d603aa78d96f7f08f017fa7cb90ef877
3
+ size 405
train_results.json ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 9.23076923076923,
3
+ "total_flos": 2.915891733872517e+17,
4
+ "train_loss": 0.38718650341033933,
5
+ "train_runtime": 154.7877,
6
+ "train_samples_per_second": 104.207,
7
+ "train_steps_per_second": 0.388
8
+ }
trainer_state.json ADDED
@@ -0,0 +1,174 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_metric": 0.28232070803642273,
3
+ "best_model_checkpoint": "vit-msn-small-lateral_flow_ivalidation_green_test/checkpoint-13",
4
+ "epoch": 9.23076923076923,
5
+ "eval_steps": 500,
6
+ "global_step": 60,
7
+ "is_hyper_param_search": false,
8
+ "is_local_process_zero": true,
9
+ "is_world_process_zero": true,
10
+ "log_history": [
11
+ {
12
+ "epoch": 0.9230769230769231,
13
+ "eval_accuracy": 0.79182156133829,
14
+ "eval_loss": 0.4105704724788666,
15
+ "eval_runtime": 2.4272,
16
+ "eval_samples_per_second": 221.657,
17
+ "eval_steps_per_second": 3.708,
18
+ "step": 6
19
+ },
20
+ {
21
+ "epoch": 1.5384615384615383,
22
+ "grad_norm": 35.90373229980469,
23
+ "learning_rate": 4.62962962962963e-05,
24
+ "loss": 0.5328,
25
+ "step": 10
26
+ },
27
+ {
28
+ "epoch": 2.0,
29
+ "eval_accuracy": 0.8810408921933085,
30
+ "eval_loss": 0.28232070803642273,
31
+ "eval_runtime": 2.428,
32
+ "eval_samples_per_second": 221.579,
33
+ "eval_steps_per_second": 3.707,
34
+ "step": 13
35
+ },
36
+ {
37
+ "epoch": 2.9230769230769234,
38
+ "eval_accuracy": 0.8587360594795539,
39
+ "eval_loss": 0.3050999343395233,
40
+ "eval_runtime": 2.3639,
41
+ "eval_samples_per_second": 227.587,
42
+ "eval_steps_per_second": 3.807,
43
+ "step": 19
44
+ },
45
+ {
46
+ "epoch": 3.076923076923077,
47
+ "grad_norm": 7.078850269317627,
48
+ "learning_rate": 3.7037037037037037e-05,
49
+ "loss": 0.4244,
50
+ "step": 20
51
+ },
52
+ {
53
+ "epoch": 4.0,
54
+ "eval_accuracy": 0.8996282527881041,
55
+ "eval_loss": 0.2912784218788147,
56
+ "eval_runtime": 2.5552,
57
+ "eval_samples_per_second": 210.551,
58
+ "eval_steps_per_second": 3.522,
59
+ "step": 26
60
+ },
61
+ {
62
+ "epoch": 4.615384615384615,
63
+ "grad_norm": 7.146331310272217,
64
+ "learning_rate": 2.777777777777778e-05,
65
+ "loss": 0.3755,
66
+ "step": 30
67
+ },
68
+ {
69
+ "epoch": 4.923076923076923,
70
+ "eval_accuracy": 0.9052044609665427,
71
+ "eval_loss": 0.2840980887413025,
72
+ "eval_runtime": 2.4709,
73
+ "eval_samples_per_second": 217.734,
74
+ "eval_steps_per_second": 3.642,
75
+ "step": 32
76
+ },
77
+ {
78
+ "epoch": 6.0,
79
+ "eval_accuracy": 0.8828996282527881,
80
+ "eval_loss": 0.32043400406837463,
81
+ "eval_runtime": 2.4097,
82
+ "eval_samples_per_second": 223.265,
83
+ "eval_steps_per_second": 3.735,
84
+ "step": 39
85
+ },
86
+ {
87
+ "epoch": 6.153846153846154,
88
+ "grad_norm": 5.55441427230835,
89
+ "learning_rate": 1.8518518518518518e-05,
90
+ "loss": 0.3569,
91
+ "step": 40
92
+ },
93
+ {
94
+ "epoch": 6.923076923076923,
95
+ "eval_accuracy": 0.8810408921933085,
96
+ "eval_loss": 0.2981695532798767,
97
+ "eval_runtime": 2.3262,
98
+ "eval_samples_per_second": 231.282,
99
+ "eval_steps_per_second": 3.869,
100
+ "step": 45
101
+ },
102
+ {
103
+ "epoch": 7.6923076923076925,
104
+ "grad_norm": 4.577017784118652,
105
+ "learning_rate": 9.259259259259259e-06,
106
+ "loss": 0.3157,
107
+ "step": 50
108
+ },
109
+ {
110
+ "epoch": 8.0,
111
+ "eval_accuracy": 0.8643122676579925,
112
+ "eval_loss": 0.33173713088035583,
113
+ "eval_runtime": 2.3575,
114
+ "eval_samples_per_second": 228.205,
115
+ "eval_steps_per_second": 3.818,
116
+ "step": 52
117
+ },
118
+ {
119
+ "epoch": 8.923076923076923,
120
+ "eval_accuracy": 0.724907063197026,
121
+ "eval_loss": 0.5731077194213867,
122
+ "eval_runtime": 2.4282,
123
+ "eval_samples_per_second": 221.561,
124
+ "eval_steps_per_second": 3.706,
125
+ "step": 58
126
+ },
127
+ {
128
+ "epoch": 9.23076923076923,
129
+ "grad_norm": 6.767743110656738,
130
+ "learning_rate": 0.0,
131
+ "loss": 0.3177,
132
+ "step": 60
133
+ },
134
+ {
135
+ "epoch": 9.23076923076923,
136
+ "eval_accuracy": 0.7304832713754646,
137
+ "eval_loss": 0.5724764466285706,
138
+ "eval_runtime": 2.3931,
139
+ "eval_samples_per_second": 224.808,
140
+ "eval_steps_per_second": 3.761,
141
+ "step": 60
142
+ },
143
+ {
144
+ "epoch": 9.23076923076923,
145
+ "step": 60,
146
+ "total_flos": 2.915891733872517e+17,
147
+ "train_loss": 0.38718650341033933,
148
+ "train_runtime": 154.7877,
149
+ "train_samples_per_second": 104.207,
150
+ "train_steps_per_second": 0.388
151
+ }
152
+ ],
153
+ "logging_steps": 10,
154
+ "max_steps": 60,
155
+ "num_input_tokens_seen": 0,
156
+ "num_train_epochs": 10,
157
+ "save_steps": 500,
158
+ "stateful_callbacks": {
159
+ "TrainerControl": {
160
+ "args": {
161
+ "should_epoch_stop": false,
162
+ "should_evaluate": false,
163
+ "should_log": false,
164
+ "should_save": true,
165
+ "should_training_stop": true
166
+ },
167
+ "attributes": {}
168
+ }
169
+ },
170
+ "total_flos": 2.915891733872517e+17,
171
+ "train_batch_size": 64,
172
+ "trial_name": null,
173
+ "trial_params": null
174
+ }