BeckerAnas commited on
Commit
d7c14a4
·
verified ·
1 Parent(s): b85ca70

End of training

Browse files
README.md CHANGED
@@ -18,8 +18,8 @@ should probably proofread and complete it, then remove this comment. -->
18
 
19
  This model is a fine-tuned version of [facebook/convnext-tiny-224](https://huggingface.co/facebook/convnext-tiny-224) on an unknown dataset.
20
  It achieves the following results on the evaluation set:
21
- - Loss: 0.8437
22
- - Accuracy: 0.5488
23
 
24
  ## Model description
25
 
 
18
 
19
  This model is a fine-tuned version of [facebook/convnext-tiny-224](https://huggingface.co/facebook/convnext-tiny-224) on an unknown dataset.
20
  It achieves the following results on the evaluation set:
21
+ - Loss: 0.8995
22
+ - Accuracy: 0.5602
23
 
24
  ## Model description
25
 
all_results.json ADDED
@@ -0,0 +1,13 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 3.0,
3
+ "eval_accuracy": 0.56015625,
4
+ "eval_loss": 0.8994671702384949,
5
+ "eval_runtime": 8.7552,
6
+ "eval_samples_per_second": 146.2,
7
+ "eval_steps_per_second": 4.569,
8
+ "total_flos": 3.473836763020001e+17,
9
+ "train_loss": 0.9776477946175469,
10
+ "train_runtime": 256.1822,
11
+ "train_samples_per_second": 53.962,
12
+ "train_steps_per_second": 0.422
13
+ }
eval_results.json ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 3.0,
3
+ "eval_accuracy": 0.55078125,
4
+ "eval_loss": 0.8595054745674133,
5
+ "eval_runtime": 3.0351,
6
+ "eval_samples_per_second": 168.691,
7
+ "eval_steps_per_second": 5.272
8
+ }
runs/May23_08-53-52_68351e6ded98/events.out.tfevents.1747990783.68351e6ded98.10093.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:064d7d47f81ea56ead27f9db170d73247ba84808f46208a9cec5c97ecc6af65c
3
+ size 722
test_results.json ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 3.0,
3
+ "eval_accuracy": 0.56015625,
4
+ "eval_loss": 0.8994671702384949,
5
+ "eval_runtime": 8.7552,
6
+ "eval_samples_per_second": 146.2,
7
+ "eval_steps_per_second": 4.569
8
+ }
train_results.json ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 3.0,
3
+ "total_flos": 3.473836763020001e+17,
4
+ "train_loss": 0.9776477946175469,
5
+ "train_runtime": 256.1822,
6
+ "train_samples_per_second": 53.962,
7
+ "train_steps_per_second": 0.422
8
+ }
trainer_state.json ADDED
@@ -0,0 +1,140 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_global_step": 72,
3
+ "best_metric": 0.55078125,
4
+ "best_model_checkpoint": "convnext-tiny-224-finetuned-alzheimer-MRI/checkpoint-72",
5
+ "epoch": 3.0,
6
+ "eval_steps": 500,
7
+ "global_step": 108,
8
+ "is_hyper_param_search": false,
9
+ "is_local_process_zero": true,
10
+ "is_world_process_zero": true,
11
+ "log_history": [
12
+ {
13
+ "epoch": 0.2777777777777778,
14
+ "grad_norm": 2.0088706016540527,
15
+ "learning_rate": 4.0909090909090915e-05,
16
+ "loss": 1.3197,
17
+ "step": 10
18
+ },
19
+ {
20
+ "epoch": 0.5555555555555556,
21
+ "grad_norm": 2.71425199508667,
22
+ "learning_rate": 4.5876288659793814e-05,
23
+ "loss": 1.1091,
24
+ "step": 20
25
+ },
26
+ {
27
+ "epoch": 0.8333333333333334,
28
+ "grad_norm": 1.3623636960983276,
29
+ "learning_rate": 4.0721649484536084e-05,
30
+ "loss": 1.0151,
31
+ "step": 30
32
+ },
33
+ {
34
+ "epoch": 1.0,
35
+ "eval_accuracy": 0.5390625,
36
+ "eval_loss": 0.9395096302032471,
37
+ "eval_runtime": 3.0069,
38
+ "eval_samples_per_second": 170.276,
39
+ "eval_steps_per_second": 5.321,
40
+ "step": 36
41
+ },
42
+ {
43
+ "epoch": 1.1111111111111112,
44
+ "grad_norm": 1.7469203472137451,
45
+ "learning_rate": 3.5567010309278354e-05,
46
+ "loss": 0.9697,
47
+ "step": 40
48
+ },
49
+ {
50
+ "epoch": 1.3888888888888888,
51
+ "grad_norm": 1.5095868110656738,
52
+ "learning_rate": 3.0412371134020617e-05,
53
+ "loss": 0.9514,
54
+ "step": 50
55
+ },
56
+ {
57
+ "epoch": 1.6666666666666665,
58
+ "grad_norm": 4.194490432739258,
59
+ "learning_rate": 2.5257731958762887e-05,
60
+ "loss": 0.9032,
61
+ "step": 60
62
+ },
63
+ {
64
+ "epoch": 1.9444444444444444,
65
+ "grad_norm": 2.88313889503479,
66
+ "learning_rate": 2.0103092783505157e-05,
67
+ "loss": 0.9132,
68
+ "step": 70
69
+ },
70
+ {
71
+ "epoch": 2.0,
72
+ "eval_accuracy": 0.55078125,
73
+ "eval_loss": 0.8595054745674133,
74
+ "eval_runtime": 2.9709,
75
+ "eval_samples_per_second": 172.338,
76
+ "eval_steps_per_second": 5.386,
77
+ "step": 72
78
+ },
79
+ {
80
+ "epoch": 2.2222222222222223,
81
+ "grad_norm": 2.767746686935425,
82
+ "learning_rate": 1.4948453608247423e-05,
83
+ "loss": 0.9126,
84
+ "step": 80
85
+ },
86
+ {
87
+ "epoch": 2.5,
88
+ "grad_norm": 3.7601568698883057,
89
+ "learning_rate": 9.793814432989691e-06,
90
+ "loss": 0.884,
91
+ "step": 90
92
+ },
93
+ {
94
+ "epoch": 2.7777777777777777,
95
+ "grad_norm": 3.920647382736206,
96
+ "learning_rate": 4.639175257731959e-06,
97
+ "loss": 0.876,
98
+ "step": 100
99
+ },
100
+ {
101
+ "epoch": 3.0,
102
+ "eval_accuracy": 0.548828125,
103
+ "eval_loss": 0.8436535596847534,
104
+ "eval_runtime": 2.9884,
105
+ "eval_samples_per_second": 171.329,
106
+ "eval_steps_per_second": 5.354,
107
+ "step": 108
108
+ },
109
+ {
110
+ "epoch": 3.0,
111
+ "step": 108,
112
+ "total_flos": 3.473836763020001e+17,
113
+ "train_loss": 0.9776477946175469,
114
+ "train_runtime": 256.1822,
115
+ "train_samples_per_second": 53.962,
116
+ "train_steps_per_second": 0.422
117
+ }
118
+ ],
119
+ "logging_steps": 10,
120
+ "max_steps": 108,
121
+ "num_input_tokens_seen": 0,
122
+ "num_train_epochs": 3,
123
+ "save_steps": 500,
124
+ "stateful_callbacks": {
125
+ "TrainerControl": {
126
+ "args": {
127
+ "should_epoch_stop": false,
128
+ "should_evaluate": false,
129
+ "should_log": false,
130
+ "should_save": true,
131
+ "should_training_stop": true
132
+ },
133
+ "attributes": {}
134
+ }
135
+ },
136
+ "total_flos": 3.473836763020001e+17,
137
+ "train_batch_size": 32,
138
+ "trial_name": null,
139
+ "trial_params": null
140
+ }