ShruthiPV committed on
Commit
218e810
·
1 Parent(s): afe3762

Training in progress, epoch 0

Browse files
all_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "epoch": 3.23,
3
- "eval_accuracy": 0.8387096774193549,
4
- "eval_loss": 0.44136250019073486,
5
- "eval_runtime": 23.6897,
6
- "eval_samples_per_second": 6.543,
7
- "eval_steps_per_second": 0.844
8
  }
 
1
  {
2
  "epoch": 3.23,
3
+ "eval_accuracy": 0.8580645161290322,
4
+ "eval_loss": 0.4741174578666687,
5
+ "eval_runtime": 27.5301,
6
+ "eval_samples_per_second": 5.63,
7
+ "eval_steps_per_second": 0.726
8
  }
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:63ee08ce120c5566ac3e6e2ed9495176569bb89abcff2e7a07904c9b78d039e8
3
  size 345003509
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:412e0b49ea61a7b31947d243d149273bcac5c4480989cfcdccbda9d0f004661d
3
  size 345003509
runs/Jun12_14-38-12_dgx002/events.out.tfevents.1686574136.dgx002.65055.2 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ea15b0581d27e37369091a358bff9be8713a884cf7351d2fdc9d617361d35117
3
- size 363
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:12ad7548e7641bb20bd3a4c4064b8f9175c061f6a15aa57325ff4f6f4ed2d443
3
+ size 686
runs/Jun12_15-01-28_dgx002/1686574901.4763446/events.out.tfevents.1686574901.dgx002.69669.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cc4b78a7635fa3ab09c99118945543c06a8837024c8509f221c14fdcaa33f2d4
3
+ size 5883
runs/Jun12_15-01-28_dgx002/events.out.tfevents.1686574901.dgx002.69669.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bed0d250b345f4f19e7c214c007852b525a66ea84463d0070b2b60cc7e3177cd
3
+ size 5416
test_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "epoch": 3.23,
3
- "eval_accuracy": 0.8387096774193549,
4
- "eval_loss": 0.44136250019073486,
5
- "eval_runtime": 23.6897,
6
- "eval_samples_per_second": 6.543,
7
- "eval_steps_per_second": 0.844
8
  }
 
1
  {
2
  "epoch": 3.23,
3
+ "eval_accuracy": 0.8580645161290322,
4
+ "eval_loss": 0.4741174578666687,
5
+ "eval_runtime": 27.5301,
6
+ "eval_samples_per_second": 5.63,
7
+ "eval_steps_per_second": 0.726
8
  }
trainer_state.json CHANGED
@@ -1,6 +1,6 @@
1
  {
2
- "best_metric": 0.9142857142857143,
3
- "best_model_checkpoint": "videomae-base-finetuned-ucf101-subset/checkpoint-114",
4
  "epoch": 3.22972972972973,
5
  "global_step": 148,
6
  "is_hyper_param_search": false,
@@ -10,148 +10,148 @@
10
  {
11
  "epoch": 0.07,
12
  "learning_rate": 3.3333333333333335e-05,
13
- "loss": 2.2957,
14
  "step": 10
15
  },
16
  {
17
  "epoch": 0.14,
18
  "learning_rate": 4.81203007518797e-05,
19
- "loss": 2.1731,
20
  "step": 20
21
  },
22
  {
23
  "epoch": 0.2,
24
  "learning_rate": 4.43609022556391e-05,
25
- "loss": 2.046,
26
  "step": 30
27
  },
28
  {
29
  "epoch": 0.26,
30
- "eval_accuracy": 0.5285714285714286,
31
- "eval_loss": 1.6963216066360474,
32
- "eval_runtime": 10.977,
33
- "eval_samples_per_second": 6.377,
34
- "eval_steps_per_second": 0.82,
35
  "step": 38
36
  },
37
  {
38
  "epoch": 1.01,
39
  "learning_rate": 4.0601503759398494e-05,
40
- "loss": 1.8937,
41
  "step": 40
42
  },
43
  {
44
  "epoch": 1.08,
45
  "learning_rate": 3.6842105263157895e-05,
46
- "loss": 1.4425,
47
  "step": 50
48
  },
49
  {
50
  "epoch": 1.15,
51
  "learning_rate": 3.3082706766917295e-05,
52
- "loss": 1.1676,
53
  "step": 60
54
  },
55
  {
56
  "epoch": 1.22,
57
  "learning_rate": 2.9323308270676693e-05,
58
- "loss": 0.8324,
59
  "step": 70
60
  },
61
  {
62
  "epoch": 1.26,
63
- "eval_accuracy": 0.7714285714285715,
64
- "eval_loss": 0.7202897667884827,
65
- "eval_runtime": 12.3258,
66
- "eval_samples_per_second": 5.679,
67
- "eval_steps_per_second": 0.73,
68
  "step": 76
69
  },
70
  {
71
  "epoch": 2.03,
72
  "learning_rate": 2.556390977443609e-05,
73
- "loss": 0.8057,
74
  "step": 80
75
  },
76
  {
77
  "epoch": 2.09,
78
  "learning_rate": 2.1804511278195487e-05,
79
- "loss": 0.5698,
80
  "step": 90
81
  },
82
  {
83
  "epoch": 2.16,
84
  "learning_rate": 1.8045112781954888e-05,
85
- "loss": 0.5088,
86
  "step": 100
87
  },
88
  {
89
  "epoch": 2.23,
90
  "learning_rate": 1.4285714285714285e-05,
91
- "loss": 0.4576,
92
  "step": 110
93
  },
94
  {
95
  "epoch": 2.26,
96
- "eval_accuracy": 0.9142857142857143,
97
- "eval_loss": 0.40682417154312134,
98
- "eval_runtime": 11.5894,
99
- "eval_samples_per_second": 6.04,
100
- "eval_steps_per_second": 0.777,
101
  "step": 114
102
  },
103
  {
104
  "epoch": 3.04,
105
  "learning_rate": 1.0526315789473684e-05,
106
- "loss": 0.2856,
107
  "step": 120
108
  },
109
  {
110
  "epoch": 3.11,
111
  "learning_rate": 6.766917293233083e-06,
112
- "loss": 0.2348,
113
  "step": 130
114
  },
115
  {
116
  "epoch": 3.18,
117
  "learning_rate": 3.007518796992481e-06,
118
- "loss": 0.2632,
119
  "step": 140
120
  },
121
  {
122
  "epoch": 3.23,
123
  "eval_accuracy": 0.8714285714285714,
124
- "eval_loss": 0.33855465054512024,
125
- "eval_runtime": 11.4954,
126
- "eval_samples_per_second": 6.089,
127
- "eval_steps_per_second": 0.783,
128
  "step": 148
129
  },
130
  {
131
  "epoch": 3.23,
132
  "step": 148,
133
  "total_flos": 1.460491890402263e+18,
134
- "train_loss": 1.024867109350256,
135
- "train_runtime": 599.0938,
136
- "train_samples_per_second": 1.976,
137
- "train_steps_per_second": 0.247
138
  },
139
  {
140
  "epoch": 3.23,
141
- "eval_accuracy": 0.8387096774193549,
142
- "eval_loss": 0.4413624405860901,
143
- "eval_runtime": 26.0793,
144
- "eval_samples_per_second": 5.943,
145
- "eval_steps_per_second": 0.767,
146
  "step": 148
147
  },
148
  {
149
  "epoch": 3.23,
150
- "eval_accuracy": 0.8387096774193549,
151
- "eval_loss": 0.44136250019073486,
152
- "eval_runtime": 23.6897,
153
- "eval_samples_per_second": 6.543,
154
- "eval_steps_per_second": 0.844,
155
  "step": 148
156
  }
157
  ],
 
1
  {
2
+ "best_metric": 0.8714285714285714,
3
+ "best_model_checkpoint": "videomae-base-finetuned-ucf101-subset/checkpoint-148",
4
  "epoch": 3.22972972972973,
5
  "global_step": 148,
6
  "is_hyper_param_search": false,
 
10
  {
11
  "epoch": 0.07,
12
  "learning_rate": 3.3333333333333335e-05,
13
+ "loss": 2.3,
14
  "step": 10
15
  },
16
  {
17
  "epoch": 0.14,
18
  "learning_rate": 4.81203007518797e-05,
19
+ "loss": 2.1696,
20
  "step": 20
21
  },
22
  {
23
  "epoch": 0.2,
24
  "learning_rate": 4.43609022556391e-05,
25
+ "loss": 2.1374,
26
  "step": 30
27
  },
28
  {
29
  "epoch": 0.26,
30
+ "eval_accuracy": 0.4142857142857143,
31
+ "eval_loss": 1.831816554069519,
32
+ "eval_runtime": 11.4195,
33
+ "eval_samples_per_second": 6.13,
34
+ "eval_steps_per_second": 0.788,
35
  "step": 38
36
  },
37
  {
38
  "epoch": 1.01,
39
  "learning_rate": 4.0601503759398494e-05,
40
+ "loss": 1.9867,
41
  "step": 40
42
  },
43
  {
44
  "epoch": 1.08,
45
  "learning_rate": 3.6842105263157895e-05,
46
+ "loss": 1.4944,
47
  "step": 50
48
  },
49
  {
50
  "epoch": 1.15,
51
  "learning_rate": 3.3082706766917295e-05,
52
+ "loss": 1.2525,
53
  "step": 60
54
  },
55
  {
56
  "epoch": 1.22,
57
  "learning_rate": 2.9323308270676693e-05,
58
+ "loss": 0.9554,
59
  "step": 70
60
  },
61
  {
62
  "epoch": 1.26,
63
+ "eval_accuracy": 0.6428571428571429,
64
+ "eval_loss": 1.0205751657485962,
65
+ "eval_runtime": 11.6614,
66
+ "eval_samples_per_second": 6.003,
67
+ "eval_steps_per_second": 0.772,
68
  "step": 76
69
  },
70
  {
71
  "epoch": 2.03,
72
  "learning_rate": 2.556390977443609e-05,
73
+ "loss": 0.8545,
74
  "step": 80
75
  },
76
  {
77
  "epoch": 2.09,
78
  "learning_rate": 2.1804511278195487e-05,
79
+ "loss": 0.6184,
80
  "step": 90
81
  },
82
  {
83
  "epoch": 2.16,
84
  "learning_rate": 1.8045112781954888e-05,
85
+ "loss": 0.6031,
86
  "step": 100
87
  },
88
  {
89
  "epoch": 2.23,
90
  "learning_rate": 1.4285714285714285e-05,
91
+ "loss": 0.4549,
92
  "step": 110
93
  },
94
  {
95
  "epoch": 2.26,
96
+ "eval_accuracy": 0.8428571428571429,
97
+ "eval_loss": 0.5566275715827942,
98
+ "eval_runtime": 10.0032,
99
+ "eval_samples_per_second": 6.998,
100
+ "eval_steps_per_second": 0.9,
101
  "step": 114
102
  },
103
  {
104
  "epoch": 3.04,
105
  "learning_rate": 1.0526315789473684e-05,
106
+ "loss": 0.3658,
107
  "step": 120
108
  },
109
  {
110
  "epoch": 3.11,
111
  "learning_rate": 6.766917293233083e-06,
112
+ "loss": 0.2797,
113
  "step": 130
114
  },
115
  {
116
  "epoch": 3.18,
117
  "learning_rate": 3.007518796992481e-06,
118
+ "loss": 0.3045,
119
  "step": 140
120
  },
121
  {
122
  "epoch": 3.23,
123
  "eval_accuracy": 0.8714285714285714,
124
+ "eval_loss": 0.46514713764190674,
125
+ "eval_runtime": 11.0086,
126
+ "eval_samples_per_second": 6.359,
127
+ "eval_steps_per_second": 0.818,
128
  "step": 148
129
  },
130
  {
131
  "epoch": 3.23,
132
  "step": 148,
133
  "total_flos": 1.460491890402263e+18,
134
+ "train_loss": 1.079887928189458,
135
+ "train_runtime": 604.0644,
136
+ "train_samples_per_second": 1.96,
137
+ "train_steps_per_second": 0.245
138
  },
139
  {
140
  "epoch": 3.23,
141
+ "eval_accuracy": 0.8580645161290322,
142
+ "eval_loss": 0.4741174578666687,
143
+ "eval_runtime": 28.7326,
144
+ "eval_samples_per_second": 5.395,
145
+ "eval_steps_per_second": 0.696,
146
  "step": 148
147
  },
148
  {
149
  "epoch": 3.23,
150
+ "eval_accuracy": 0.8580645161290322,
151
+ "eval_loss": 0.4741174578666687,
152
+ "eval_runtime": 27.5301,
153
+ "eval_samples_per_second": 5.63,
154
+ "eval_steps_per_second": 0.726,
155
  "step": 148
156
  }
157
  ],
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:962862fdf4513cbd5fb5621011b496dc0107d57aa60f4cdb2a4bde5eb28cc1ab
3
  size 3643
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0cacf5b5fdd1a5a07663d19e16b9613a85eb1c73ff99eac8490bec2296bb9dfd
3
  size 3643