Shawon16 committed on
Commit
0a1377b
·
verified ·
1 Parent(s): 8539167

End of training

Browse files
README.md CHANGED
@@ -18,8 +18,8 @@ should probably proofread and complete it, then remove this comment. -->
18
 
19
  This model is a fine-tuned version of [facebook/timesformer-base-finetuned-k400](https://huggingface.co/facebook/timesformer-base-finetuned-k400) on an unknown dataset.
20
  It achieves the following results on the evaluation set:
21
- - Loss: 0.8131
22
- - Accuracy: 0.7849
23
 
24
  ## Model description
25
 
@@ -45,13 +45,14 @@ The following hyperparameters were used during training:
45
  - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
46
  - lr_scheduler_type: linear
47
  - lr_scheduler_warmup_ratio: 0.1
48
- - training_steps: 101
49
 
50
  ### Training results
51
 
52
  | Training Loss | Epoch | Step | Validation Loss | Accuracy |
53
  |:-------------:|:-----:|:----:|:---------------:|:--------:|
54
- | 0.8303 | 1.0 | 101 | 0.1456 | 0.9902 |
 
55
 
56
 
57
  ### Framework versions
 
18
 
19
  This model is a fine-tuned version of [facebook/timesformer-base-finetuned-k400](https://huggingface.co/facebook/timesformer-base-finetuned-k400) on an unknown dataset.
20
  It achieves the following results on the evaluation set:
21
+ - Loss: 0.7582
22
+ - Accuracy: 0.7928
23
 
24
  ## Model description
25
 
 
45
  - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
46
  - lr_scheduler_type: linear
47
  - lr_scheduler_warmup_ratio: 0.1
48
+ - training_steps: 366
49
 
50
  ### Training results
51
 
52
  | Training Loss | Epoch | Step | Validation Loss | Accuracy |
53
  |:-------------:|:-----:|:----:|:---------------:|:--------:|
54
+ | 1.0449 | 0.5 | 183 | 0.0172 | 0.9939 |
55
+ | 0.0056 | 1.5 | 366 | 0.0024 | 1.0 |
56
 
57
 
58
  ### Framework versions
all_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
- "epoch": 1.0,
3
- "eval_accuracy": 0.7848605577689243,
4
- "eval_loss": 0.8131076693534851,
5
- "eval_runtime": 82.7652,
6
- "eval_samples_per_second": 3.033,
7
- "eval_steps_per_second": 0.387
8
  }
 
1
  {
2
+ "epoch": 1.5,
3
+ "eval_accuracy": 0.7928286852589641,
4
+ "eval_loss": 0.758155345916748,
5
+ "eval_runtime": 81.0092,
6
+ "eval_samples_per_second": 3.098,
7
+ "eval_steps_per_second": 0.395
8
  }
confusion_matrix_kfold_fold_1.png CHANGED
confusion_matrix_test_fold_1.png CHANGED
confusion_matrix_trainfold_fold_1.png CHANGED
test_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
- "epoch": 1.0,
3
- "eval_accuracy": 0.7848605577689243,
4
- "eval_loss": 0.8131076693534851,
5
- "eval_runtime": 82.7652,
6
- "eval_samples_per_second": 3.033,
7
- "eval_steps_per_second": 0.387
8
  }
 
1
  {
2
+ "epoch": 1.5,
3
+ "eval_accuracy": 0.7928286852589641,
4
+ "eval_loss": 0.758155345916748,
5
+ "eval_runtime": 81.0092,
6
+ "eval_samples_per_second": 3.098,
7
+ "eval_steps_per_second": 0.395
8
  }
trainer_state.json CHANGED
@@ -1,50 +1,73 @@
1
  {
2
- "best_metric": 0.990159901599016,
3
- "best_model_checkpoint": "/media/cse/HDD/Shawon/shawon/10 fold timesformer/Timesformer_default_fold_10_10_epoch_noAug_batch8_codecheck/checkpoint-101",
4
- "epoch": 1.0,
5
  "eval_steps": 500,
6
- "global_step": 101,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
11
  {
12
- "epoch": 0.9900990099009901,
13
- "grad_norm": 7.038530349731445,
14
- "learning_rate": 5.555555555555556e-07,
15
- "loss": 0.8303,
16
  "step": 100
17
  },
18
  {
19
- "epoch": 1.0,
20
- "eval_accuracy": 0.990159901599016,
21
- "eval_loss": 0.14564795792102814,
22
- "eval_runtime": 267.0652,
23
- "eval_samples_per_second": 3.044,
24
- "eval_steps_per_second": 0.382,
25
- "step": 101
26
  },
27
  {
28
- "epoch": 1.0,
29
- "step": 101,
30
- "total_flos": 7.07971920321577e+17,
31
- "train_loss": 0.8236100951043686,
32
- "train_runtime": 621.4991,
33
- "train_samples_per_second": 1.3,
34
- "train_steps_per_second": 0.163
35
  },
36
  {
37
- "epoch": 1.0,
38
- "eval_accuracy": 0.7848605577689243,
39
- "eval_loss": 0.8131076693534851,
40
- "eval_runtime": 82.7652,
41
- "eval_samples_per_second": 3.033,
42
- "eval_steps_per_second": 0.387,
43
- "step": 101
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
44
  }
45
  ],
46
  "logging_steps": 100,
47
- "max_steps": 101,
48
  "num_input_tokens_seen": 0,
49
  "num_train_epochs": 9223372036854775807,
50
  "save_steps": 500,
@@ -60,7 +83,7 @@
60
  "attributes": {}
61
  }
62
  },
63
- "total_flos": 7.07971920321577e+17,
64
  "train_batch_size": 8,
65
  "trial_name": null,
66
  "trial_params": null
 
1
  {
2
+ "best_metric": 1.0,
3
+ "best_model_checkpoint": "/media/cse/HDD/Shawon/shawon/10 fold timesformer/Timesformer_default_fold_10_10_epoch_noAug_batch8_codecheck/checkpoint-366",
4
+ "epoch": 1.5,
5
  "eval_steps": 500,
6
+ "global_step": 366,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
11
  {
12
+ "epoch": 0.273224043715847,
13
+ "grad_norm": 3.3262431621551514,
14
+ "learning_rate": 4.0425531914893614e-05,
15
+ "loss": 1.0449,
16
  "step": 100
17
  },
18
  {
19
+ "epoch": 0.5,
20
+ "eval_accuracy": 0.9938650306748467,
21
+ "eval_loss": 0.017213916406035423,
22
+ "eval_runtime": 55.9924,
23
+ "eval_samples_per_second": 2.911,
24
+ "eval_steps_per_second": 0.375,
25
+ "step": 183
26
  },
27
  {
28
+ "epoch": 1.046448087431694,
29
+ "grad_norm": 0.36886924505233765,
30
+ "learning_rate": 2.5227963525835867e-05,
31
+ "loss": 0.038,
32
+ "step": 200
 
 
33
  },
34
  {
35
+ "epoch": 1.319672131147541,
36
+ "grad_norm": 0.04929419606924057,
37
+ "learning_rate": 1.0030395136778116e-05,
38
+ "loss": 0.0056,
39
+ "step": 300
40
+ },
41
+ {
42
+ "epoch": 1.5,
43
+ "eval_accuracy": 1.0,
44
+ "eval_loss": 0.0024167420342564583,
45
+ "eval_runtime": 62.5343,
46
+ "eval_samples_per_second": 2.607,
47
+ "eval_steps_per_second": 0.336,
48
+ "step": 366
49
+ },
50
+ {
51
+ "epoch": 1.5,
52
+ "step": 366,
53
+ "total_flos": 2.5655220082940314e+18,
54
+ "train_loss": 0.2977769932623118,
55
+ "train_runtime": 1336.9205,
56
+ "train_samples_per_second": 2.19,
57
+ "train_steps_per_second": 0.274
58
+ },
59
+ {
60
+ "epoch": 1.5,
61
+ "eval_accuracy": 0.7928286852589641,
62
+ "eval_loss": 0.758155345916748,
63
+ "eval_runtime": 81.0092,
64
+ "eval_samples_per_second": 3.098,
65
+ "eval_steps_per_second": 0.395,
66
+ "step": 366
67
  }
68
  ],
69
  "logging_steps": 100,
70
+ "max_steps": 366,
71
  "num_input_tokens_seen": 0,
72
  "num_train_epochs": 9223372036854775807,
73
  "save_steps": 500,
 
83
  "attributes": {}
84
  }
85
  },
86
+ "total_flos": 2.5655220082940314e+18,
87
  "train_batch_size": 8,
88
  "trial_name": null,
89
  "trial_params": null