Shawon16 committed on
Commit
1e3228b
·
verified ·
1 Parent(s): f275ad2

End of training

Browse files
README.md CHANGED
@@ -18,8 +18,8 @@ should probably proofread and complete it, then remove this comment. -->
18
 
19
  This model is a fine-tuned version of [facebook/timesformer-base-finetuned-k400](https://huggingface.co/facebook/timesformer-base-finetuned-k400) on an unknown dataset.
20
  It achieves the following results on the evaluation set:
21
- - Loss: 0.5098
22
- - Accuracy: 0.8367
23
 
24
  ## Model description
25
 
@@ -45,14 +45,13 @@ The following hyperparameters were used during training:
45
  - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
46
  - lr_scheduler_type: linear
47
  - lr_scheduler_warmup_ratio: 0.1
48
- - training_steps: 366
49
 
50
  ### Training results
51
 
52
- | Training Loss | Epoch | Step | Validation Loss | Accuracy |
53
- |:-------------:|:------:|:----:|:---------------:|:--------:|
54
- | 1.0933 | 0.5027 | 184 | 0.0142 | 1.0 |
55
- | 0.011 | 1.4973 | 366 | 0.0109 | 0.9938 |
56
 
57
 
58
  ### Framework versions
 
18
 
19
  This model is a fine-tuned version of [facebook/timesformer-base-finetuned-k400](https://huggingface.co/facebook/timesformer-base-finetuned-k400) on an unknown dataset.
20
  It achieves the following results on the evaluation set:
21
+ - Loss: 0.9561
22
+ - Accuracy: 0.6773
23
 
24
  ## Model description
25
 
 
45
  - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
46
  - lr_scheduler_type: linear
47
  - lr_scheduler_warmup_ratio: 0.1
48
+ - training_steps: 101
49
 
50
  ### Training results
51
 
52
+ | Training Loss | Epoch | Step | Validation Loss | Accuracy |
53
+ |:-------------:|:-----:|:----:|:---------------:|:--------:|
54
+ | 0.8886 | 1.0 | 101 | 0.1661 | 0.9828 |
 
55
 
56
 
57
  ### Framework versions
all_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
- "epoch": 1.4972677595628414,
3
- "eval_accuracy": 0.8366533864541833,
4
- "eval_loss": 0.5097954869270325,
5
- "eval_runtime": 56.3553,
6
- "eval_samples_per_second": 4.454,
7
- "eval_steps_per_second": 0.568
8
  }
 
1
  {
2
+ "epoch": 1.0,
3
+ "eval_accuracy": 0.6772908366533864,
4
+ "eval_loss": 0.9560578465461731,
5
+ "eval_runtime": 55.4125,
6
+ "eval_samples_per_second": 4.53,
7
+ "eval_steps_per_second": 0.577
8
  }
confusion_matrix_kfold_fold_1.png CHANGED
confusion_matrix_test_fold_1.png CHANGED
confusion_matrix_trainfold_fold_1.png CHANGED
test_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
- "epoch": 1.4972677595628414,
3
- "eval_accuracy": 0.8366533864541833,
4
- "eval_loss": 0.5097954869270325,
5
- "eval_runtime": 56.3553,
6
- "eval_samples_per_second": 4.454,
7
- "eval_steps_per_second": 0.568
8
  }
 
1
  {
2
+ "epoch": 1.0,
3
+ "eval_accuracy": 0.6772908366533864,
4
+ "eval_loss": 0.9560578465461731,
5
+ "eval_runtime": 55.4125,
6
+ "eval_samples_per_second": 4.53,
7
+ "eval_steps_per_second": 0.577
8
  }
trainer_state.json CHANGED
@@ -1,73 +1,50 @@
1
  {
2
- "best_metric": 1.0,
3
- "best_model_checkpoint": "/media/cse/HDD/Shawon/shawon/10 fold timesformer/Timesformer_default_fold_10_10_epoch_noAug_batch8_codecheck/checkpoint-184",
4
- "epoch": 1.4972677595628414,
5
  "eval_steps": 500,
6
- "global_step": 366,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
11
  {
12
- "epoch": 0.273224043715847,
13
- "grad_norm": 2.266233444213867,
14
- "learning_rate": 4.0425531914893614e-05,
15
- "loss": 1.0933,
16
  "step": 100
17
  },
18
  {
19
- "epoch": 0.5027322404371585,
20
- "eval_accuracy": 1.0,
21
- "eval_loss": 0.014155284501612186,
22
- "eval_runtime": 37.8295,
23
- "eval_samples_per_second": 4.282,
24
- "eval_steps_per_second": 0.555,
25
- "step": 184
26
  },
27
  {
28
- "epoch": 1.0437158469945356,
29
- "grad_norm": 0.3162294626235962,
30
- "learning_rate": 2.5227963525835867e-05,
31
- "loss": 0.0458,
32
- "step": 200
 
 
33
  },
34
  {
35
- "epoch": 1.3169398907103824,
36
- "grad_norm": 0.509850263595581,
37
- "learning_rate": 1.0030395136778116e-05,
38
- "loss": 0.011,
39
- "step": 300
40
- },
41
- {
42
- "epoch": 1.4972677595628414,
43
- "eval_accuracy": 0.9938271604938271,
44
- "eval_loss": 0.010920087806880474,
45
- "eval_runtime": 38.0242,
46
- "eval_samples_per_second": 4.26,
47
- "eval_steps_per_second": 0.552,
48
- "step": 366
49
- },
50
- {
51
- "epoch": 1.4972677595628414,
52
- "step": 366,
53
- "total_flos": 2.5593885881922355e+18,
54
- "train_loss": 0.3163567338484884,
55
- "train_runtime": 953.4888,
56
- "train_samples_per_second": 3.071,
57
- "train_steps_per_second": 0.384
58
- },
59
- {
60
- "epoch": 1.4972677595628414,
61
- "eval_accuracy": 0.8366533864541833,
62
- "eval_loss": 0.5097954869270325,
63
- "eval_runtime": 56.3553,
64
- "eval_samples_per_second": 4.454,
65
- "eval_steps_per_second": 0.568,
66
- "step": 366
67
  }
68
  ],
69
  "logging_steps": 100,
70
- "max_steps": 366,
71
  "num_input_tokens_seen": 0,
72
  "num_train_epochs": 9223372036854775807,
73
  "save_steps": 500,
@@ -83,7 +60,7 @@
83
  "attributes": {}
84
  }
85
  },
86
- "total_flos": 2.5593885881922355e+18,
87
  "train_batch_size": 8,
88
  "trial_name": null,
89
  "trial_params": null
 
1
  {
2
+ "best_metric": 0.9828009828009828,
3
+ "best_model_checkpoint": "/media/cse/HDD/Shawon/shawon/10 fold timesformer/Timesformer_default_fold_10_10_epoch_noAug_batch8_codecheck/checkpoint-101",
4
+ "epoch": 1.0,
5
  "eval_steps": 500,
6
+ "global_step": 101,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
11
  {
12
+ "epoch": 0.9900990099009901,
13
+ "grad_norm": 2.9471566677093506,
14
+ "learning_rate": 5.555555555555556e-07,
15
+ "loss": 0.8886,
16
  "step": 100
17
  },
18
  {
19
+ "epoch": 1.0,
20
+ "eval_accuracy": 0.9828009828009828,
21
+ "eval_loss": 0.16609854996204376,
22
+ "eval_runtime": 202.8409,
23
+ "eval_samples_per_second": 4.013,
24
+ "eval_steps_per_second": 0.503,
25
+ "step": 101
26
  },
27
  {
28
+ "epoch": 1.0,
29
+ "step": 101,
30
+ "total_flos": 7.07971920321577e+17,
31
+ "train_loss": 0.8806298740281917,
32
+ "train_runtime": 488.3542,
33
+ "train_samples_per_second": 1.655,
34
+ "train_steps_per_second": 0.207
35
  },
36
  {
37
+ "epoch": 1.0,
38
+ "eval_accuracy": 0.6772908366533864,
39
+ "eval_loss": 0.9560578465461731,
40
+ "eval_runtime": 55.4125,
41
+ "eval_samples_per_second": 4.53,
42
+ "eval_steps_per_second": 0.577,
43
+ "step": 101
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
44
  }
45
  ],
46
  "logging_steps": 100,
47
+ "max_steps": 101,
48
  "num_input_tokens_seen": 0,
49
  "num_train_epochs": 9223372036854775807,
50
  "save_steps": 500,
 
60
  "attributes": {}
61
  }
62
  },
63
+ "total_flos": 7.07971920321577e+17,
64
  "train_batch_size": 8,
65
  "trial_name": null,
66
  "trial_params": null