justin1983 committed on
Commit
dfa31e8
·
1 Parent(s): 9916253

Training in progress, epoch 1

Browse files
config.json CHANGED
@@ -58,11 +58,13 @@
58
  "id2label": {
59
  "0": "human",
60
  "1": "machine",
61
- "2": "not_sure"
 
62
  },
63
  "initializer_range": 0.02,
64
  "intermediate_size": 3072,
65
  "label2id": {
 
66
  "human": "0",
67
  "machine": "1",
68
  "not_sure": "2"
 
58
  "id2label": {
59
  "0": "human",
60
  "1": "machine",
61
+ "2": "not_sure",
62
+ "3": "bot"
63
  },
64
  "initializer_range": 0.02,
65
  "intermediate_size": 3072,
66
  "label2id": {
67
+ "bot": "3",
68
  "human": "0",
69
  "machine": "1",
70
  "not_sure": "2"
last-checkpoint/config.json ADDED
@@ -0,0 +1,129 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "facebook/wav2vec2-base",
3
+ "activation_dropout": 0.0,
4
+ "adapter_kernel_size": 3,
5
+ "adapter_stride": 2,
6
+ "add_adapter": false,
7
+ "apply_spec_augment": true,
8
+ "architectures": [
9
+ "Wav2Vec2ForSequenceClassification"
10
+ ],
11
+ "attention_dropout": 0.1,
12
+ "bos_token_id": 1,
13
+ "classifier_proj_size": 256,
14
+ "codevector_dim": 256,
15
+ "contrastive_logits_temperature": 0.1,
16
+ "conv_bias": false,
17
+ "conv_dim": [
18
+ 512,
19
+ 512,
20
+ 512,
21
+ 512,
22
+ 512,
23
+ 512,
24
+ 512
25
+ ],
26
+ "conv_kernel": [
27
+ 10,
28
+ 3,
29
+ 3,
30
+ 3,
31
+ 3,
32
+ 2,
33
+ 2
34
+ ],
35
+ "conv_stride": [
36
+ 5,
37
+ 2,
38
+ 2,
39
+ 2,
40
+ 2,
41
+ 2,
42
+ 2
43
+ ],
44
+ "ctc_loss_reduction": "sum",
45
+ "ctc_zero_infinity": false,
46
+ "diversity_loss_weight": 0.1,
47
+ "do_stable_layer_norm": false,
48
+ "eos_token_id": 2,
49
+ "feat_extract_activation": "gelu",
50
+ "feat_extract_norm": "group",
51
+ "feat_proj_dropout": 0.1,
52
+ "feat_quantizer_dropout": 0.0,
53
+ "final_dropout": 0.0,
54
+ "freeze_feat_extract_train": true,
55
+ "hidden_act": "gelu",
56
+ "hidden_dropout": 0.1,
57
+ "hidden_size": 768,
58
+ "id2label": {
59
+ "0": "human",
60
+ "1": "machine",
61
+ "2": "not_sure",
62
+ "3": "bot"
63
+ },
64
+ "initializer_range": 0.02,
65
+ "intermediate_size": 3072,
66
+ "label2id": {
67
+ "bot": "3",
68
+ "human": "0",
69
+ "machine": "1",
70
+ "not_sure": "2"
71
+ },
72
+ "layer_norm_eps": 1e-05,
73
+ "layerdrop": 0.0,
74
+ "mask_channel_length": 10,
75
+ "mask_channel_min_space": 1,
76
+ "mask_channel_other": 0.0,
77
+ "mask_channel_prob": 0.0,
78
+ "mask_channel_selection": "static",
79
+ "mask_feature_length": 10,
80
+ "mask_feature_min_masks": 0,
81
+ "mask_feature_prob": 0.0,
82
+ "mask_time_length": 10,
83
+ "mask_time_min_masks": 2,
84
+ "mask_time_min_space": 1,
85
+ "mask_time_other": 0.0,
86
+ "mask_time_prob": 0.05,
87
+ "mask_time_selection": "static",
88
+ "model_type": "wav2vec2",
89
+ "no_mask_channel_overlap": false,
90
+ "no_mask_time_overlap": false,
91
+ "num_adapter_layers": 3,
92
+ "num_attention_heads": 12,
93
+ "num_codevector_groups": 2,
94
+ "num_codevectors_per_group": 320,
95
+ "num_conv_pos_embedding_groups": 16,
96
+ "num_conv_pos_embeddings": 128,
97
+ "num_feat_extract_layers": 7,
98
+ "num_hidden_layers": 12,
99
+ "num_negatives": 100,
100
+ "output_hidden_size": 768,
101
+ "pad_token_id": 0,
102
+ "proj_codevector_dim": 256,
103
+ "tdnn_dilation": [
104
+ 1,
105
+ 2,
106
+ 3,
107
+ 1,
108
+ 1
109
+ ],
110
+ "tdnn_dim": [
111
+ 512,
112
+ 512,
113
+ 512,
114
+ 512,
115
+ 1500
116
+ ],
117
+ "tdnn_kernel": [
118
+ 5,
119
+ 3,
120
+ 3,
121
+ 1,
122
+ 1
123
+ ],
124
+ "torch_dtype": "float32",
125
+ "transformers_version": "4.28.0",
126
+ "use_weighted_layer_sum": false,
127
+ "vocab_size": 32,
128
+ "xvector_output_dim": 512
129
+ }
last-checkpoint/optimizer.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:37f1bdfd9e0aac203965c782dea354353b7d2d42e6e1d4b269832af24259f02b
3
+ size 756676997
last-checkpoint/preprocessor_config.json ADDED
@@ -0,0 +1,9 @@
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "do_normalize": true,
3
+ "feature_extractor_type": "Wav2Vec2FeatureExtractor",
4
+ "feature_size": 1,
5
+ "padding_side": "right",
6
+ "padding_value": 0.0,
7
+ "return_attention_mask": false,
8
+ "sampling_rate": 16000
9
+ }
last-checkpoint/pytorch_model.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ec49de05b6d0fc9760a0e4b8496ff8fbf4ceb9ee023b5d568ac0a6f84b39efd8
3
+ size 378349481
last-checkpoint/rng_state.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f59301807699134cc6087afb3fa6b30a719118ddf7c2b9a165a4e3f81e46e979
3
+ size 13681
last-checkpoint/scheduler.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f444185c3e228ee6138ca7334fba6706bbb1da32fc13357fe5c32dffd6ee429b
3
+ size 627
last-checkpoint/trainer_state.json ADDED
@@ -0,0 +1,199 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_metric": 0.9507272727272728,
3
+ "best_model_checkpoint": "wav2vec2-base-finetuned-amd/checkpoint-290",
4
+ "epoch": 1.0,
5
+ "global_step": 290,
6
+ "is_hyper_param_search": false,
7
+ "is_local_process_zero": true,
8
+ "is_world_process_zero": true,
9
+ "log_history": [
10
+ {
11
+ "epoch": 0.03,
12
+ "learning_rate": 4.913793103448276e-05,
13
+ "loss": 1.2481,
14
+ "step": 10
15
+ },
16
+ {
17
+ "epoch": 0.07,
18
+ "learning_rate": 4.827586206896552e-05,
19
+ "loss": 0.8865,
20
+ "step": 20
21
+ },
22
+ {
23
+ "epoch": 0.1,
24
+ "learning_rate": 4.741379310344828e-05,
25
+ "loss": 0.6388,
26
+ "step": 30
27
+ },
28
+ {
29
+ "epoch": 0.14,
30
+ "learning_rate": 4.655172413793104e-05,
31
+ "loss": 0.5496,
32
+ "step": 40
33
+ },
34
+ {
35
+ "epoch": 0.17,
36
+ "learning_rate": 4.5689655172413794e-05,
37
+ "loss": 0.4895,
38
+ "step": 50
39
+ },
40
+ {
41
+ "epoch": 0.21,
42
+ "learning_rate": 4.482758620689655e-05,
43
+ "loss": 0.3954,
44
+ "step": 60
45
+ },
46
+ {
47
+ "epoch": 0.24,
48
+ "learning_rate": 4.396551724137931e-05,
49
+ "loss": 0.4283,
50
+ "step": 70
51
+ },
52
+ {
53
+ "epoch": 0.28,
54
+ "learning_rate": 4.3103448275862066e-05,
55
+ "loss": 0.3545,
56
+ "step": 80
57
+ },
58
+ {
59
+ "epoch": 0.31,
60
+ "learning_rate": 4.224137931034483e-05,
61
+ "loss": 0.2903,
62
+ "step": 90
63
+ },
64
+ {
65
+ "epoch": 0.34,
66
+ "learning_rate": 4.1379310344827587e-05,
67
+ "loss": 0.371,
68
+ "step": 100
69
+ },
70
+ {
71
+ "epoch": 0.38,
72
+ "learning_rate": 4.0517241379310344e-05,
73
+ "loss": 0.3175,
74
+ "step": 110
75
+ },
76
+ {
77
+ "epoch": 0.41,
78
+ "learning_rate": 3.965517241379311e-05,
79
+ "loss": 0.351,
80
+ "step": 120
81
+ },
82
+ {
83
+ "epoch": 0.45,
84
+ "learning_rate": 3.8793103448275865e-05,
85
+ "loss": 0.2955,
86
+ "step": 130
87
+ },
88
+ {
89
+ "epoch": 0.48,
90
+ "learning_rate": 3.793103448275862e-05,
91
+ "loss": 0.294,
92
+ "step": 140
93
+ },
94
+ {
95
+ "epoch": 0.52,
96
+ "learning_rate": 3.7068965517241385e-05,
97
+ "loss": 0.2744,
98
+ "step": 150
99
+ },
100
+ {
101
+ "epoch": 0.55,
102
+ "learning_rate": 3.620689655172414e-05,
103
+ "loss": 0.2634,
104
+ "step": 160
105
+ },
106
+ {
107
+ "epoch": 0.59,
108
+ "learning_rate": 3.53448275862069e-05,
109
+ "loss": 0.2813,
110
+ "step": 170
111
+ },
112
+ {
113
+ "epoch": 0.62,
114
+ "learning_rate": 3.4482758620689657e-05,
115
+ "loss": 0.2948,
116
+ "step": 180
117
+ },
118
+ {
119
+ "epoch": 0.66,
120
+ "learning_rate": 3.3620689655172414e-05,
121
+ "loss": 0.28,
122
+ "step": 190
123
+ },
124
+ {
125
+ "epoch": 0.69,
126
+ "learning_rate": 3.275862068965517e-05,
127
+ "loss": 0.2003,
128
+ "step": 200
129
+ },
130
+ {
131
+ "epoch": 0.72,
132
+ "learning_rate": 3.1896551724137935e-05,
133
+ "loss": 0.2322,
134
+ "step": 210
135
+ },
136
+ {
137
+ "epoch": 0.76,
138
+ "learning_rate": 3.103448275862069e-05,
139
+ "loss": 0.3084,
140
+ "step": 220
141
+ },
142
+ {
143
+ "epoch": 0.79,
144
+ "learning_rate": 3.017241379310345e-05,
145
+ "loss": 0.3097,
146
+ "step": 230
147
+ },
148
+ {
149
+ "epoch": 0.83,
150
+ "learning_rate": 2.9310344827586206e-05,
151
+ "loss": 0.2311,
152
+ "step": 240
153
+ },
154
+ {
155
+ "epoch": 0.86,
156
+ "learning_rate": 2.844827586206897e-05,
157
+ "loss": 0.28,
158
+ "step": 250
159
+ },
160
+ {
161
+ "epoch": 0.9,
162
+ "learning_rate": 2.7586206896551727e-05,
163
+ "loss": 0.2528,
164
+ "step": 260
165
+ },
166
+ {
167
+ "epoch": 0.93,
168
+ "learning_rate": 2.672413793103448e-05,
169
+ "loss": 0.3334,
170
+ "step": 270
171
+ },
172
+ {
173
+ "epoch": 0.97,
174
+ "learning_rate": 2.5862068965517244e-05,
175
+ "loss": 0.2705,
176
+ "step": 280
177
+ },
178
+ {
179
+ "epoch": 1.0,
180
+ "learning_rate": 2.5e-05,
181
+ "loss": 0.2501,
182
+ "step": 290
183
+ },
184
+ {
185
+ "epoch": 1.0,
186
+ "eval_accuracy": 0.9507272727272728,
187
+ "eval_loss": 0.19648206233978271,
188
+ "eval_runtime": 2253.6221,
189
+ "eval_samples_per_second": 2.441,
190
+ "eval_steps_per_second": 0.076,
191
+ "step": 290
192
+ }
193
+ ],
194
+ "max_steps": 580,
195
+ "num_train_epochs": 2,
196
+ "total_flos": 5.04847347766272e+17,
197
+ "trial_name": null,
198
+ "trial_params": null
199
+ }
last-checkpoint/training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bb51e6346c045a349a2c9c36ae9e5384e658b64fbf1dc3fd694f45f501a4d344
3
+ size 3643
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8a298a391f6a64a85950144b7d764c9be875cdbf3e07197ec8e9cc8cde0fda74
3
- size 378348457
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ec49de05b6d0fc9760a0e4b8496ff8fbf4ceb9ee023b5d568ac0a6f84b39efd8
3
+ size 378349481
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c6ce9497385c488a22ae92cb2249699d4cb97b3e82921cf19befde92665fa9b5
3
  size 3643
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bb51e6346c045a349a2c9c36ae9e5384e658b64fbf1dc3fd694f45f501a4d344
3
  size 3643