Chillarmo committed on
Commit
f4e97ac
·
verified ·
1 Parent(s): 457b309

End of training

Browse files
README.md CHANGED
@@ -1,8 +1,13 @@
1
  ---
2
  library_name: transformers
 
 
3
  license: cc-by-nc-4.0
4
  base_model: facebook/mms-1b-all
5
  tags:
 
 
 
6
  - generated_from_trainer
7
  metrics:
8
  - wer
@@ -16,10 +21,10 @@ should probably proofread and complete it, then remove this comment. -->
16
 
17
  # wav2vec2-common_voice_20-hy-mms-finetune
18
 
19
- This model is a fine-tuned version of [facebook/mms-1b-all](https://huggingface.co/facebook/mms-1b-all) on an unknown dataset.
20
  It achieves the following results on the evaluation set:
21
- - Loss: 0.1587
22
- - Wer: 0.2464
23
 
24
  ## Model description
25
 
 
1
  ---
2
  library_name: transformers
3
+ language:
4
+ - hy
5
  license: cc-by-nc-4.0
6
  base_model: facebook/mms-1b-all
7
  tags:
8
+ - automatic-speech-recognition
9
+ - Chillarmo/common_voice_20_armenian
10
+ - mms
11
  - generated_from_trainer
12
  metrics:
13
  - wer
 
21
 
22
  # wav2vec2-common_voice_20-hy-mms-finetune
23
 
24
+ This model is a fine-tuned version of [facebook/mms-1b-all](https://huggingface.co/facebook/mms-1b-all) on the Chillarmo/common_voice_20_armenian dataset.
25
  It achieves the following results on the evaluation set:
26
+ - Loss: 0.1588
27
+ - Wer: 0.2465
28
 
29
  ## Model description
30
 
adapter.hyw.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:572f72044013d84b638eaeb3c356812c0f78e0a9b4d8f7d15a16d700e08aac1e
3
+ size 8947144
all_results.json ADDED
@@ -0,0 +1,15 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 4.0,
3
+ "eval_loss": 0.1587585210800171,
4
+ "eval_runtime": 309.9566,
5
+ "eval_samples": 5856,
6
+ "eval_samples_per_second": 18.893,
7
+ "eval_steps_per_second": 2.362,
8
+ "eval_wer": 0.24645249427110877,
9
+ "total_flos": 2.9809868531482165e+19,
10
+ "train_loss": 0.4726643766093458,
11
+ "train_runtime": 14997.7554,
12
+ "train_samples": 14976,
13
+ "train_samples_per_second": 3.994,
14
+ "train_steps_per_second": 0.125
15
+ }
eval_results.json ADDED
@@ -0,0 +1,9 @@
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 4.0,
3
+ "eval_loss": 0.1587585210800171,
4
+ "eval_runtime": 309.9566,
5
+ "eval_samples": 5856,
6
+ "eval_samples_per_second": 18.893,
7
+ "eval_steps_per_second": 2.362,
8
+ "eval_wer": 0.24645249427110877
9
+ }
train_results.json ADDED
@@ -0,0 +1,9 @@
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 4.0,
3
+ "total_flos": 2.9809868531482165e+19,
4
+ "train_loss": 0.4726643766093458,
5
+ "train_runtime": 14997.7554,
6
+ "train_samples": 14976,
7
+ "train_samples_per_second": 3.994,
8
+ "train_steps_per_second": 0.125
9
+ }
trainer_state.json ADDED
@@ -0,0 +1,226 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_global_step": null,
3
+ "best_metric": null,
4
+ "best_model_checkpoint": null,
5
+ "epoch": 4.0,
6
+ "eval_steps": 100,
7
+ "global_step": 1872,
8
+ "is_hyper_param_search": false,
9
+ "is_local_process_zero": true,
10
+ "is_world_process_zero": true,
11
+ "log_history": [
12
+ {
13
+ "epoch": 0.21367521367521367,
14
+ "eval_loss": 0.2269495576620102,
15
+ "eval_runtime": 301.5344,
16
+ "eval_samples_per_second": 19.421,
17
+ "eval_steps_per_second": 2.428,
18
+ "eval_wer": 0.3076194253481403,
19
+ "step": 100
20
+ },
21
+ {
22
+ "epoch": 0.42735042735042733,
23
+ "eval_loss": 0.19151096045970917,
24
+ "eval_runtime": 302.1327,
25
+ "eval_samples_per_second": 19.382,
26
+ "eval_steps_per_second": 2.423,
27
+ "eval_wer": 0.2824343380927199,
28
+ "step": 200
29
+ },
30
+ {
31
+ "epoch": 0.6410256410256411,
32
+ "eval_loss": 0.1993144452571869,
33
+ "eval_runtime": 302.3659,
34
+ "eval_samples_per_second": 19.367,
35
+ "eval_steps_per_second": 2.421,
36
+ "eval_wer": 0.296448087431694,
37
+ "step": 300
38
+ },
39
+ {
40
+ "epoch": 0.8547008547008547,
41
+ "eval_loss": 0.18319852650165558,
42
+ "eval_runtime": 303.1213,
43
+ "eval_samples_per_second": 19.319,
44
+ "eval_steps_per_second": 2.415,
45
+ "eval_wer": 0.2734884540807333,
46
+ "step": 400
47
+ },
48
+ {
49
+ "epoch": 1.0683760683760684,
50
+ "grad_norm": 0.8244175314903259,
51
+ "learning_rate": 0.0007748306997742663,
52
+ "loss": 0.9965,
53
+ "step": 500
54
+ },
55
+ {
56
+ "epoch": 1.0683760683760684,
57
+ "eval_loss": 0.1763978898525238,
58
+ "eval_runtime": 304.6466,
59
+ "eval_samples_per_second": 19.222,
60
+ "eval_steps_per_second": 2.403,
61
+ "eval_wer": 0.26493918561607616,
62
+ "step": 500
63
+ },
64
+ {
65
+ "epoch": 1.282051282051282,
66
+ "eval_loss": 0.17325642704963684,
67
+ "eval_runtime": 304.5973,
68
+ "eval_samples_per_second": 19.225,
69
+ "eval_steps_per_second": 2.403,
70
+ "eval_wer": 0.2625154239379517,
71
+ "step": 600
72
+ },
73
+ {
74
+ "epoch": 1.4957264957264957,
75
+ "eval_loss": 0.17252753674983978,
76
+ "eval_runtime": 305.7799,
77
+ "eval_samples_per_second": 19.151,
78
+ "eval_steps_per_second": 2.394,
79
+ "eval_wer": 0.25918826017979907,
80
+ "step": 700
81
+ },
82
+ {
83
+ "epoch": 1.7094017094017095,
84
+ "eval_loss": 0.17061175405979156,
85
+ "eval_runtime": 306.9826,
86
+ "eval_samples_per_second": 19.076,
87
+ "eval_steps_per_second": 2.385,
88
+ "eval_wer": 0.25806451612903225,
89
+ "step": 800
90
+ },
91
+ {
92
+ "epoch": 1.9230769230769231,
93
+ "eval_loss": 0.16809020936489105,
94
+ "eval_runtime": 306.5557,
95
+ "eval_samples_per_second": 19.103,
96
+ "eval_steps_per_second": 2.388,
97
+ "eval_wer": 0.25854926846465714,
98
+ "step": 900
99
+ },
100
+ {
101
+ "epoch": 2.1367521367521367,
102
+ "grad_norm": 0.886053204536438,
103
+ "learning_rate": 0.0004926636568848759,
104
+ "loss": 0.2922,
105
+ "step": 1000
106
+ },
107
+ {
108
+ "epoch": 2.1367521367521367,
109
+ "eval_loss": 0.16939426958560944,
110
+ "eval_runtime": 308.102,
111
+ "eval_samples_per_second": 19.007,
112
+ "eval_steps_per_second": 2.376,
113
+ "eval_wer": 0.2590560549973559,
114
+ "step": 1000
115
+ },
116
+ {
117
+ "epoch": 2.3504273504273505,
118
+ "eval_loss": 0.17009997367858887,
119
+ "eval_runtime": 307.4896,
120
+ "eval_samples_per_second": 19.045,
121
+ "eval_steps_per_second": 2.381,
122
+ "eval_wer": 0.25753569539925963,
123
+ "step": 1100
124
+ },
125
+ {
126
+ "epoch": 2.564102564102564,
127
+ "eval_loss": 0.17012837529182434,
128
+ "eval_runtime": 308.404,
129
+ "eval_samples_per_second": 18.988,
130
+ "eval_steps_per_second": 2.374,
131
+ "eval_wer": 0.2613916798871849,
132
+ "step": 1200
133
+ },
134
+ {
135
+ "epoch": 2.7777777777777777,
136
+ "eval_loss": 0.16536183655261993,
137
+ "eval_runtime": 307.6932,
138
+ "eval_samples_per_second": 19.032,
139
+ "eval_steps_per_second": 2.379,
140
+ "eval_wer": 0.25354750572889123,
141
+ "step": 1300
142
+ },
143
+ {
144
+ "epoch": 2.9914529914529915,
145
+ "eval_loss": 0.16437660157680511,
146
+ "eval_runtime": 307.9587,
147
+ "eval_samples_per_second": 19.016,
148
+ "eval_steps_per_second": 2.377,
149
+ "eval_wer": 0.2516525647805394,
150
+ "step": 1400
151
+ },
152
+ {
153
+ "epoch": 3.2051282051282053,
154
+ "grad_norm": 0.9470628499984741,
155
+ "learning_rate": 0.00021049661399548533,
156
+ "loss": 0.2788,
157
+ "step": 1500
158
+ },
159
+ {
160
+ "epoch": 3.2051282051282053,
161
+ "eval_loss": 0.1636321097612381,
162
+ "eval_runtime": 308.3318,
163
+ "eval_samples_per_second": 18.993,
164
+ "eval_steps_per_second": 2.374,
165
+ "eval_wer": 0.2539881896703684,
166
+ "step": 1500
167
+ },
168
+ {
169
+ "epoch": 3.4188034188034186,
170
+ "eval_loss": 0.16157202422618866,
171
+ "eval_runtime": 307.8619,
172
+ "eval_samples_per_second": 19.022,
173
+ "eval_steps_per_second": 2.378,
174
+ "eval_wer": 0.2511678124449145,
175
+ "step": 1600
176
+ },
177
+ {
178
+ "epoch": 3.6324786324786325,
179
+ "eval_loss": 0.1600475162267685,
180
+ "eval_runtime": 308.3358,
181
+ "eval_samples_per_second": 18.992,
182
+ "eval_steps_per_second": 2.374,
183
+ "eval_wer": 0.24702538339502908,
184
+ "step": 1700
185
+ },
186
+ {
187
+ "epoch": 3.8461538461538463,
188
+ "eval_loss": 0.15865576267242432,
189
+ "eval_runtime": 309.7473,
190
+ "eval_samples_per_second": 18.906,
191
+ "eval_steps_per_second": 2.363,
192
+ "eval_wer": 0.2464304600740349,
193
+ "step": 1800
194
+ },
195
+ {
196
+ "epoch": 4.0,
197
+ "step": 1872,
198
+ "total_flos": 2.9809868531482165e+19,
199
+ "train_loss": 0.4726643766093458,
200
+ "train_runtime": 14997.7554,
201
+ "train_samples_per_second": 3.994,
202
+ "train_steps_per_second": 0.125
203
+ }
204
+ ],
205
+ "logging_steps": 500,
206
+ "max_steps": 1872,
207
+ "num_input_tokens_seen": 0,
208
+ "num_train_epochs": 4,
209
+ "save_steps": 200,
210
+ "stateful_callbacks": {
211
+ "TrainerControl": {
212
+ "args": {
213
+ "should_epoch_stop": false,
214
+ "should_evaluate": false,
215
+ "should_log": false,
216
+ "should_save": true,
217
+ "should_training_stop": true
218
+ },
219
+ "attributes": {}
220
+ }
221
+ },
222
+ "total_flos": 2.9809868531482165e+19,
223
+ "train_batch_size": 32,
224
+ "trial_name": null,
225
+ "trial_params": null
226
+ }