saurabhk0322 committed on
Commit
aed40d2
·
verified ·
1 Parent(s): e166ba4

Delete exp/asru25/exp_large

Browse files
Files changed (20) hide show
  1. exp/asru25/exp_large/asr_multilingual_lid_con_e8_lin1024_bs6M_gacc1_ctc03/RESULTS.md +0 -27
  2. exp/asru25/exp_large/asr_multilingual_lid_con_e8_lin1024_bs6M_gacc1_ctc03/config.yaml +0 -511
  3. exp/asru25/exp_large/asr_multilingual_lid_con_e8_lin1024_bs6M_gacc1_ctc03/images/acc.png +0 -0
  4. exp/asru25/exp_large/asr_multilingual_lid_con_e8_lin1024_bs6M_gacc1_ctc03/images/backward_time.png +0 -0
  5. exp/asru25/exp_large/asr_multilingual_lid_con_e8_lin1024_bs6M_gacc1_ctc03/images/cer.png +0 -0
  6. exp/asru25/exp_large/asr_multilingual_lid_con_e8_lin1024_bs6M_gacc1_ctc03/images/cer_ctc.png +0 -0
  7. exp/asru25/exp_large/asr_multilingual_lid_con_e8_lin1024_bs6M_gacc1_ctc03/images/clip.png +0 -0
  8. exp/asru25/exp_large/asr_multilingual_lid_con_e8_lin1024_bs6M_gacc1_ctc03/images/forward_time.png +0 -0
  9. exp/asru25/exp_large/asr_multilingual_lid_con_e8_lin1024_bs6M_gacc1_ctc03/images/gpu_max_cached_mem_GB.png +0 -0
  10. exp/asru25/exp_large/asr_multilingual_lid_con_e8_lin1024_bs6M_gacc1_ctc03/images/grad_norm.png +0 -0
  11. exp/asru25/exp_large/asr_multilingual_lid_con_e8_lin1024_bs6M_gacc1_ctc03/images/iter_time.png +0 -0
  12. exp/asru25/exp_large/asr_multilingual_lid_con_e8_lin1024_bs6M_gacc1_ctc03/images/loss.png +0 -0
  13. exp/asru25/exp_large/asr_multilingual_lid_con_e8_lin1024_bs6M_gacc1_ctc03/images/loss_att.png +0 -0
  14. exp/asru25/exp_large/asr_multilingual_lid_con_e8_lin1024_bs6M_gacc1_ctc03/images/loss_ctc.png +0 -0
  15. exp/asru25/exp_large/asr_multilingual_lid_con_e8_lin1024_bs6M_gacc1_ctc03/images/loss_scale.png +0 -0
  16. exp/asru25/exp_large/asr_multilingual_lid_con_e8_lin1024_bs6M_gacc1_ctc03/images/optim0_lr0.png +0 -0
  17. exp/asru25/exp_large/asr_multilingual_lid_con_e8_lin1024_bs6M_gacc1_ctc03/images/optim_step_time.png +0 -0
  18. exp/asru25/exp_large/asr_multilingual_lid_con_e8_lin1024_bs6M_gacc1_ctc03/images/train_time.png +0 -0
  19. exp/asru25/exp_large/asr_multilingual_lid_con_e8_lin1024_bs6M_gacc1_ctc03/images/wer.png +0 -0
  20. exp/asru25/exp_large/asr_multilingual_lid_con_e8_lin1024_bs6M_gacc1_ctc03/valid.acc.ave_5best.pth +0 -3
exp/asru25/exp_large/asr_multilingual_lid_con_e8_lin1024_bs6M_gacc1_ctc03/RESULTS.md DELETED
@@ -1,27 +0,0 @@
1
- <!-- Generated by scripts/utils/show_asr_result.sh -->
2
- # RESULTS
3
- ## Environments
4
- - date: `Wed Apr 23 00:04:53 IST 2025`
5
- - python version: `3.10.12 (main, Feb 4 2025, 14:57:36) [GCC 11.4.0]`
6
- - espnet version: `espnet 202503`
7
- - pytorch version: `pytorch 2.3.0+cu121`
8
- - Git hash: `0cc9d62673c1461efe37632aeab297a311bcd7f0`
9
- - Commit date: `Sat Apr 12 17:53:44 2025 -0400`
10
-
11
- ## exp/asru25/exp_large/asr_multilingual_lid_con_e8_lin1024_bs6M_gacc1_ctc03/decode_lid_asr_model_valid.acc.ave
12
- ### WER
13
-
14
- |dataset|Snt|Wrd|Corr|Sub|Del|Ins|Err|S.Err|
15
- |---|---|---|---|---|---|---|---|---|
16
- |org/dev_lid|11507|111296|85.3|13.6|1.1|1.0|15.7|67.6|
17
-
18
- ### CER
19
-
20
- |dataset|Snt|Wrd|Corr|Sub|Del|Ins|Err|S.Err|
21
- |---|---|---|---|---|---|---|---|---|
22
- |org/dev_lid|11507|615241|97.3|1.6|1.0|0.9|3.5|67.6|
23
-
24
- ### TER
25
-
26
- |dataset|Snt|Wrd|Corr|Sub|Del|Ins|Err|S.Err|
27
- |---|---|---|---|---|---|---|---|---|
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
exp/asru25/exp_large/asr_multilingual_lid_con_e8_lin1024_bs6M_gacc1_ctc03/config.yaml DELETED
@@ -1,511 +0,0 @@
1
- config: conf/tuning/train_asr_conformer_transformer_e8_linear1024_bs6M_gacc1.yaml
2
- print_config: false
3
- log_level: INFO
4
- drop_last_iter: false
5
- dry_run: false
6
- iterator_type: sequence
7
- valid_iterator_type: null
8
- output_dir: asru25/exp_large/asr_multilingual_lid_con_e8_lin1024_bs6M_gacc1_ctc03
9
- ngpu: 1
10
- seed: 2022
11
- num_workers: 8
12
- num_att_plot: 3
13
- dist_backend: nccl
14
- dist_init_method: env://
15
- dist_world_size: null
16
- dist_rank: null
17
- local_rank: 0
18
- dist_master_addr: null
19
- dist_master_port: null
20
- dist_launcher: null
21
- multiprocessing_distributed: false
22
- unused_parameters: false
23
- sharded_ddp: false
24
- use_deepspeed: false
25
- deepspeed_config: null
26
- gradient_as_bucket_view: true
27
- ddp_comm_hook: null
28
- cudnn_enabled: true
29
- cudnn_benchmark: false
30
- cudnn_deterministic: true
31
- use_tf32: false
32
- collect_stats: false
33
- write_collected_feats: false
34
- max_epoch: 70
35
- patience: 5
36
- val_scheduler_criterion:
37
- - valid
38
- - loss
39
- early_stopping_criterion:
40
- - valid
41
- - loss
42
- - min
43
- best_model_criterion:
44
- - - valid
45
- - acc
46
- - max
47
- keep_nbest_models: 5
48
- nbest_averaging_interval: 0
49
- grad_clip: 5.0
50
- grad_clip_type: 2.0
51
- grad_noise: false
52
- accum_grad: 1
53
- no_forward_run: false
54
- resume: true
55
- train_dtype: float32
56
- use_amp: true
57
- log_interval: null
58
- use_matplotlib: true
59
- use_tensorboard: true
60
- create_graph_in_tensorboard: false
61
- use_wandb: false
62
- wandb_project: null
63
- wandb_id: null
64
- wandb_entity: null
65
- wandb_name: null
66
- wandb_model_log_interval: -1
67
- detect_anomaly: false
68
- use_adapter: false
69
- adapter: lora
70
- save_strategy: all
71
- adapter_conf: {}
72
- pretrain_path: null
73
- init_param: []
74
- ignore_init_mismatch: false
75
- freeze_param: []
76
- num_iters_per_epoch: null
77
- batch_size: 20
78
- valid_batch_size: null
79
- batch_bins: 6000000
80
- valid_batch_bins: null
81
- category_sample_size: 10
82
- train_shape_file:
83
- - exp/asru25/exp_large/asr_stats_raw_multilingual_char_sp/train/speech_shape
84
- - exp/asru25/exp_large/asr_stats_raw_multilingual_char_sp/train/text_shape.char
85
- valid_shape_file:
86
- - exp/asru25/exp_large/asr_stats_raw_multilingual_char_sp/valid/speech_shape
87
- - exp/asru25/exp_large/asr_stats_raw_multilingual_char_sp/valid/text_shape.char
88
- batch_type: numel
89
- valid_batch_type: null
90
- fold_length:
91
- - 80000
92
- - 150
93
- sort_in_batch: descending
94
- shuffle_within_batch: false
95
- sort_batch: descending
96
- multiple_iterator: false
97
- chunk_length: 500
98
- chunk_shift_ratio: 0.5
99
- num_cache_chunks: 1024
100
- chunk_excluded_key_prefixes: []
101
- chunk_default_fs: null
102
- chunk_max_abs_length: null
103
- chunk_discard_short_samples: true
104
- train_data_path_and_name_and_type:
105
- - - dump/asru25/large/raw/train_large_lid_sp/wav.scp
106
- - speech
107
- - sound
108
- - - dump/asru25/large/raw/train_large_lid_sp/text
109
- - text
110
- - text
111
- valid_data_path_and_name_and_type:
112
- - - dump/asru25/large/raw/dev_lid/wav.scp
113
- - speech
114
- - sound
115
- - - dump/asru25/large/raw/dev_lid/text
116
- - text
117
- - text
118
- multi_task_dataset: false
119
- allow_variable_data_keys: false
120
- max_cache_size: 0.0
121
- max_cache_fd: 32
122
- allow_multi_rates: false
123
- valid_max_cache_size: null
124
- exclude_weight_decay: false
125
- exclude_weight_decay_conf: {}
126
- optim: adam
127
- optim_conf:
128
- lr: 0.002
129
- weight_decay: 1.0e-06
130
- scheduler: warmuplr
131
- scheduler_conf:
132
- warmup_steps: 15000
133
- token_list:
134
- - <blank>
135
- - <unk>
136
- - <space>
137
- - ा
138
- - क
139
- - े
140
- - र
141
- - ल
142
- - न
143
- - स
144
- - ्
145
- - त
146
- - '['
147
- - ']'
148
- - म
149
- - ी
150
- - ि
151
- - ್
152
- - ह
153
- - य
154
- - ब
155
- - प
156
- - ो
157
- - ్
158
- - া
159
- - व
160
- - ज
161
- - ं
162
- - ు
163
- - ా
164
- - ి
165
- - ಿ
166
- - ে
167
- - ಾ
168
- - द
169
- - র
170
- - న
171
- - ల
172
- - ग
173
- - ರ
174
- - m
175
- - ం
176
- - క
177
- - ক
178
- - ర
179
- - ು
180
- - ನ
181
- - ্
182
- - ಕ
183
- - ु
184
- - च
185
- - ट
186
- - ತ
187
- - ै
188
- - ದ
189
- - ি
190
- - ख
191
- - ೆ
192
- - ಗ
193
- - t
194
- - ప
195
- - త
196
- - b
197
- - h
198
- - इ
199
- - अ
200
- - n
201
- - आ
202
- - ू
203
- - ন
204
- - ಸ
205
- - ಲ
206
- - వ
207
- - ట
208
- - స
209
- - ವ
210
- - ే
211
- - छ
212
- - ব
213
- - ল
214
- - ಯ
215
- - भ
216
- - श
217
- - ಂ
218
- - ಮ
219
- - య
220
- - য
221
- - ध
222
- - డ
223
- - ద
224
- - ए
225
- - थ
226
- - మ
227
- - ಬ
228
- - చ
229
- - ण
230
- - ड
231
- - ম
232
- - ई
233
- - उ
234
- - স
235
- - ত
236
- - ಳ
237
- - ో
238
- - ಡ
239
- - फ
240
- - g
241
- - r
242
- - e
243
- - గ
244
- - প
245
- - ট
246
- - য়
247
- - c
248
- - k
249
- - ಟ
250
- - ె
251
- - .
252
- - ಹ
253
- - ಪ
254
- - ೇ
255
- - బ
256
- - হ
257
- - ু
258
- - দ
259
- - ष
260
- - ো
261
- - ీ
262
- - জ
263
- - ड़
264
- - ಅ
265
- - ೊ
266
- - ই
267
- - গ
268
- - అ
269
- - घ
270
- - ಣ
271
- - ठ
272
- - ೋ
273
- - চ
274
- - ँ
275
- - ొ
276
- - ौ
277
- - ছ
278
- - ఎ
279
- - ओ
280
- - শ
281
- - আ
282
- - ూ
283
- - జ
284
- - ಜ
285
- - থ
286
- - ভ
287
- - ಇ
288
- - ೂ
289
- - ಷ
290
- - ಚ
291
- - এ
292
- - ষ
293
- - ై
294
- - ೀ
295
- - ఉ
296
- - ಎ
297
- - ಆ
298
- - ळ
299
- - ধ
300
- - ृ
301
- - ী
302
- - উ
303
- - ফ
304
- - খ
305
- - ড
306
- - ॉ
307
- - ಶ
308
- - অ
309
- - ೈ
310
- - ధ
311
- - ং
312
- - झ
313
- - ఇ
314
- - ఆ
315
- - ష
316
- - ढ
317
- - ढ़
318
- - భ
319
- - శ
320
- - ఏ
321
- - ಧ
322
- - ও
323
- - ಒ
324
- - ಭ
325
- - ళ
326
- - ಉ
327
- - ॅ
328
- - ಫ
329
- - ऊ
330
- - ఫ
331
- - ಥ
332
- - ऑ
333
- - ణ
334
- - ড়
335
- - ণ
336
- - ঙ
337
- - ऋ
338
- - ಖ
339
- - ऽ
340
- - హ
341
- - థ
342
- - औ
343
- - ೃ
344
- - ঁ
345
- - ೌ
346
- - ఒ
347
- - ఖ
348
- - ৃ
349
- - ఈ
350
- - ಏ
351
- - ঠ
352
- - ౌ
353
- - ಐ
354
- - ৈ
355
- - ऐ
356
- - ऱ
357
- - ఐ
358
- - ূ
359
- - ञ
360
- - ৎ
361
- - ృ
362
- - ज़
363
- - ঞ
364
- - ಈ
365
- - ঘ
366
- - ঋ
367
- - ঝ
368
- - फ़
369
- - ৌ
370
- - ಠ
371
- - ः
372
- - ఓ
373
- - ಘ
374
- - ಛ
375
- - ಓ
376
- - ఊ
377
- - ఋ
378
- - ಔ
379
- - ఛ
380
- - ಞ
381
- - ॲ
382
- - ಊ
383
- - ఘ
384
- - ঢ
385
- - ख़
386
- - ়
387
- - ऍ
388
- - ಋ
389
- - क़
390
- - ఠ
391
- - ঢ়
392
- - ঃ
393
- - ़
394
- - ೕ
395
- - ఔ
396
- - ಢ
397
- - ঊ
398
- - ఱ
399
- - ಃ
400
- - ಝ
401
- - ङ
402
- - ఢ
403
- - ग़
404
- - ఞ
405
- - ঐ
406
- - ঔ
407
- - ॠ
408
- - ':'
409
- - ೯
410
- - ೖ
411
- - ঈ
412
- - ః
413
- - ౖ
414
- - ৠ
415
- - ౦
416
- - <sos/eos>
417
- init: null
418
- input_size: null
419
- ctc_conf:
420
- dropout_rate: 0.0
421
- ctc_type: builtin
422
- reduce: true
423
- ignore_nan_grad: null
424
- zero_infinity: true
425
- brctc_risk_strategy: exp
426
- brctc_group_strategy: end
427
- brctc_risk_factor: 0.0
428
- joint_net_conf: null
429
- use_preprocessor: true
430
- use_lang_prompt: false
431
- use_nlp_prompt: false
432
- token_type: char
433
- bpemodel: null
434
- non_linguistic_symbols: data_respin/data_asru25/nlsyms.txt
435
- cleaner: null
436
- g2p: null
437
- speech_volume_normalize: null
438
- rir_scp: null
439
- rir_apply_prob: 1.0
440
- noise_scp: null
441
- noise_apply_prob: 1.0
442
- noise_db_range: '13_15'
443
- short_noise_thres: 0.5
444
- aux_ctc_tasks: []
445
- frontend: default
446
- frontend_conf:
447
- n_fft: 512
448
- win_length: 400
449
- hop_length: 160
450
- fs: 16k
451
- specaug: specaug
452
- specaug_conf:
453
- apply_time_warp: true
454
- time_warp_window: 5
455
- time_warp_mode: bicubic
456
- apply_freq_mask: true
457
- freq_mask_width_range:
458
- - 0
459
- - 27
460
- num_freq_mask: 2
461
- apply_time_mask: true
462
- time_mask_width_ratio_range:
463
- - 0.0
464
- - 0.05
465
- num_time_mask: 5
466
- normalize: utterance_mvn
467
- normalize_conf: {}
468
- model: espnet
469
- model_conf:
470
- ctc_weight: 0.3
471
- lsm_weight: 0.1
472
- length_normalized_loss: false
473
- preencoder: null
474
- preencoder_conf: {}
475
- encoder: conformer
476
- encoder_conf:
477
- output_size: 256
478
- attention_heads: 4
479
- linear_units: 1024
480
- num_blocks: 8
481
- dropout_rate: 0.1
482
- positional_dropout_rate: 0.1
483
- attention_dropout_rate: 0.1
484
- input_layer: conv2d2
485
- normalize_before: true
486
- macaron_style: true
487
- rel_pos_type: latest
488
- pos_enc_layer_type: rel_pos
489
- selfattention_layer_type: rel_selfattn
490
- activation_type: swish
491
- use_cnn_module: true
492
- cnn_module_kernel: 31
493
- postencoder: null
494
- postencoder_conf: {}
495
- decoder: transformer
496
- decoder_conf:
497
- attention_heads: 4
498
- linear_units: 2048
499
- num_blocks: 6
500
- dropout_rate: 0.1
501
- positional_dropout_rate: 0.1
502
- self_attention_dropout_rate: 0.1
503
- src_attention_dropout_rate: 0.1
504
- layer_drop_rate: 0.0
505
- preprocessor: default
506
- preprocessor_conf: {}
507
- required:
508
- - output_dir
509
- - token_list
510
- version: '202503'
511
- distributed: false
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
exp/asru25/exp_large/asr_multilingual_lid_con_e8_lin1024_bs6M_gacc1_ctc03/images/acc.png DELETED
Binary file (30.8 kB)
 
exp/asru25/exp_large/asr_multilingual_lid_con_e8_lin1024_bs6M_gacc1_ctc03/images/backward_time.png DELETED
Binary file (34.5 kB)
 
exp/asru25/exp_large/asr_multilingual_lid_con_e8_lin1024_bs6M_gacc1_ctc03/images/cer.png DELETED
Binary file (26.9 kB)
 
exp/asru25/exp_large/asr_multilingual_lid_con_e8_lin1024_bs6M_gacc1_ctc03/images/cer_ctc.png DELETED
Binary file (36.5 kB)
 
exp/asru25/exp_large/asr_multilingual_lid_con_e8_lin1024_bs6M_gacc1_ctc03/images/clip.png DELETED
Binary file (14.7 kB)
 
exp/asru25/exp_large/asr_multilingual_lid_con_e8_lin1024_bs6M_gacc1_ctc03/images/forward_time.png DELETED
Binary file (32.9 kB)
 
exp/asru25/exp_large/asr_multilingual_lid_con_e8_lin1024_bs6M_gacc1_ctc03/images/gpu_max_cached_mem_GB.png DELETED
Binary file (34.6 kB)
 
exp/asru25/exp_large/asr_multilingual_lid_con_e8_lin1024_bs6M_gacc1_ctc03/images/grad_norm.png DELETED
Binary file (25.8 kB)
 
exp/asru25/exp_large/asr_multilingual_lid_con_e8_lin1024_bs6M_gacc1_ctc03/images/iter_time.png DELETED
Binary file (36.5 kB)
 
exp/asru25/exp_large/asr_multilingual_lid_con_e8_lin1024_bs6M_gacc1_ctc03/images/loss.png DELETED
Binary file (26.1 kB)
 
exp/asru25/exp_large/asr_multilingual_lid_con_e8_lin1024_bs6M_gacc1_ctc03/images/loss_att.png DELETED
Binary file (28.7 kB)
 
exp/asru25/exp_large/asr_multilingual_lid_con_e8_lin1024_bs6M_gacc1_ctc03/images/loss_ctc.png DELETED
Binary file (29.4 kB)
 
exp/asru25/exp_large/asr_multilingual_lid_con_e8_lin1024_bs6M_gacc1_ctc03/images/loss_scale.png DELETED
Binary file (27.4 kB)
 
exp/asru25/exp_large/asr_multilingual_lid_con_e8_lin1024_bs6M_gacc1_ctc03/images/optim0_lr0.png DELETED
Binary file (29.5 kB)
 
exp/asru25/exp_large/asr_multilingual_lid_con_e8_lin1024_bs6M_gacc1_ctc03/images/optim_step_time.png DELETED
Binary file (26.6 kB)
 
exp/asru25/exp_large/asr_multilingual_lid_con_e8_lin1024_bs6M_gacc1_ctc03/images/train_time.png DELETED
Binary file (30.3 kB)
 
exp/asru25/exp_large/asr_multilingual_lid_con_e8_lin1024_bs6M_gacc1_ctc03/images/wer.png DELETED
Binary file (29 kB)
 
exp/asru25/exp_large/asr_multilingual_lid_con_e8_lin1024_bs6M_gacc1_ctc03/valid.acc.ave_5best.pth DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:e95fdc2cca38ece938653d8033d2da3729981d780fd931ad56080593d63c5838
3
- size 101971162