poyu39 committed on
Commit
4219f23
·
verified ·
1 Parent(s): 0e21fe4

Upload ./wav2vec2_conformer_base_librispeech.yaml with huggingface_hub

Browse files
wav2vec2_conformer_base_librispeech.yaml ADDED
@@ -0,0 +1,66 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # @package _group_
2
+
3
+ common:
4
+ fp16: true
5
+ log_format: json
6
+ log_interval: 200
7
+
8
+ checkpoint:
9
+ save_interval_updates: 25000
10
+ keep_interval_updates: 1
11
+ no_epoch_checkpoints: true
12
+
13
+ task:
14
+ _name: audio_pretraining
15
+ data: ???
16
+ max_sample_size: 250000
17
+ min_sample_size: 32000
18
+ normalize: false
19
+
20
+ dataset:
21
+ num_workers: 12
22
+ max_tokens: 400000
23
+ skip_invalid_size_inputs_valid_test: true
24
+
25
+ distributed_training:
26
+ distributed_world_size: 1
27
+ ddp_backend: legacy_ddp
28
+
29
+ criterion:
30
+ _name: wav2vec
31
+ infonce: true
32
+ log_keys: ["prob_perplexity","code_perplexity","temp"]
33
+ loss_weights: [0.1, 10]
34
+
35
+ optimization:
36
+ max_update: 400000
37
+ lr: [0.0005]
38
+ update_freq: [3]
39
+
40
+ optimizer:
41
+ _name: adam
42
+ adam_betas: (0.9,0.98)
43
+ adam_eps: 1e-06
44
+ weight_decay: 0.01
45
+
46
+ lr_scheduler:
47
+ _name: polynomial_decay
48
+ warmup_updates: 32000
49
+
50
+ model:
51
+ _name: wav2vec2
52
+ quantize_targets: true
53
+ final_dim: 256
54
+ encoder_layerdrop: 0.05
55
+ dropout_input: 0.1
56
+ dropout_features: 0.1
57
+ feature_grad_mult: 0.1
58
+
59
+ encoder_layers: 12
60
+ encoder_embed_dim: 768
61
+ encoder_ffn_embed_dim: 3072
62
+ encoder_attention_heads: 12
63
+
64
+ layer_type: conformer
65
+ attn_type: espnet
66
+ pos_enc_type: rel_pos