huseinzol05 committed on
Commit
35de8b9
·
1 Parent(s): 01b191d

Upload model_config.yaml with huggingface_hub

Browse files
Files changed (1) hide show
  1. model_config.yaml +115 -0
model_config.yaml ADDED
@@ -0,0 +1,115 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ decoder:
2
+ _target_: nemo.collections.asr.modules.SpeakerDecoder
3
+ angular: false
4
+ emb_sizes: 256
5
+ feat_in: 1500
6
+ num_classes: 7
7
+ pool_mode: xvector
8
+ encoder:
9
+ _target_: nemo.collections.asr.modules.ConvASREncoder
10
+ activation: relu
11
+ conv_mask: true
12
+ feat_in: 64
13
+ jasper:
14
+ - dilation:
15
+ - 1
16
+ dropout: 0.5
17
+ filters: 512
18
+ kernel:
19
+ - 3
20
+ repeat: 1
21
+ residual: true
22
+ separable: true
23
+ stride:
24
+ - 1
25
+ - dilation:
26
+ - 1
27
+ dropout: 0.5
28
+ filters: 512
29
+ kernel:
30
+ - 7
31
+ repeat: 2
32
+ residual: true
33
+ separable: true
34
+ stride:
35
+ - 1
36
+ - dilation:
37
+ - 1
38
+ dropout: 0.5
39
+ filters: 512
40
+ kernel:
41
+ - 11
42
+ repeat: 2
43
+ residual: true
44
+ separable: true
45
+ stride:
46
+ - 1
47
+ - dilation:
48
+ - 1
49
+ dropout: 0.5
50
+ filters: 512
51
+ kernel:
52
+ - 15
53
+ repeat: 2
54
+ residual: true
55
+ separable: true
56
+ stride:
57
+ - 1
58
+ - dilation:
59
+ - 1
60
+ dropout: 0.0
61
+ filters: 1500
62
+ kernel:
63
+ - 1
64
+ repeat: 1
65
+ residual: false
66
+ separable: true
67
+ stride:
68
+ - 1
69
+ loss:
70
+ margin: 0.2
71
+ scale: 30
72
+ optim:
73
+ lr: 0.006
74
+ momentum: 0.9
75
+ name: sgd
76
+ sched:
77
+ min_lr: 0.0001
78
+ name: CosineAnnealing
79
+ warmup_ratio: 0.1
80
+ weight_decay: 0.001
81
+ preprocessor:
82
+ _target_: nemo.collections.asr.modules.AudioToMelSpectrogramPreprocessor
83
+ dither: 1.0e-05
84
+ features: 64
85
+ frame_splicing: 1
86
+ n_fft: 512
87
+ normalize: per_feature
88
+ sample_rate: 16000
89
+ stft_conv: false
90
+ window: hann
91
+ window_size: 0.02
92
+ window_stride: 0.01
93
+ target: nemo.collections.asr.models.label_models.EncDecSpeakerLabelModel
94
+ train_ds:
95
+ augmentor:
96
+ noise:
97
+ manifest_path: /ws/manifests/raid/musan/musan_music_noise_manifest_dur8.json
98
+ max_snr_db: 15
99
+ min_snr_db: 5
100
+ prob: 0.2
101
+ batch_size: 64
102
+ labels: null
103
+ manifest_filepath: /ws/manifests/raid/combined/train_manifest.json
104
+ num_workers: 4
105
+ sample_rate: 16000
106
+ shuffle: true
107
+ time_length: 8
108
+ validation_ds:
109
+ batch_size: 64
110
+ labels: null
111
+ manifest_filepath: /ws/manifests/raid/voxceleb/small_manifest.json
112
+ num_workers: 1
113
+ sample_rate: 16000
114
+ shuffle: false
115
+ time_length: 8