# ############################################################################
# Model: Whisper-large-v3 Encoder + Attention pooling for Arabic Dialect
#        Identification
#
# Author: Haroun Elleuch
# ############################################################################
#
# NOTE(review): this file was restored to block style and the `<key>` targets
# of the `!ref` tags were re-inserted based on the keys declared below.
# Confirm each reference against the published checkpoint before release.

# Repository / folder prefix under which the checkpoint files listed in
# `pretrainer.paths` are looked up.
pretrained_path: Elyadata/ADI-whisper-ADI20

# Identifier of the base Whisper model handed to the Whisper wrapper.
whisper_hub: openai/whisper-large-v3

# Number of output classes of the final linear layer.
n_languages: 20

# Feature dimension consumed by the pooling layer and the output layer.
features_dim: 1280

# Whisper wrapper, configured as encoder only and with the encoder not frozen.
whisper: !new:speechbrain.lobes.models.huggingface_transformers.whisper.Whisper
    source: !ref <whisper_hub>
    encoder_only: True
    freeze_encoder: False
    # NOTE(review): the original reference target was lost; <whisper_hub> is
    # an assumption (the other plausible key is <pretrained_path>) - confirm.
    save_path: !ref <whisper_hub>

# Attention pooling over features of size `features_dim`.
attention_pooling: !new:speechbrain.nnet.pooling.AttentionPooling
    input_dim: !ref <features_dim>

# Bias-free linear layer mapping `features_dim` inputs to `n_languages`
# output neurons.
output_mlp: !new:speechbrain.nnet.linear.Linear
    input_size: !ref <features_dim>
    n_neurons: !ref <n_languages>
    bias: False

# Modules exposed to the consumer of this config, keyed by name.
modules:
    whisper: !ref <whisper>
    attention_pooling: !ref <attention_pooling>
    output_mlp: !ref <output_mlp>

# Softmax activation configured with `apply_log: True`.
log_softmax: !new:speechbrain.nnet.activations.Softmax
    apply_log: True

# Categorical encoder; its content is loaded from `dialect_encoder.txt`
# through the pretrainer below.
label_encoder: !new:speechbrain.dataio.encoder.CategoricalEncoder

# Maps each loadable object to the checkpoint file it is restored from.
# Every path is rooted at `pretrained_path`.
pretrainer: !new:speechbrain.utils.parameter_transfer.Pretrainer
    loadables:
        whisper: !ref <whisper>
        attention_pooling: !ref <attention_pooling>
        output_mlp: !ref <output_mlp>
        label_encoder: !ref <label_encoder>
    paths:
        whisper: !ref <pretrained_path>/whisper.ckpt
        attention_pooling: !ref <pretrained_path>/attention_pooling.ckpt
        output_mlp: !ref <pretrained_path>/output_mlp.ckpt
        label_encoder: !ref <pretrained_path>/dialect_encoder.txt