alkiskoudounas's picture
Upload with huggingface_hub
beb4f6b verified
{
  "_name_or_path": "jonatasgrosman/wav2vec2-large-xlsr-53-italian",
  "activation_dropout": 0.05,
  "adapter_kernel_size": 3,
  "adapter_stride": 2,
  "add_adapter": false,
  "apply_spec_augment": true,
  "architectures": [
    "Wav2Vec2ForSequenceClassification"
  ],
  "attention_dropout": 0.1,
  "bos_token_id": 1,
  "classifier_proj_size": 256,
  "codevector_dim": 768,
  "contrastive_logits_temperature": 0.1,
  "conv_bias": true,
  "conv_dim": [
    512,
    512,
    512,
    512,
    512,
    512,
    512
  ],
  "conv_kernel": [
    10,
    3,
    3,
    3,
    3,
    2,
    2
  ],
  "conv_stride": [
    5,
    2,
    2,
    2,
    2,
    2,
    2
  ],
  "ctc_loss_reduction": "mean",
  "ctc_zero_infinity": true,
  "diversity_loss_weight": 0.1,
  "do_stable_layer_norm": true,
  "eos_token_id": 2,
  "feat_extract_activation": "gelu",
  "feat_extract_dropout": 0.0,
  "feat_extract_norm": "layer",
  "feat_proj_dropout": 0.05,
  "feat_quantizer_dropout": 0.0,
  "final_dropout": 0.0,
  "hidden_act": "gelu",
  "hidden_dropout": 0.05,
  "hidden_size": 1024,
  "id2label": {
    "0": "cooking_query",
    "1": "iot_hue_lightdim",
    "10": "news_query",
    "11": "music_likeness",
    "12": "iot_wemo_off",
    "13": "iot_hue_lighton",
    "14": "iot_wemo_on",
    "15": "iot_coffee",
    "16": "social_post",
    "17": "qa_maths",
    "18": "iot_hue_lightup",
    "19": "music_query",
    "2": "cooking_recipe",
    "20": "transport_taxi",
    "21": "qa_stock",
    "22": "play_radio",
    "23": "play_music",
    "24": "audio_volume_up",
    "25": "calendar_remove",
    "26": "alarm_remove",
    "27": "recommendation_locations",
    "28": "general_joke",
    "29": "email_sendemail",
    "3": "email_addcontact",
    "30": "audio_volume_mute",
    "31": "iot_cleaning",
    "32": "social_query",
    "33": "play_game",
    "34": "recommendation_events",
    "35": "alarm_set",
    "36": "calendar_set",
    "37": "audio_volume_down",
    "38": "lists_createoradd",
    "39": "calendar_query",
    "4": "weather_query",
    "40": "general_greet",
    "41": "qa_factoid",
    "42": "takeaway_order",
    "43": "transport_query",
    "44": "iot_hue_lightchange",
    "45": "play_podcasts",
    "46": "transport_ticket",
    "47": "qa_definition",
    "48": "lists_query",
    "49": "email_query",
    "5": "takeaway_query",
    "50": "datetime_convert",
    "51": "iot_hue_lightoff",
    "52": "alarm_query",
    "53": "audio_volume_other",
    "54": "lists_remove",
    "55": "datetime_query",
    "56": "qa_currency",
    "57": "transport_traffic",
    "58": "music_dislikeness",
    "59": "music_settings",
    "6": "email_querycontact",
    "7": "play_audiobook",
    "8": "recommendation_movies",
    "9": "general_quirky"
  },
  "initializer_range": 0.02,
  "intermediate_size": 4096,
  "label2id": {
    "alarm_query": 52,
    "alarm_remove": 26,
    "alarm_set": 35,
    "audio_volume_down": 37,
    "audio_volume_mute": 30,
    "audio_volume_other": 53,
    "audio_volume_up": 24,
    "calendar_query": 39,
    "calendar_remove": 25,
    "calendar_set": 36,
    "cooking_query": 0,
    "cooking_recipe": 2,
    "datetime_convert": 50,
    "datetime_query": 55,
    "email_addcontact": 3,
    "email_query": 49,
    "email_querycontact": 6,
    "email_sendemail": 29,
    "general_greet": 40,
    "general_joke": 28,
    "general_quirky": 9,
    "iot_cleaning": 31,
    "iot_coffee": 15,
    "iot_hue_lightchange": 44,
    "iot_hue_lightdim": 1,
    "iot_hue_lightoff": 51,
    "iot_hue_lighton": 13,
    "iot_hue_lightup": 18,
    "iot_wemo_off": 12,
    "iot_wemo_on": 14,
    "lists_createoradd": 38,
    "lists_query": 48,
    "lists_remove": 54,
    "music_dislikeness": 58,
    "music_likeness": 11,
    "music_query": 19,
    "music_settings": 59,
    "news_query": 10,
    "play_audiobook": 7,
    "play_game": 33,
    "play_music": 23,
    "play_podcasts": 45,
    "play_radio": 22,
    "qa_currency": 56,
    "qa_definition": 47,
    "qa_factoid": 41,
    "qa_maths": 17,
    "qa_stock": 21,
    "recommendation_events": 34,
    "recommendation_locations": 27,
    "recommendation_movies": 8,
    "social_post": 16,
    "social_query": 32,
    "takeaway_order": 42,
    "takeaway_query": 5,
    "transport_query": 43,
    "transport_taxi": 20,
    "transport_ticket": 46,
    "transport_traffic": 57,
    "weather_query": 4
  },
  "layer_norm_eps": 1e-05,
  "layerdrop": 0.05,
  "mask_channel_length": 10,
  "mask_channel_min_space": 1,
  "mask_channel_other": 0.0,
  "mask_channel_prob": 0.0,
  "mask_channel_selection": "static",
  "mask_feature_length": 10,
  "mask_feature_min_masks": 0,
  "mask_feature_prob": 0.0,
  "mask_time_length": 10,
  "mask_time_min_masks": 2,
  "mask_time_min_space": 1,
  "mask_time_other": 0.0,
  "mask_time_prob": 0.05,
  "mask_time_selection": "static",
  "model_type": "wav2vec2",
  "num_adapter_layers": 3,
  "num_attention_heads": 16,
  "num_codevector_groups": 2,
  "num_codevectors_per_group": 320,
  "num_conv_pos_embedding_groups": 16,
  "num_conv_pos_embeddings": 128,
  "num_feat_extract_layers": 7,
  "num_hidden_layers": 24,
  "num_negatives": 100,
  "output_hidden_size": 1024,
  "pad_token_id": 0,
  "proj_codevector_dim": 768,
  "tdnn_dilation": [
    1,
    2,
    3,
    1,
    1
  ],
  "tdnn_dim": [
    512,
    512,
    512,
    512,
    1500
  ],
  "tdnn_kernel": [
    5,
    3,
    3,
    1,
    1
  ],
  "torch_dtype": "float32",
  "transformers_version": "4.26.0.dev0",
  "use_weighted_layer_sum": false,
  "vocab_size": 44,
  "xvector_output_dim": 512
}