{ "_name_or_path": "sanchit-gandhi/whisper-medium-fleurs-lang-id", "activation_dropout": 0.0, "activation_function": "gelu", "apply_spec_augment": false, "architectures": [ "WhisperForAudioClassification" ], "attention_dropout": 0.0, "begin_suppress_tokens": [ 220, 50257 ], "bos_token_id": 50257, "classifier_proj_size": 256, "d_model": 1024, "decoder_attention_heads": 16, "decoder_ffn_dim": 4096, "decoder_layerdrop": 0.0, "decoder_layers": 24, "decoder_start_token_id": 50258, "dropout": 0.0, "encoder_attention_heads": 16, "encoder_ffn_dim": 4096, "encoder_layerdrop": 0.0, "encoder_layers": 24, "eos_token_id": 50257, "finetuning_task": "audio-classification", "forced_decoder_ids": [ [ 1, 50259 ], [ 2, 50359 ], [ 3, 50363 ] ], "id2label": { "0": "Afrikaans", "1": "Amharic", "2": "Arabic", "3": "Assamese", "4": "Asturian", "5": "Azerbaijani", "6": "Belarusian", "7": "Bulgarian", "8": "Bengali", "9": "Bosnian", "10": "Catalan", "11": "Cebuano", "12": "Sorani-Kurdish", "13": "Mandarin Chinese", "14": "Czech", "15": "Welsh", "16": "Danish", "17": "German", "18": "Greek", "19": "English", "20": "Spanish", "21": "Estonian", "22": "Persian", "23": "Fula", "24": "Finnish", "25": "Filipino", "26": "French", "27": "Irish", "28": "Galician", "29": "Gujarati", "30": "Hausa", "31": "Hebrew", "32": "Hindi", "33": "Croatian", "34": "Hungarian", "35": "Armenian", "36": "Indonesian", "37": "Igbo", "38": "Icelandic", "39": "Italian", "40": "Japanese", "41": "Javanese", "42": "Georgian", "43": "Kamba", "44": "Kabuverdianu", "45": "Kazakh", "46": "Khmer", "47": "Kannada", "48": "Korean", "49": "Kyrgyz", "50": "Luxembourgish", "51": "Ganda", "52": "Lingala", "53": "Lao", "54": "Lithuanian", "55": "Luo", "56": "Latvian", "57": "Maori", "58": "Macedonian", "59": "Malayalam", "60": "Mongolian", "61": "Marathi", "62": "Malay", "63": "Maltese", "64": "Burmese", "65": "Norwegian", "66": "Nepali", "67": "Dutch", "68": "Northern-Sotho", "69": "Nyanja", "70": "Occitan", "71": "Oromo", "72": "Oriya", "73": "Punjabi", "74": "Polish", "75": "Pashto", "76": "Portuguese", "77": "Romanian", "78": "Russian", "79": "Sindhi", "80": "Slovak", "81": "Slovenian", "82": "Shona", "83": "Somali", "84": "Serbian", "85": "Swedish", "86": "Swahili", "87": "Tamil", "88": "Telugu", "89": "Tajik", "90": "Thai", "91": "Turkish", "92": "Ukrainian", "93": "Umbundu", "94": "Urdu", "95": "Uzbek", "96": "Vietnamese", "97": "Wolof", "98": "Xhosa", "99": "Yoruba", "100": "Cantonese Chinese", "101": "Zulu" }, "init_std": 0.02, "is_encoder_decoder": true, "label2id": { "Afrikaans": "0", "Amharic": "1", "Arabic": "2", "Armenian": "35", "Assamese": "3", "Asturian": "4", "Azerbaijani": "5", "Belarusian": "6", "Bengali": "8", "Bosnian": "9", "Bulgarian": "7", "Burmese": "64", "Cantonese Chinese": "100", "Catalan": "10", "Cebuano": "11", "Croatian": "33", "Czech": "14", "Danish": "16", "Dutch": "67", "English": "19", "Estonian": "21", "Filipino": "25", "Finnish": "24", "French": "26", "Fula": "23", "Galician": "28", "Ganda": "51", "Georgian": "42", "German": "17", "Greek": "18", "Gujarati": "29", "Hausa": "30", "Hebrew": "31", "Hindi": "32", "Hungarian": "34", "Icelandic": "38", "Igbo": "37", "Indonesian": "36", "Irish": "27", "Italian": "39", "Japanese": "40", "Javanese": "41", "Kabuverdianu": "44", "Kamba": "43", "Kannada": "47", "Kazakh": "45", "Khmer": "46", "Korean": "48", "Kyrgyz": "49", "Lao": "53", "Latvian": "56", "Lingala": "52", "Lithuanian": "54", "Luo": "55", "Luxembourgish": "50", "Macedonian": "58", "Malay": "62", "Malayalam": "59", "Maltese": "63", "Mandarin Chinese": "13", "Maori": "57", "Marathi": "61", "Mongolian": "60", "Nepali": "66", "Northern-Sotho": "68", "Norwegian": "65", "Nyanja": "69", "Occitan": "70", "Oriya": "72", "Oromo": "71", "Pashto": "75", "Persian": "22", "Polish": "74", "Portuguese": "76", "Punjabi": "73", "Romanian": "77", "Russian": "78", "Serbian": "84", "Shona": "82", "Sindhi": "79", "Slovak": "80", "Slovenian": "81", "Somali": "83", "Sorani-Kurdish": "12", "Spanish": "20", "Swahili": "86", "Swedish": "85", "Tajik": "89", "Tamil": "87", "Telugu": "88", "Thai": "90", "Turkish": "91", "Ukrainian": "92", "Umbundu": "93", "Urdu": "94", "Uzbek": "95", "Vietnamese": "96", "Welsh": "15", "Wolof": "97", "Xhosa": "98", "Yoruba": "99", "Zulu": "101" }, "mask_feature_length": 10, "mask_feature_min_masks": 0, "mask_feature_prob": 0.0, "mask_time_length": 10, "mask_time_min_masks": 2, "mask_time_prob": 0.05, "max_length": 448, "max_source_positions": 1500, "max_target_positions": 448, "model_type": "whisper", "num_hidden_layers": 24, "num_mel_bins": 80, "pad_token_id": 50257, "scale_embedding": false, "suppress_tokens": [ 1, 2, 7, 8, 9, 10, 14, 25, 26, 27, 28, 29, 31, 58, 59, 60, 61, 62, 63, 90, 91, 92, 93, 359, 503, 522, 542, 873, 893, 902, 918, 922, 931, 1350, 1853, 1982, 2460, 2627, 3246, 3253, 3268, 3536, 3846, 3961, 4183, 4667, 6585, 6647, 7273, 9061, 9383, 10428, 10929, 11938, 12033, 12331, 12562, 13793, 14157, 14635, 15265, 15618, 16553, 16604, 18362, 18956, 20075, 21675, 22520, 26130, 26161, 26435, 28279, 29464, 31650, 32302, 32470, 36865, 42863, 47425, 49870, 50254, 50258, 50360, 50361, 50362 ], "torch_dtype": "float16", "transformers_version": "4.30.0.dev0", "use_cache": true, "use_weighted_layer_sum": false, "vocab_size": 51865 }