detect_language / config.json
apparaomulpuriril's picture
Upload 16 files
d80ea50 verified
{
"_name_or_path": "sanchit-gandhi/whisper-medium-fleurs-lang-id",
"activation_dropout": 0.0,
"activation_function": "gelu",
"apply_spec_augment": false,
"architectures": [
"WhisperForAudioClassification"
],
"attention_dropout": 0.0,
"begin_suppress_tokens": [
220,
50257
],
"bos_token_id": 50257,
"classifier_proj_size": 256,
"d_model": 1024,
"decoder_attention_heads": 16,
"decoder_ffn_dim": 4096,
"decoder_layerdrop": 0.0,
"decoder_layers": 24,
"decoder_start_token_id": 50258,
"dropout": 0.0,
"encoder_attention_heads": 16,
"encoder_ffn_dim": 4096,
"encoder_layerdrop": 0.0,
"encoder_layers": 24,
"eos_token_id": 50257,
"finetuning_task": "audio-classification",
"forced_decoder_ids": [
[
1,
50259
],
[
2,
50359
],
[
3,
50363
]
],
"id2label": {
"0": "Afrikaans",
"1": "Amharic",
"2": "Arabic",
"3": "Assamese",
"4": "Asturian",
"5": "Azerbaijani",
"6": "Belarusian",
"7": "Bulgarian",
"8": "Bengali",
"9": "Bosnian",
"10": "Catalan",
"11": "Cebuano",
"12": "Sorani-Kurdish",
"13": "Mandarin Chinese",
"14": "Czech",
"15": "Welsh",
"16": "Danish",
"17": "German",
"18": "Greek",
"19": "English",
"20": "Spanish",
"21": "Estonian",
"22": "Persian",
"23": "Fula",
"24": "Finnish",
"25": "Filipino",
"26": "French",
"27": "Irish",
"28": "Galician",
"29": "Gujarati",
"30": "Hausa",
"31": "Hebrew",
"32": "Hindi",
"33": "Croatian",
"34": "Hungarian",
"35": "Armenian",
"36": "Indonesian",
"37": "Igbo",
"38": "Icelandic",
"39": "Italian",
"40": "Japanese",
"41": "Javanese",
"42": "Georgian",
"43": "Kamba",
"44": "Kabuverdianu",
"45": "Kazakh",
"46": "Khmer",
"47": "Kannada",
"48": "Korean",
"49": "Kyrgyz",
"50": "Luxembourgish",
"51": "Ganda",
"52": "Lingala",
"53": "Lao",
"54": "Lithuanian",
"55": "Luo",
"56": "Latvian",
"57": "Maori",
"58": "Macedonian",
"59": "Malayalam",
"60": "Mongolian",
"61": "Marathi",
"62": "Malay",
"63": "Maltese",
"64": "Burmese",
"65": "Norwegian",
"66": "Nepali",
"67": "Dutch",
"68": "Northern-Sotho",
"69": "Nyanja",
"70": "Occitan",
"71": "Oromo",
"72": "Oriya",
"73": "Punjabi",
"74": "Polish",
"75": "Pashto",
"76": "Portuguese",
"77": "Romanian",
"78": "Russian",
"79": "Sindhi",
"80": "Slovak",
"81": "Slovenian",
"82": "Shona",
"83": "Somali",
"84": "Serbian",
"85": "Swedish",
"86": "Swahili",
"87": "Tamil",
"88": "Telugu",
"89": "Tajik",
"90": "Thai",
"91": "Turkish",
"92": "Ukrainian",
"93": "Umbundu",
"94": "Urdu",
"95": "Uzbek",
"96": "Vietnamese",
"97": "Wolof",
"98": "Xhosa",
"99": "Yoruba",
"100": "Cantonese Chinese",
"101": "Zulu"
},
"init_std": 0.02,
"is_encoder_decoder": true,
"label2id": {
"Afrikaans": "0",
"Amharic": "1",
"Arabic": "2",
"Armenian": "35",
"Assamese": "3",
"Asturian": "4",
"Azerbaijani": "5",
"Belarusian": "6",
"Bengali": "8",
"Bosnian": "9",
"Bulgarian": "7",
"Burmese": "64",
"Cantonese Chinese": "100",
"Catalan": "10",
"Cebuano": "11",
"Croatian": "33",
"Czech": "14",
"Danish": "16",
"Dutch": "67",
"English": "19",
"Estonian": "21",
"Filipino": "25",
"Finnish": "24",
"French": "26",
"Fula": "23",
"Galician": "28",
"Ganda": "51",
"Georgian": "42",
"German": "17",
"Greek": "18",
"Gujarati": "29",
"Hausa": "30",
"Hebrew": "31",
"Hindi": "32",
"Hungarian": "34",
"Icelandic": "38",
"Igbo": "37",
"Indonesian": "36",
"Irish": "27",
"Italian": "39",
"Japanese": "40",
"Javanese": "41",
"Kabuverdianu": "44",
"Kamba": "43",
"Kannada": "47",
"Kazakh": "45",
"Khmer": "46",
"Korean": "48",
"Kyrgyz": "49",
"Lao": "53",
"Latvian": "56",
"Lingala": "52",
"Lithuanian": "54",
"Luo": "55",
"Luxembourgish": "50",
"Macedonian": "58",
"Malay": "62",
"Malayalam": "59",
"Maltese": "63",
"Mandarin Chinese": "13",
"Maori": "57",
"Marathi": "61",
"Mongolian": "60",
"Nepali": "66",
"Northern-Sotho": "68",
"Norwegian": "65",
"Nyanja": "69",
"Occitan": "70",
"Oriya": "72",
"Oromo": "71",
"Pashto": "75",
"Persian": "22",
"Polish": "74",
"Portuguese": "76",
"Punjabi": "73",
"Romanian": "77",
"Russian": "78",
"Serbian": "84",
"Shona": "82",
"Sindhi": "79",
"Slovak": "80",
"Slovenian": "81",
"Somali": "83",
"Sorani-Kurdish": "12",
"Spanish": "20",
"Swahili": "86",
"Swedish": "85",
"Tajik": "89",
"Tamil": "87",
"Telugu": "88",
"Thai": "90",
"Turkish": "91",
"Ukrainian": "92",
"Umbundu": "93",
"Urdu": "94",
"Uzbek": "95",
"Vietnamese": "96",
"Welsh": "15",
"Wolof": "97",
"Xhosa": "98",
"Yoruba": "99",
"Zulu": "101"
},
"mask_feature_length": 10,
"mask_feature_min_masks": 0,
"mask_feature_prob": 0.0,
"mask_time_length": 10,
"mask_time_min_masks": 2,
"mask_time_prob": 0.05,
"max_length": 448,
"max_source_positions": 1500,
"max_target_positions": 448,
"model_type": "whisper",
"num_hidden_layers": 24,
"num_mel_bins": 80,
"pad_token_id": 50257,
"scale_embedding": false,
"suppress_tokens": [
1,
2,
7,
8,
9,
10,
14,
25,
26,
27,
28,
29,
31,
58,
59,
60,
61,
62,
63,
90,
91,
92,
93,
359,
503,
522,
542,
873,
893,
902,
918,
922,
931,
1350,
1853,
1982,
2460,
2627,
3246,
3253,
3268,
3536,
3846,
3961,
4183,
4667,
6585,
6647,
7273,
9061,
9383,
10428,
10929,
11938,
12033,
12331,
12562,
13793,
14157,
14635,
15265,
15618,
16553,
16604,
18362,
18956,
20075,
21675,
22520,
26130,
26161,
26435,
28279,
29464,
31650,
32302,
32470,
36865,
42863,
47425,
49870,
50254,
50258,
50360,
50361,
50362
],
"torch_dtype": "float16",
"transformers_version": "4.30.0.dev0",
"use_cache": true,
"use_weighted_layer_sum": false,
"vocab_size": 51865
}