r3gm's picture
v0.5.0
b152010
raw history blame
No virus
23.3 kB
from .logging_setup import logger
# Display label -> language code for the "unidirectional" language set.
# NOTE(review): the name suggests these languages are supported in one
# direction only (presumably as a translation target) - confirm with callers.
LANGUAGES_UNIDIRECTIONAL = {
    "Aymara (ay)": "ay",
    "Bambara (bm)": "bm",
    "Cebuano (ceb)": "ceb",
    "Chichewa (ny)": "ny",
    "Divehi (dv)": "dv",
    "Dogri (doi)": "doi",
    "Ewe (ee)": "ee",
    "Guarani (gn)": "gn",
    "Iloko (ilo)": "ilo",
    "Kinyarwanda (rw)": "rw",
    "Krio (kri)": "kri",
    "Kurdish (ku)": "ku",
    "Kirghiz (ky)": "ky",
    "Ganda (lg)": "lg",
    "Maithili (mai)": "mai",
    "Oriya (or)": "or",
    "Oromo (om)": "om",
    "Quechua (qu)": "qu",
    "Samoan (sm)": "sm",
    "Tigrinya (ti)": "ti",
    "Tsonga (ts)": "ts",
    "Akan (ak)": "ak",
    "Uighur (ug)": "ug",
}

# Key view over the labels above. Despite the name this is a ``dict_keys``
# view, not a list: it tracks later changes to the dict and is not indexable.
UNIDIRECTIONAL_L_LIST = LANGUAGES_UNIDIRECTIONAL.keys()
# Display label -> language code for every selectable language.
# The first entry is the "Automatic detection" sentinel and must stay first:
# LANGUAGES_LIST below pins element 0 and sorts only the remainder.
# Inline notes are the original author's remarks about individual languages.
LANGUAGES = {
    "Automatic detection": "Automatic detection",
    "Arabic (ar)": "ar",
    "Chinese - Simplified (zh-CN)": "zh",
    "Czech (cs)": "cs",
    "Danish (da)": "da",
    "Dutch (nl)": "nl",
    "English (en)": "en",
    "Finnish (fi)": "fi",
    "French (fr)": "fr",
    "German (de)": "de",
    "Greek (el)": "el",
    "Hebrew (he)": "he",
    "Hungarian (hu)": "hu",
    "Italian (it)": "it",
    "Japanese (ja)": "ja",
    "Korean (ko)": "ko",
    "Persian (fa)": "fa",  # no aux gTTS
    "Polish (pl)": "pl",
    "Portuguese (pt)": "pt",
    "Russian (ru)": "ru",
    "Spanish (es)": "es",
    "Turkish (tr)": "tr",
    "Ukrainian (uk)": "uk",
    "Urdu (ur)": "ur",
    "Vietnamese (vi)": "vi",
    "Hindi (hi)": "hi",
    "Indonesian (id)": "id",
    "Bengali (bn)": "bn",
    "Telugu (te)": "te",
    "Marathi (mr)": "mr",
    "Tamil (ta)": "ta",
    "Javanese (jw|jv)": "jw",
    "Catalan (ca)": "ca",
    "Nepali (ne)": "ne",
    "Thai (th)": "th",
    "Swedish (sv)": "sv",
    "Amharic (am)": "am",
    "Welsh (cy)": "cy",  # no aux gTTS
    "Estonian (et)": "et",
    "Croatian (hr)": "hr",
    "Icelandic (is)": "is",
    "Georgian (ka)": "ka",  # no aux gTTS
    "Khmer (km)": "km",
    "Slovak (sk)": "sk",
    "Albanian (sq)": "sq",
    "Serbian (sr)": "sr",
    "Azerbaijani (az)": "az",  # no aux gTTS
    "Bulgarian (bg)": "bg",
    "Galician (gl)": "gl",  # no aux gTTS
    "Gujarati (gu)": "gu",
    "Kazakh (kk)": "kk",  # no aux gTTS
    "Kannada (kn)": "kn",
    "Lithuanian (lt)": "lt",  # no aux gTTS
    "Latvian (lv)": "lv",
    "Macedonian (mk)": "mk",  # no aux gTTS; error getting the align model
    "Malayalam (ml)": "ml",
    "Malay (ms)": "ms",  # error getting the align model
    "Romanian (ro)": "ro",
    "Sinhala (si)": "si",
    "Sundanese (su)": "su",
    "Swahili (sw)": "sw",  # align error
    "Afrikaans (af)": "af",
    "Bosnian (bs)": "bs",
    "Latin (la)": "la",
    "Myanmar Burmese (my)": "my",
    "Norwegian (no|nb)": "no",
    "Chinese - Traditional (zh-TW)": "zh-TW",
    "Assamese (as)": "as",
    "Basque (eu)": "eu",
    "Hausa (ha)": "ha",
    "Haitian Creole (ht)": "ht",
    "Armenian (hy)": "hy",
    "Lao (lo)": "lo",
    "Malagasy (mg)": "mg",
    "Mongolian (mn)": "mn",
    "Maltese (mt)": "mt",
    "Punjabi (pa)": "pa",
    "Pashto (ps)": "ps",
    "Slovenian (sl)": "sl",
    "Shona (sn)": "sn",
    "Somali (so)": "so",
    "Tajik (tg)": "tg",
    "Turkmen (tk)": "tk",
    "Tatar (tt)": "tt",
    "Uzbek (uz)": "uz",
    "Yoruba (yo)": "yo",
    # The unidirectional languages are appended after the main set.
    **LANGUAGES_UNIDIRECTIONAL,
}

# Key view over every display label (a ``dict_keys`` view, not a list).
BASE_L_LIST = LANGUAGES.keys()

# Labels for display: the first label stays on top, the rest are sorted.
LANGUAGES_LIST = [next(iter(BASE_L_LIST)), *sorted(list(BASE_L_LIST)[1:])]

# Reverse lookup: language code -> display label.
INVERTED_LANGUAGES = {code: label for label, code in LANGUAGES.items()}
# Language code -> wav2vec2 alignment model identifier.
# The values look like Hugging Face repository ids; an empty string means no
# model is configured for that code here.
# NOTE(review): how consumers treat an empty string is not visible in this
# file - confirm. A trailing comment next to an empty value is the original
# author's note naming a candidate model.
EXTRA_ALIGN = {
    "id": "indonesian-nlp/wav2vec2-large-xlsr-indonesian",
    "bn": "arijitx/wav2vec2-large-xlsr-bengali",
    "mr": "sumedh/wav2vec2-large-xlsr-marathi",
    "ta": "Amrrs/wav2vec2-large-xlsr-53-tamil",
    "jw": "cahya/wav2vec2-large-xlsr-javanese",
    "ne": "shniranjan/wav2vec2-large-xlsr-300m-nepali",
    "th": "sakares/wav2vec2-large-xlsr-thai-demo",
    "sv": "KBLab/wav2vec2-large-voxrex-swedish",
    "am": "agkphysics/wav2vec2-large-xlsr-53-amharic",
    "cy": "Srulikbdd/Wav2Vec2-large-xlsr-welsh",
    "et": "anton-l/wav2vec2-large-xlsr-53-estonian",
    "hr": "classla/wav2vec2-xls-r-parlaspeech-hr",
    "is": "carlosdanielhernandezmena/wav2vec2-large-xlsr-53-icelandic-ep10-1000h",
    "ka": "MehdiHosseiniMoghadam/wav2vec2-large-xlsr-53-Georgian",
    "km": "vitouphy/wav2vec2-xls-r-300m-khmer",
    "sk": "infinitejoy/wav2vec2-large-xls-r-300m-slovak",
    "sq": "Alimzhan/wav2vec2-large-xls-r-300m-albanian-colab",
    "sr": "dnikolic/wav2vec2-xlsr-530-serbian-colab",
    "az": "nijatzeynalov/wav2vec2-large-mms-1b-azerbaijani-common_voice15.0",
    "bg": "infinitejoy/wav2vec2-large-xls-r-300m-bulgarian",
    "gl": "ifrz/wav2vec2-large-xlsr-galician",
    "gu": "Harveenchadha/vakyansh-wav2vec2-gujarati-gnm-100",
    "kk": "aismlv/wav2vec2-large-xlsr-kazakh",
    "kn": "Harveenchadha/vakyansh-wav2vec2-kannada-knm-560",
    "lt": "DeividasM/wav2vec2-large-xlsr-53-lithuanian",
    "lv": "anton-l/wav2vec2-large-xlsr-53-latvian",
    "mk": "",  # Konstantin-Bogdanoski/wav2vec2-macedonian-base
    "ml": "gvs/wav2vec2-large-xlsr-malayalam",
    "ms": "",  # Duy/wav2vec2_malay
    "ro": "anton-l/wav2vec2-large-xlsr-53-romanian",
    "si": "IAmNotAnanth/wav2vec2-large-xls-r-300m-sinhala",
    "su": "cahya/wav2vec2-large-xlsr-sundanese",
    "sw": "",  # Lians/fine-tune-wav2vec2-large-swahili
    "af": "",  # ylacombe/wav2vec2-common_voice-af-demo
    "bs": "",
    "la": "",
    "my": "",
    "no": "NbAiLab/wav2vec2-xlsr-300m-norwegian",
    "zh-TW": "jonatasgrosman/wav2vec2-large-xlsr-53-chinese-zh-cn",
    "as": "",
    "eu": "",  # cahya/wav2vec2-large-xlsr-basque (verify)
    "ha": "infinitejoy/wav2vec2-large-xls-r-300m-hausa",
    "ht": "",
    "hy": "infinitejoy/wav2vec2-large-xls-r-300m-armenian",  # no (.)
    "lo": "",
    "mg": "",
    "mn": "tugstugi/wav2vec2-large-xlsr-53-mongolian",
    "mt": "carlosdanielhernandezmena/wav2vec2-large-xlsr-53-maltese-64h",
    "pa": "kingabzpro/wav2vec2-large-xlsr-53-punjabi",
    "ps": "aamirhs/wav2vec2-large-xls-r-300m-pashto-colab",
    "sl": "anton-l/wav2vec2-large-xlsr-53-slovenian",
    "sn": "",
    "so": "",
    "tg": "",
    "tk": "",  # Ragav/wav2vec2-tk
    "tt": "anton-l/wav2vec2-large-xlsr-53-tatar",
    "uz": "",  # Mekhriddin/wav2vec2-large-xls-r-300m-uzbek-colab
    "yo": "ogbi/wav2vec2-large-mms-1b-yoruba-test",
}
def fix_code_language(translate_to, syntax="google"):
    """Rewrite a language code into the spelling a given backend expects.

    Args:
        translate_to: Language code to normalise (e.g. ``"zh"``, ``"he"``).
        syntax: Naming convention to target. ``"google"`` covers
            google-translator and gTTS; ``"coqui"`` covers coqui-xtts.
            Any other value applies no remapping.

    Returns:
        The remapped code, or ``translate_to`` unchanged when the selected
        convention has no entry for it.
    """
    if syntax == "google":
        # google-translator, gTTS
        replace_lang_code = {"zh": "zh-CN", "he": "iw", "zh-cn": "zh-CN"}
    elif syntax == "coqui":
        # coqui-xtts
        replace_lang_code = {"zh": "zh-cn", "zh-CN": "zh-cn", "zh-TW": "zh-cn"}
    else:
        # An unrecognised syntax used to leave the table unbound and crash
        # with UnboundLocalError; fall back to "no remapping" instead.
        replace_lang_code = {}

    new_code_lang = replace_lang_code.get(translate_to, translate_to)
    logger.debug(f"Fix code {translate_to} -> {new_code_lang}")
    return new_code_lang
# Bark voices: display label -> preset identifier.
#   label : "<lang>_speaker_<n>-<Male|Female> BARK"
#   preset: "v2/<lang>_speaker_<n>"
# Every language has speakers 0-9. The ten-letter string lists the gender
# shown in the label for speakers 0..9 in order ("M" = Male, "F" = Female).
# Languages are emitted in the order given, speakers in ascending order.
BARK_VOICES_LIST = {
    f"{lang}_speaker_{idx}-{'Female' if gender == 'F' else 'Male'} BARK":
        f"v2/{lang}_speaker_{idx}"
    for lang, genders in (
        ("de", "MMMFMMMMFM"),
        ("en", "MMMMMMMMMF"),
        ("es", "MMMMMMMMFF"),
        ("fr", "MFFMMFMMMM"),
        ("hi", "FFMFFMMMMF"),
        ("it", "MMFMMMMFMF"),
        ("ja", "FFMFFFMFFF"),
        ("ko", "FMMMMMMMMM"),
        ("pl", "MMMMFMFMMF"),
        ("pt", "MMMMMMMMMM"),
        ("ru", "MMMMMFFMMF"),
        ("tr", "MMMMFFMMMM"),
        ("zh", "MMMMFMFFMF"),
    )
    for idx, gender in enumerate(genders)
}
# VITS voices: display label -> model repository id.
# Labels end in "-facebook-mms VITS"; all but one value point at a
# "facebook/mms-tts-<code>" repository.
# Commented-out entries are voices the original author left disabled; they
# are kept so the omission stays visible.
VITS_VOICES_LIST = {
    "ar-facebook-mms VITS": "facebook/mms-tts-ara",
    # "zh-facebook-mms VITS": "facebook/mms-tts-cmn",
    "zh_Hakka-facebook-mms VITS": "facebook/mms-tts-hak",
    "zh_MinNan-facebook-mms VITS": "facebook/mms-tts-nan",
    # "cs-facebook-mms VITS": "facebook/mms-tts-ces",
    # "da-facebook-mms VITS": "facebook/mms-tts-dan",
    "nl-facebook-mms VITS": "facebook/mms-tts-nld",
    "en-facebook-mms VITS": "facebook/mms-tts-eng",
    "fi-facebook-mms VITS": "facebook/mms-tts-fin",
    "fr-facebook-mms VITS": "facebook/mms-tts-fra",
    "de-facebook-mms VITS": "facebook/mms-tts-deu",
    "el-facebook-mms VITS": "facebook/mms-tts-ell",
    "el_Ancient-facebook-mms VITS": "facebook/mms-tts-grc",
    "he-facebook-mms VITS": "facebook/mms-tts-heb",
    "hu-facebook-mms VITS": "facebook/mms-tts-hun",
    # "it-facebook-mms VITS": "facebook/mms-tts-ita",
    # "ja-facebook-mms VITS": "facebook/mms-tts-jpn",
    "ko-facebook-mms VITS": "facebook/mms-tts-kor",
    "fa-facebook-mms VITS": "facebook/mms-tts-fas",
    "pl-facebook-mms VITS": "facebook/mms-tts-pol",
    "pt-facebook-mms VITS": "facebook/mms-tts-por",
    "ru-facebook-mms VITS": "facebook/mms-tts-rus",
    "es-facebook-mms VITS": "facebook/mms-tts-spa",
    "tr-facebook-mms VITS": "facebook/mms-tts-tur",
    "uk-facebook-mms VITS": "facebook/mms-tts-ukr",
    "ur_arabic-facebook-mms VITS": "facebook/mms-tts-urd-script_arabic",
    "ur_devanagari-facebook-mms VITS": "facebook/mms-tts-urd-script_devanagari",
    "ur_latin-facebook-mms VITS": "facebook/mms-tts-urd-script_latin",
    "vi-facebook-mms VITS": "facebook/mms-tts-vie",
    "hi-facebook-mms VITS": "facebook/mms-tts-hin",
    "hi_Fiji-facebook-mms VITS": "facebook/mms-tts-hif",
    "id-facebook-mms VITS": "facebook/mms-tts-ind",
    "bn-facebook-mms VITS": "facebook/mms-tts-ben",
    "te-facebook-mms VITS": "facebook/mms-tts-tel",
    "mr-facebook-mms VITS": "facebook/mms-tts-mar",
    "ta-facebook-mms VITS": "facebook/mms-tts-tam",
    "jw-facebook-mms VITS": "facebook/mms-tts-jav",
    "jw_Suriname-facebook-mms VITS": "facebook/mms-tts-jvn",
    "ca-facebook-mms VITS": "facebook/mms-tts-cat",
    "ne-facebook-mms VITS": "facebook/mms-tts-nep",
    "th-facebook-mms VITS": "facebook/mms-tts-tha",
    "th_Northern-facebook-mms VITS": "facebook/mms-tts-nod",
    "sv-facebook-mms VITS": "facebook/mms-tts-swe",
    "am-facebook-mms VITS": "facebook/mms-tts-amh",
    "cy-facebook-mms VITS": "facebook/mms-tts-cym",
    # "et-facebook-mms VITS": "facebook/mms-tts-est",
    # "hr-facebook-mms VITS": "facebook/mms-tts-hrv",
    "is-facebook-mms VITS": "facebook/mms-tts-isl",
    "km-facebook-mms VITS": "facebook/mms-tts-khm",
    "km_Northern-facebook-mms VITS": "facebook/mms-tts-kxm",
    # "sk-facebook-mms VITS": "facebook/mms-tts-slk",
    "sq_Northern-facebook-mms VITS": "facebook/mms-tts-sqi",
    "az_South-facebook-mms VITS": "facebook/mms-tts-azb",
    "az_North_script_cyrillic-facebook-mms VITS": "facebook/mms-tts-azj-script_cyrillic",
    "az_North_script_latin-facebook-mms VITS": "facebook/mms-tts-azj-script_latin",
    "bg-facebook-mms VITS": "facebook/mms-tts-bul",
    # "gl-facebook-mms VITS": "facebook/mms-tts-glg",
    "gu-facebook-mms VITS": "facebook/mms-tts-guj",
    "kk-facebook-mms VITS": "facebook/mms-tts-kaz",
    "kn-facebook-mms VITS": "facebook/mms-tts-kan",
    # "lt-facebook-mms VITS": "facebook/mms-tts-lit",
    "lv-facebook-mms VITS": "facebook/mms-tts-lav",
    # "mk-facebook-mms VITS": "facebook/mms-tts-mkd",
    "ml-facebook-mms VITS": "facebook/mms-tts-mal",
    "ms-facebook-mms VITS": "facebook/mms-tts-zlm",
    "ms_Central-facebook-mms VITS": "facebook/mms-tts-pse",
    "ms_Manado-facebook-mms VITS": "facebook/mms-tts-xmm",
    "ro-facebook-mms VITS": "facebook/mms-tts-ron",
    # "si-facebook-mms VITS": "facebook/mms-tts-sin",
    "sw-facebook-mms VITS": "facebook/mms-tts-swh",
    # "af-facebook-mms VITS": "facebook/mms-tts-afr",
    # "bs-facebook-mms VITS": "facebook/mms-tts-bos",
    "la-facebook-mms VITS": "facebook/mms-tts-lat",
    "my-facebook-mms VITS": "facebook/mms-tts-mya",
    # "no_Bokmål-facebook-mms VITS": "thomasht86/mms-tts-nob",  # verify
    "as-facebook-mms VITS": "facebook/mms-tts-asm",
    "as_Nagamese-facebook-mms VITS": "facebook/mms-tts-nag",
    "eu-facebook-mms VITS": "facebook/mms-tts-eus",
    "ha-facebook-mms VITS": "facebook/mms-tts-hau",
    "ht-facebook-mms VITS": "facebook/mms-tts-hat",
    "hy_Western-facebook-mms VITS": "facebook/mms-tts-hyw",
    "lo-facebook-mms VITS": "facebook/mms-tts-lao",
    "mg-facebook-mms VITS": "facebook/mms-tts-mlg",
    "mn-facebook-mms VITS": "facebook/mms-tts-mon",
    # "mt-facebook-mms VITS": "facebook/mms-tts-mlt",
    "pa_Eastern-facebook-mms VITS": "facebook/mms-tts-pan",
    # "pa_Western-facebook-mms VITS": "facebook/mms-tts-pnb",
    # "ps-facebook-mms VITS": "facebook/mms-tts-pus",
    # "sl-facebook-mms VITS": "facebook/mms-tts-slv",
    "sn-facebook-mms VITS": "facebook/mms-tts-sna",
    # NOTE(review): the ISO 639-3 code for Somali is "som"; confirm that the
    # "son" repository below is the intended one.
    "so-facebook-mms VITS": "facebook/mms-tts-son",
    "tg-facebook-mms VITS": "facebook/mms-tts-tgk",
    "tk_script_arabic-facebook-mms VITS": "facebook/mms-tts-tuk-script_arabic",
    "tk_script_latin-facebook-mms VITS": "facebook/mms-tts-tuk-script_latin",
    "tt-facebook-mms VITS": "facebook/mms-tts-tat",
    "tt_Crimean-facebook-mms VITS": "facebook/mms-tts-crh",
    "uz_script_cyrillic-facebook-mms VITS": "facebook/mms-tts-uzb-script_cyrillic",
    "yo-facebook-mms VITS": "facebook/mms-tts-yor",
    "ay-facebook-mms VITS": "facebook/mms-tts-ayr",
    "bm-facebook-mms VITS": "facebook/mms-tts-bam",
    "ceb-facebook-mms VITS": "facebook/mms-tts-ceb",
    "ny-facebook-mms VITS": "facebook/mms-tts-nya",
    "dv-facebook-mms VITS": "facebook/mms-tts-div",
    "doi-facebook-mms VITS": "facebook/mms-tts-dgo",
    "ee-facebook-mms VITS": "facebook/mms-tts-ewe",
    "gn-facebook-mms VITS": "facebook/mms-tts-grn",
    "ilo-facebook-mms VITS": "facebook/mms-tts-ilo",
    "rw-facebook-mms VITS": "facebook/mms-tts-kin",
    "kri-facebook-mms VITS": "facebook/mms-tts-kri",
    "ku_script_arabic-facebook-mms VITS": "facebook/mms-tts-kmr-script_arabic",
    "ku_script_cyrillic-facebook-mms VITS": "facebook/mms-tts-kmr-script_cyrillic",
    "ku_script_latin-facebook-mms VITS": "facebook/mms-tts-kmr-script_latin",
    "ckb-facebook-mms VITS": "razhan/mms-tts-ckb",  # Verify w
    "ky-facebook-mms VITS": "facebook/mms-tts-kir",
    "lg-facebook-mms VITS": "facebook/mms-tts-lug",
    "mai-facebook-mms VITS": "facebook/mms-tts-mai",
    "or-facebook-mms VITS": "facebook/mms-tts-ory",
    "om-facebook-mms VITS": "facebook/mms-tts-orm",
    "qu_Huallaga-facebook-mms VITS": "facebook/mms-tts-qub",
    "qu_Lambayeque-facebook-mms VITS": "facebook/mms-tts-quf",
    "qu_South_Bolivian-facebook-mms VITS": "facebook/mms-tts-quh",
    "qu_North_Bolivian-facebook-mms VITS": "facebook/mms-tts-qul",
    "qu_Tena_Lowland-facebook-mms VITS": "facebook/mms-tts-quw",
    "qu_Ayacucho-facebook-mms VITS": "facebook/mms-tts-quy",
    "qu_Cusco-facebook-mms VITS": "facebook/mms-tts-quz",
    "qu_Cajamarca-facebook-mms VITS": "facebook/mms-tts-qvc",
    "qu_Eastern_Apurímac-facebook-mms VITS": "facebook/mms-tts-qve",
    "qu_Huamalíes_Dos_de_Mayo_Huánuco-facebook-mms VITS": "facebook/mms-tts-qvh",
    "qu_Margos_Yarowilca_Lauricocha-facebook-mms VITS": "facebook/mms-tts-qvm",
    "qu_North_Junín-facebook-mms VITS": "facebook/mms-tts-qvn",
    "qu_Napo-facebook-mms VITS": "facebook/mms-tts-qvo",
    "qu_San_Martín-facebook-mms VITS": "facebook/mms-tts-qvs",
    "qu_Huaylla_Wanca-facebook-mms VITS": "facebook/mms-tts-qvw",
    "qu_Northern_Pastaza-facebook-mms VITS": "facebook/mms-tts-qvz",
    "qu_Huaylas_Ancash-facebook-mms VITS": "facebook/mms-tts-qwh",
    "qu_Panao-facebook-mms VITS": "facebook/mms-tts-qxh",
    "qu_Salasaca_Highland-facebook-mms VITS": "facebook/mms-tts-qxl",
    "qu_Northern_Conchucos_Ancash-facebook-mms VITS": "facebook/mms-tts-qxn",
    "qu_Southern_Conchucos-facebook-mms VITS": "facebook/mms-tts-qxo",
    "qu_Cañar_Highland-facebook-mms VITS": "facebook/mms-tts-qxr",
    "sm-facebook-mms VITS": "facebook/mms-tts-smo",
    "ti-facebook-mms VITS": "facebook/mms-tts-tir",
    "ts-facebook-mms VITS": "facebook/mms-tts-tso",
    "ak-facebook-mms VITS": "facebook/mms-tts-aka",
    "ug_script_arabic-facebook-mms VITS": "facebook/mms-tts-uig-script_arabic",
    "ug_script_cyrillic-facebook-mms VITS": "facebook/mms-tts-uig-script_cyrillic",
}
# Language codes listed for the OpenAI TTS backend (order preserved).
OPENAI_TTS_CODES = [
    "af", "ar", "hy", "az", "be", "bs", "bg", "ca",
    "zh", "hr", "cs", "da", "nl", "en", "et", "fi",
    "fr", "gl", "de", "el", "he", "hi", "hu", "is",
    "id", "it", "ja", "kn", "kk", "ko", "lv", "lt",
    "mk", "ms", "mr", "mi", "ne", "no", "fa", "pl",
    "pt", "ro", "ru", "sr", "sk", "sl", "es", "sw",
    "sv", "tl", "ta", "th", "tr", "uk", "ur", "vi",
    "cy", "zh-TW",
]
# Display labels for the OpenAI TTS voices: the six standard voices first,
# then the same six with the " HD" marker. Label form: ">name[ HD] OpenAI-TTS".
OPENAI_TTS_MODELS = [
    f">{voice}{quality} OpenAI-TTS"
    for quality in ("", " HD")
    for voice in ("alloy", "echo", "fable", "onyx", "nova", "shimmer")
]
# Language code (as used for the LANGUAGES values) -> three-letter code.
# "Automatic detection" maps to the placeholder "aut".
# Only the codes listed here have a three-letter form in this table.
LANGUAGE_CODE_IN_THREE_LETTERS = {
    "Automatic detection": "aut",
    "ar": "ara",
    "zh": "chi",
    "cs": "cze",
    "da": "dan",
    "nl": "dut",
    "en": "eng",
    "fi": "fin",
    "fr": "fre",
    "de": "ger",
    "el": "gre",
    "he": "heb",
    "hu": "hun",
    "it": "ita",
    "ja": "jpn",
    "ko": "kor",
    "fa": "per",
    "pl": "pol",
    "pt": "por",
    "ru": "rus",
    "es": "spa",
    "tr": "tur",
    "uk": "ukr",
    "ur": "urd",
    "vi": "vie",
    "hi": "hin",
    "id": "ind",
    "bn": "ben",
    "te": "tel",
    "mr": "mar",
    "ta": "tam",
    "jw": "jav",
    "ca": "cat",
    "ne": "nep",
    "th": "tha",
    "sv": "swe",
    "am": "amh",
    "cy": "cym",
    "et": "est",
    "hr": "hrv",
    "is": "isl",
    "km": "khm",
    "sk": "slk",
    "sq": "sqi",
    "sr": "srp",
}