Spaces:
Sleeping
Sleeping
from .logging_setup import logger | |
LANGUAGES_UNIDIRECTIONAL = { | |
"Aymara (ay)": "ay", | |
"Bambara (bm)": "bm", | |
"Cebuano (ceb)": "ceb", | |
"Chichewa (ny)": "ny", | |
"Divehi (dv)": "dv", | |
"Dogri (doi)": "doi", | |
"Ewe (ee)": "ee", | |
"Guarani (gn)": "gn", | |
"Iloko (ilo)": "ilo", | |
"Kinyarwanda (rw)": "rw", | |
"Krio (kri)": "kri", | |
"Kurdish (ku)": "ku", | |
"Kirghiz (ky)": "ky", | |
"Ganda (lg)": "lg", | |
"Maithili (mai)": "mai", | |
"Oriya (or)": "or", | |
"Oromo (om)": "om", | |
"Quechua (qu)": "qu", | |
"Samoan (sm)": "sm", | |
"Tigrinya (ti)": "ti", | |
"Tsonga (ts)": "ts", | |
"Akan (ak)": "ak", | |
"Uighur (ug)": "ug" | |
} | |
UNIDIRECTIONAL_L_LIST = LANGUAGES_UNIDIRECTIONAL.keys() | |
LANGUAGES = { | |
"Automatic detection": "Automatic detection", | |
"Arabic (ar)": "ar", | |
"Chinese - Simplified (zh-CN)": "zh", | |
"Czech (cs)": "cs", | |
"Danish (da)": "da", | |
"Dutch (nl)": "nl", | |
"English (en)": "en", | |
"Finnish (fi)": "fi", | |
"French (fr)": "fr", | |
"German (de)": "de", | |
"Greek (el)": "el", | |
"Hebrew (he)": "he", | |
"Hungarian (hu)": "hu", | |
"Italian (it)": "it", | |
"Japanese (ja)": "ja", | |
"Korean (ko)": "ko", | |
"Persian (fa)": "fa", # no aux gTTS | |
"Polish (pl)": "pl", | |
"Portuguese (pt)": "pt", | |
"Russian (ru)": "ru", | |
"Spanish (es)": "es", | |
"Turkish (tr)": "tr", | |
"Ukrainian (uk)": "uk", | |
"Urdu (ur)": "ur", | |
"Vietnamese (vi)": "vi", | |
"Hindi (hi)": "hi", | |
"Indonesian (id)": "id", | |
"Bengali (bn)": "bn", | |
"Telugu (te)": "te", | |
"Marathi (mr)": "mr", | |
"Tamil (ta)": "ta", | |
"Javanese (jw|jv)": "jw", | |
"Catalan (ca)": "ca", | |
"Nepali (ne)": "ne", | |
"Thai (th)": "th", | |
"Swedish (sv)": "sv", | |
"Amharic (am)": "am", | |
"Welsh (cy)": "cy", # no aux gTTS | |
"Estonian (et)": "et", | |
"Croatian (hr)": "hr", | |
"Icelandic (is)": "is", | |
"Georgian (ka)": "ka", # no aux gTTS | |
"Khmer (km)": "km", | |
"Slovak (sk)": "sk", | |
"Albanian (sq)": "sq", | |
"Serbian (sr)": "sr", | |
"Azerbaijani (az)": "az", # no aux gTTS | |
"Bulgarian (bg)": "bg", | |
"Galician (gl)": "gl", # no aux gTTS | |
"Gujarati (gu)": "gu", | |
"Kazakh (kk)": "kk", # no aux gTTS | |
"Kannada (kn)": "kn", | |
"Lithuanian (lt)": "lt", # no aux gTTS | |
"Latvian (lv)": "lv", | |
"Macedonian (mk)": "mk", # no aux gTTS # error get align model | |
"Malayalam (ml)": "ml", | |
"Malay (ms)": "ms", # error get align model | |
"Romanian (ro)": "ro", | |
"Sinhala (si)": "si", | |
"Sundanese (su)": "su", | |
"Swahili (sw)": "sw", # error aling | |
"Afrikaans (af)": "af", | |
"Bosnian (bs)": "bs", | |
"Latin (la)": "la", | |
"Myanmar Burmese (my)": "my", | |
"Norwegian (no|nb)": "no", | |
"Chinese - Traditional (zh-TW)": "zh-TW", | |
"Assamese (as)": "as", | |
"Basque (eu)": "eu", | |
"Hausa (ha)": "ha", | |
"Haitian Creole (ht)": "ht", | |
"Armenian (hy)": "hy", | |
"Lao (lo)": "lo", | |
"Malagasy (mg)": "mg", | |
"Mongolian (mn)": "mn", | |
"Maltese (mt)": "mt", | |
"Punjabi (pa)": "pa", | |
"Pashto (ps)": "ps", | |
"Slovenian (sl)": "sl", | |
"Shona (sn)": "sn", | |
"Somali (so)": "so", | |
"Tajik (tg)": "tg", | |
"Turkmen (tk)": "tk", | |
"Tatar (tt)": "tt", | |
"Uzbek (uz)": "uz", | |
"Yoruba (yo)": "yo", | |
**LANGUAGES_UNIDIRECTIONAL | |
} | |
BASE_L_LIST = LANGUAGES.keys() | |
LANGUAGES_LIST = [list(BASE_L_LIST)[0]] + sorted(list(BASE_L_LIST)[1:]) | |
INVERTED_LANGUAGES = {value: key for key, value in LANGUAGES.items()} | |
EXTRA_ALIGN = { | |
"id": "indonesian-nlp/wav2vec2-large-xlsr-indonesian", | |
"bn": "arijitx/wav2vec2-large-xlsr-bengali", | |
"mr": "sumedh/wav2vec2-large-xlsr-marathi", | |
"ta": "Amrrs/wav2vec2-large-xlsr-53-tamil", | |
"jw": "cahya/wav2vec2-large-xlsr-javanese", | |
"ne": "shniranjan/wav2vec2-large-xlsr-300m-nepali", | |
"th": "sakares/wav2vec2-large-xlsr-thai-demo", | |
"sv": "KBLab/wav2vec2-large-voxrex-swedish", | |
"am": "agkphysics/wav2vec2-large-xlsr-53-amharic", | |
"cy": "Srulikbdd/Wav2Vec2-large-xlsr-welsh", | |
"et": "anton-l/wav2vec2-large-xlsr-53-estonian", | |
"hr": "classla/wav2vec2-xls-r-parlaspeech-hr", | |
"is": "carlosdanielhernandezmena/wav2vec2-large-xlsr-53-icelandic-ep10-1000h", | |
"ka": "MehdiHosseiniMoghadam/wav2vec2-large-xlsr-53-Georgian", | |
"km": "vitouphy/wav2vec2-xls-r-300m-khmer", | |
"sk": "infinitejoy/wav2vec2-large-xls-r-300m-slovak", | |
"sq": "Alimzhan/wav2vec2-large-xls-r-300m-albanian-colab", | |
"sr": "dnikolic/wav2vec2-xlsr-530-serbian-colab", | |
"az": "nijatzeynalov/wav2vec2-large-mms-1b-azerbaijani-common_voice15.0", | |
"bg": "infinitejoy/wav2vec2-large-xls-r-300m-bulgarian", | |
"gl": "ifrz/wav2vec2-large-xlsr-galician", | |
"gu": "Harveenchadha/vakyansh-wav2vec2-gujarati-gnm-100", | |
"kk": "aismlv/wav2vec2-large-xlsr-kazakh", | |
"kn": "Harveenchadha/vakyansh-wav2vec2-kannada-knm-560", | |
"lt": "DeividasM/wav2vec2-large-xlsr-53-lithuanian", | |
"lv": "anton-l/wav2vec2-large-xlsr-53-latvian", | |
"mk": "", # Konstantin-Bogdanoski/wav2vec2-macedonian-base | |
"ml": "gvs/wav2vec2-large-xlsr-malayalam", | |
"ms": "", # Duy/wav2vec2_malay | |
"ro": "anton-l/wav2vec2-large-xlsr-53-romanian", | |
"si": "IAmNotAnanth/wav2vec2-large-xls-r-300m-sinhala", | |
"su": "cahya/wav2vec2-large-xlsr-sundanese", | |
"sw": "", # Lians/fine-tune-wav2vec2-large-swahili | |
"af": "", # ylacombe/wav2vec2-common_voice-af-demo | |
"bs": "", | |
"la": "", | |
"my": "", | |
"no": "NbAiLab/wav2vec2-xlsr-300m-norwegian", | |
"zh-TW": "jonatasgrosman/wav2vec2-large-xlsr-53-chinese-zh-cn", | |
"as": "", | |
"eu": "", # cahya/wav2vec2-large-xlsr-basque # verify | |
"ha": "infinitejoy/wav2vec2-large-xls-r-300m-hausa", | |
"ht": "", | |
"hy": "infinitejoy/wav2vec2-large-xls-r-300m-armenian", # no (.) | |
"lo": "", | |
"mg": "", | |
"mn": "tugstugi/wav2vec2-large-xlsr-53-mongolian", | |
"mt": "carlosdanielhernandezmena/wav2vec2-large-xlsr-53-maltese-64h", | |
"pa": "kingabzpro/wav2vec2-large-xlsr-53-punjabi", | |
"ps": "aamirhs/wav2vec2-large-xls-r-300m-pashto-colab", | |
"sl": "anton-l/wav2vec2-large-xlsr-53-slovenian", | |
"sn": "", | |
"so": "", | |
"tg": "", | |
"tk": "", # Ragav/wav2vec2-tk | |
"tt": "anton-l/wav2vec2-large-xlsr-53-tatar", | |
"uz": "", # Mekhriddin/wav2vec2-large-xls-r-300m-uzbek-colab | |
"yo": "ogbi/wav2vec2-large-mms-1b-yoruba-test", | |
} | |
def fix_code_language(translate_to, syntax="google"): | |
if syntax == "google": | |
# google-translator, gTTS | |
replace_lang_code = {"zh": "zh-CN", "he": "iw", "zh-cn": "zh-CN"} | |
elif syntax == "coqui": | |
# coqui-xtts | |
replace_lang_code = {"zh": "zh-cn", "zh-CN": "zh-cn", "zh-TW": "zh-cn"} | |
new_code_lang = replace_lang_code.get(translate_to, translate_to) | |
logger.debug(f"Fix code {translate_to} -> {new_code_lang}") | |
return new_code_lang | |
BARK_VOICES_LIST = { | |
"de_speaker_0-Male BARK": "v2/de_speaker_0", | |
"de_speaker_1-Male BARK": "v2/de_speaker_1", | |
"de_speaker_2-Male BARK": "v2/de_speaker_2", | |
"de_speaker_3-Female BARK": "v2/de_speaker_3", | |
"de_speaker_4-Male BARK": "v2/de_speaker_4", | |
"de_speaker_5-Male BARK": "v2/de_speaker_5", | |
"de_speaker_6-Male BARK": "v2/de_speaker_6", | |
"de_speaker_7-Male BARK": "v2/de_speaker_7", | |
"de_speaker_8-Female BARK": "v2/de_speaker_8", | |
"de_speaker_9-Male BARK": "v2/de_speaker_9", | |
"en_speaker_0-Male BARK": "v2/en_speaker_0", | |
"en_speaker_1-Male BARK": "v2/en_speaker_1", | |
"en_speaker_2-Male BARK": "v2/en_speaker_2", | |
"en_speaker_3-Male BARK": "v2/en_speaker_3", | |
"en_speaker_4-Male BARK": "v2/en_speaker_4", | |
"en_speaker_5-Male BARK": "v2/en_speaker_5", | |
"en_speaker_6-Male BARK": "v2/en_speaker_6", | |
"en_speaker_7-Male BARK": "v2/en_speaker_7", | |
"en_speaker_8-Male BARK": "v2/en_speaker_8", | |
"en_speaker_9-Female BARK": "v2/en_speaker_9", | |
"es_speaker_0-Male BARK": "v2/es_speaker_0", | |
"es_speaker_1-Male BARK": "v2/es_speaker_1", | |
"es_speaker_2-Male BARK": "v2/es_speaker_2", | |
"es_speaker_3-Male BARK": "v2/es_speaker_3", | |
"es_speaker_4-Male BARK": "v2/es_speaker_4", | |
"es_speaker_5-Male BARK": "v2/es_speaker_5", | |
"es_speaker_6-Male BARK": "v2/es_speaker_6", | |
"es_speaker_7-Male BARK": "v2/es_speaker_7", | |
"es_speaker_8-Female BARK": "v2/es_speaker_8", | |
"es_speaker_9-Female BARK": "v2/es_speaker_9", | |
"fr_speaker_0-Male BARK": "v2/fr_speaker_0", | |
"fr_speaker_1-Female BARK": "v2/fr_speaker_1", | |
"fr_speaker_2-Female BARK": "v2/fr_speaker_2", | |
"fr_speaker_3-Male BARK": "v2/fr_speaker_3", | |
"fr_speaker_4-Male BARK": "v2/fr_speaker_4", | |
"fr_speaker_5-Female BARK": "v2/fr_speaker_5", | |
"fr_speaker_6-Male BARK": "v2/fr_speaker_6", | |
"fr_speaker_7-Male BARK": "v2/fr_speaker_7", | |
"fr_speaker_8-Male BARK": "v2/fr_speaker_8", | |
"fr_speaker_9-Male BARK": "v2/fr_speaker_9", | |
"hi_speaker_0-Female BARK": "v2/hi_speaker_0", | |
"hi_speaker_1-Female BARK": "v2/hi_speaker_1", | |
"hi_speaker_2-Male BARK": "v2/hi_speaker_2", | |
"hi_speaker_3-Female BARK": "v2/hi_speaker_3", | |
"hi_speaker_4-Female BARK": "v2/hi_speaker_4", | |
"hi_speaker_5-Male BARK": "v2/hi_speaker_5", | |
"hi_speaker_6-Male BARK": "v2/hi_speaker_6", | |
"hi_speaker_7-Male BARK": "v2/hi_speaker_7", | |
"hi_speaker_8-Male BARK": "v2/hi_speaker_8", | |
"hi_speaker_9-Female BARK": "v2/hi_speaker_9", | |
"it_speaker_0-Male BARK": "v2/it_speaker_0", | |
"it_speaker_1-Male BARK": "v2/it_speaker_1", | |
"it_speaker_2-Female BARK": "v2/it_speaker_2", | |
"it_speaker_3-Male BARK": "v2/it_speaker_3", | |
"it_speaker_4-Male BARK": "v2/it_speaker_4", | |
"it_speaker_5-Male BARK": "v2/it_speaker_5", | |
"it_speaker_6-Male BARK": "v2/it_speaker_6", | |
"it_speaker_7-Female BARK": "v2/it_speaker_7", | |
"it_speaker_8-Male BARK": "v2/it_speaker_8", | |
"it_speaker_9-Female BARK": "v2/it_speaker_9", | |
"ja_speaker_0-Female BARK": "v2/ja_speaker_0", | |
"ja_speaker_1-Female BARK": "v2/ja_speaker_1", | |
"ja_speaker_2-Male BARK": "v2/ja_speaker_2", | |
"ja_speaker_3-Female BARK": "v2/ja_speaker_3", | |
"ja_speaker_4-Female BARK": "v2/ja_speaker_4", | |
"ja_speaker_5-Female BARK": "v2/ja_speaker_5", | |
"ja_speaker_6-Male BARK": "v2/ja_speaker_6", | |
"ja_speaker_7-Female BARK": "v2/ja_speaker_7", | |
"ja_speaker_8-Female BARK": "v2/ja_speaker_8", | |
"ja_speaker_9-Female BARK": "v2/ja_speaker_9", | |
"ko_speaker_0-Female BARK": "v2/ko_speaker_0", | |
"ko_speaker_1-Male BARK": "v2/ko_speaker_1", | |
"ko_speaker_2-Male BARK": "v2/ko_speaker_2", | |
"ko_speaker_3-Male BARK": "v2/ko_speaker_3", | |
"ko_speaker_4-Male BARK": "v2/ko_speaker_4", | |
"ko_speaker_5-Male BARK": "v2/ko_speaker_5", | |
"ko_speaker_6-Male BARK": "v2/ko_speaker_6", | |
"ko_speaker_7-Male BARK": "v2/ko_speaker_7", | |
"ko_speaker_8-Male BARK": "v2/ko_speaker_8", | |
"ko_speaker_9-Male BARK": "v2/ko_speaker_9", | |
"pl_speaker_0-Male BARK": "v2/pl_speaker_0", | |
"pl_speaker_1-Male BARK": "v2/pl_speaker_1", | |
"pl_speaker_2-Male BARK": "v2/pl_speaker_2", | |
"pl_speaker_3-Male BARK": "v2/pl_speaker_3", | |
"pl_speaker_4-Female BARK": "v2/pl_speaker_4", | |
"pl_speaker_5-Male BARK": "v2/pl_speaker_5", | |
"pl_speaker_6-Female BARK": "v2/pl_speaker_6", | |
"pl_speaker_7-Male BARK": "v2/pl_speaker_7", | |
"pl_speaker_8-Male BARK": "v2/pl_speaker_8", | |
"pl_speaker_9-Female BARK": "v2/pl_speaker_9", | |
"pt_speaker_0-Male BARK": "v2/pt_speaker_0", | |
"pt_speaker_1-Male BARK": "v2/pt_speaker_1", | |
"pt_speaker_2-Male BARK": "v2/pt_speaker_2", | |
"pt_speaker_3-Male BARK": "v2/pt_speaker_3", | |
"pt_speaker_4-Male BARK": "v2/pt_speaker_4", | |
"pt_speaker_5-Male BARK": "v2/pt_speaker_5", | |
"pt_speaker_6-Male BARK": "v2/pt_speaker_6", | |
"pt_speaker_7-Male BARK": "v2/pt_speaker_7", | |
"pt_speaker_8-Male BARK": "v2/pt_speaker_8", | |
"pt_speaker_9-Male BARK": "v2/pt_speaker_9", | |
"ru_speaker_0-Male BARK": "v2/ru_speaker_0", | |
"ru_speaker_1-Male BARK": "v2/ru_speaker_1", | |
"ru_speaker_2-Male BARK": "v2/ru_speaker_2", | |
"ru_speaker_3-Male BARK": "v2/ru_speaker_3", | |
"ru_speaker_4-Male BARK": "v2/ru_speaker_4", | |
"ru_speaker_5-Female BARK": "v2/ru_speaker_5", | |
"ru_speaker_6-Female BARK": "v2/ru_speaker_6", | |
"ru_speaker_7-Male BARK": "v2/ru_speaker_7", | |
"ru_speaker_8-Male BARK": "v2/ru_speaker_8", | |
"ru_speaker_9-Female BARK": "v2/ru_speaker_9", | |
"tr_speaker_0-Male BARK": "v2/tr_speaker_0", | |
"tr_speaker_1-Male BARK": "v2/tr_speaker_1", | |
"tr_speaker_2-Male BARK": "v2/tr_speaker_2", | |
"tr_speaker_3-Male BARK": "v2/tr_speaker_3", | |
"tr_speaker_4-Female BARK": "v2/tr_speaker_4", | |
"tr_speaker_5-Female BARK": "v2/tr_speaker_5", | |
"tr_speaker_6-Male BARK": "v2/tr_speaker_6", | |
"tr_speaker_7-Male BARK": "v2/tr_speaker_7", | |
"tr_speaker_8-Male BARK": "v2/tr_speaker_8", | |
"tr_speaker_9-Male BARK": "v2/tr_speaker_9", | |
"zh_speaker_0-Male BARK": "v2/zh_speaker_0", | |
"zh_speaker_1-Male BARK": "v2/zh_speaker_1", | |
"zh_speaker_2-Male BARK": "v2/zh_speaker_2", | |
"zh_speaker_3-Male BARK": "v2/zh_speaker_3", | |
"zh_speaker_4-Female BARK": "v2/zh_speaker_4", | |
"zh_speaker_5-Male BARK": "v2/zh_speaker_5", | |
"zh_speaker_6-Female BARK": "v2/zh_speaker_6", | |
"zh_speaker_7-Female BARK": "v2/zh_speaker_7", | |
"zh_speaker_8-Male BARK": "v2/zh_speaker_8", | |
"zh_speaker_9-Female BARK": "v2/zh_speaker_9", | |
} | |
VITS_VOICES_LIST = { | |
"ar-facebook-mms VITS": "facebook/mms-tts-ara", | |
# 'zh-facebook-mms VITS': 'facebook/mms-tts-cmn', | |
"zh_Hakka-facebook-mms VITS": "facebook/mms-tts-hak", | |
"zh_MinNan-facebook-mms VITS": "facebook/mms-tts-nan", | |
# 'cs-facebook-mms VITS': 'facebook/mms-tts-ces', | |
# 'da-facebook-mms VITS': 'facebook/mms-tts-dan', | |
"nl-facebook-mms VITS": "facebook/mms-tts-nld", | |
"en-facebook-mms VITS": "facebook/mms-tts-eng", | |
"fi-facebook-mms VITS": "facebook/mms-tts-fin", | |
"fr-facebook-mms VITS": "facebook/mms-tts-fra", | |
"de-facebook-mms VITS": "facebook/mms-tts-deu", | |
"el-facebook-mms VITS": "facebook/mms-tts-ell", | |
"el_Ancient-facebook-mms VITS": "facebook/mms-tts-grc", | |
"he-facebook-mms VITS": "facebook/mms-tts-heb", | |
"hu-facebook-mms VITS": "facebook/mms-tts-hun", | |
# 'it-facebook-mms VITS': 'facebook/mms-tts-ita', | |
# 'ja-facebook-mms VITS': 'facebook/mms-tts-jpn', | |
"ko-facebook-mms VITS": "facebook/mms-tts-kor", | |
"fa-facebook-mms VITS": "facebook/mms-tts-fas", | |
"pl-facebook-mms VITS": "facebook/mms-tts-pol", | |
"pt-facebook-mms VITS": "facebook/mms-tts-por", | |
"ru-facebook-mms VITS": "facebook/mms-tts-rus", | |
"es-facebook-mms VITS": "facebook/mms-tts-spa", | |
"tr-facebook-mms VITS": "facebook/mms-tts-tur", | |
"uk-facebook-mms VITS": "facebook/mms-tts-ukr", | |
"ur_arabic-facebook-mms VITS": "facebook/mms-tts-urd-script_arabic", | |
"ur_devanagari-facebook-mms VITS": "facebook/mms-tts-urd-script_devanagari", | |
"ur_latin-facebook-mms VITS": "facebook/mms-tts-urd-script_latin", | |
"vi-facebook-mms VITS": "facebook/mms-tts-vie", | |
"hi-facebook-mms VITS": "facebook/mms-tts-hin", | |
"hi_Fiji-facebook-mms VITS": "facebook/mms-tts-hif", | |
"id-facebook-mms VITS": "facebook/mms-tts-ind", | |
"bn-facebook-mms VITS": "facebook/mms-tts-ben", | |
"te-facebook-mms VITS": "facebook/mms-tts-tel", | |
"mr-facebook-mms VITS": "facebook/mms-tts-mar", | |
"ta-facebook-mms VITS": "facebook/mms-tts-tam", | |
"jw-facebook-mms VITS": "facebook/mms-tts-jav", | |
"jw_Suriname-facebook-mms VITS": "facebook/mms-tts-jvn", | |
"ca-facebook-mms VITS": "facebook/mms-tts-cat", | |
"ne-facebook-mms VITS": "facebook/mms-tts-nep", | |
"th-facebook-mms VITS": "facebook/mms-tts-tha", | |
"th_Northern-facebook-mms VITS": "facebook/mms-tts-nod", | |
"sv-facebook-mms VITS": "facebook/mms-tts-swe", | |
"am-facebook-mms VITS": "facebook/mms-tts-amh", | |
"cy-facebook-mms VITS": "facebook/mms-tts-cym", | |
# "et-facebook-mms VITS": "facebook/mms-tts-est", | |
# "ht-facebook-mms VITS": "facebook/mms-tts-hrv", | |
"is-facebook-mms VITS": "facebook/mms-tts-isl", | |
"km-facebook-mms VITS": "facebook/mms-tts-khm", | |
"km_Northern-facebook-mms VITS": "facebook/mms-tts-kxm", | |
# "sk-facebook-mms VITS": "facebook/mms-tts-slk", | |
"sq_Northern-facebook-mms VITS": "facebook/mms-tts-sqi", | |
"az_South-facebook-mms VITS": "facebook/mms-tts-azb", | |
"az_North_script_cyrillic-facebook-mms VITS": "facebook/mms-tts-azj-script_cyrillic", | |
"az_North_script_latin-facebook-mms VITS": "facebook/mms-tts-azj-script_latin", | |
"bg-facebook-mms VITS": "facebook/mms-tts-bul", | |
# "gl-facebook-mms VITS": "facebook/mms-tts-glg", | |
"gu-facebook-mms VITS": "facebook/mms-tts-guj", | |
"kk-facebook-mms VITS": "facebook/mms-tts-kaz", | |
"kn-facebook-mms VITS": "facebook/mms-tts-kan", | |
# "lt-facebook-mms VITS": "facebook/mms-tts-lit", | |
"lv-facebook-mms VITS": "facebook/mms-tts-lav", | |
# "mk-facebook-mms VITS": "facebook/mms-tts-mkd", | |
"ml-facebook-mms VITS": "facebook/mms-tts-mal", | |
"ms-facebook-mms VITS": "facebook/mms-tts-zlm", | |
"ms_Central-facebook-mms VITS": "facebook/mms-tts-pse", | |
"ms_Manado-facebook-mms VITS": "facebook/mms-tts-xmm", | |
"ro-facebook-mms VITS": "facebook/mms-tts-ron", | |
# "si-facebook-mms VITS": "facebook/mms-tts-sin", | |
"sw-facebook-mms VITS": "facebook/mms-tts-swh", | |
# "af-facebook-mms VITS": "facebook/mms-tts-afr", | |
# "bs-facebook-mms VITS": "facebook/mms-tts-bos", | |
"la-facebook-mms VITS": "facebook/mms-tts-lat", | |
"my-facebook-mms VITS": "facebook/mms-tts-mya", | |
# "no_Bokmål-facebook-mms VITS": "thomasht86/mms-tts-nob", # verify | |
"as-facebook-mms VITS": "facebook/mms-tts-asm", | |
"as_Nagamese-facebook-mms VITS": "facebook/mms-tts-nag", | |
"eu-facebook-mms VITS": "facebook/mms-tts-eus", | |
"ha-facebook-mms VITS": "facebook/mms-tts-hau", | |
"ht-facebook-mms VITS": "facebook/mms-tts-hat", | |
"hy_Western-facebook-mms VITS": "facebook/mms-tts-hyw", | |
"lo-facebook-mms VITS": "facebook/mms-tts-lao", | |
"mg-facebook-mms VITS": "facebook/mms-tts-mlg", | |
"mn-facebook-mms VITS": "facebook/mms-tts-mon", | |
# "mt-facebook-mms VITS": "facebook/mms-tts-mlt", | |
"pa_Eastern-facebook-mms VITS": "facebook/mms-tts-pan", | |
# "pa_Western-facebook-mms VITS": "facebook/mms-tts-pnb", | |
# "ps-facebook-mms VITS": "facebook/mms-tts-pus", | |
# "sl-facebook-mms VITS": "facebook/mms-tts-slv", | |
"sn-facebook-mms VITS": "facebook/mms-tts-sna", | |
"so-facebook-mms VITS": "facebook/mms-tts-son", | |
"tg-facebook-mms VITS": "facebook/mms-tts-tgk", | |
"tk_script_arabic-facebook-mms VITS": "facebook/mms-tts-tuk-script_arabic", | |
"tk_script_latin-facebook-mms VITS": "facebook/mms-tts-tuk-script_latin", | |
"tt-facebook-mms VITS": "facebook/mms-tts-tat", | |
"tt_Crimean-facebook-mms VITS": "facebook/mms-tts-crh", | |
"uz_script_cyrillic-facebook-mms VITS": "facebook/mms-tts-uzb-script_cyrillic", | |
"yo-facebook-mms VITS": "facebook/mms-tts-yor", | |
"ay-facebook-mms VITS": "facebook/mms-tts-ayr", | |
"bm-facebook-mms VITS": "facebook/mms-tts-bam", | |
"ceb-facebook-mms VITS": "facebook/mms-tts-ceb", | |
"ny-facebook-mms VITS": "facebook/mms-tts-nya", | |
"dv-facebook-mms VITS": "facebook/mms-tts-div", | |
"doi-facebook-mms VITS": "facebook/mms-tts-dgo", | |
"ee-facebook-mms VITS": "facebook/mms-tts-ewe", | |
"gn-facebook-mms VITS": "facebook/mms-tts-grn", | |
"ilo-facebook-mms VITS": "facebook/mms-tts-ilo", | |
"rw-facebook-mms VITS": "facebook/mms-tts-kin", | |
"kri-facebook-mms VITS": "facebook/mms-tts-kri", | |
"ku_script_arabic-facebook-mms VITS": "facebook/mms-tts-kmr-script_arabic", | |
"ku_script_cyrillic-facebook-mms VITS": "facebook/mms-tts-kmr-script_cyrillic", | |
"ku_script_latin-facebook-mms VITS": "facebook/mms-tts-kmr-script_latin", | |
"ckb-facebook-mms VITS": "razhan/mms-tts-ckb", # Verify w | |
"ky-facebook-mms VITS": "facebook/mms-tts-kir", | |
"lg-facebook-mms VITS": "facebook/mms-tts-lug", | |
"mai-facebook-mms VITS": "facebook/mms-tts-mai", | |
"or-facebook-mms VITS": "facebook/mms-tts-ory", | |
"om-facebook-mms VITS": "facebook/mms-tts-orm", | |
"qu_Huallaga-facebook-mms VITS": "facebook/mms-tts-qub", | |
"qu_Lambayeque-facebook-mms VITS": "facebook/mms-tts-quf", | |
"qu_South_Bolivian-facebook-mms VITS": "facebook/mms-tts-quh", | |
"qu_North_Bolivian-facebook-mms VITS": "facebook/mms-tts-qul", | |
"qu_Tena_Lowland-facebook-mms VITS": "facebook/mms-tts-quw", | |
"qu_Ayacucho-facebook-mms VITS": "facebook/mms-tts-quy", | |
"qu_Cusco-facebook-mms VITS": "facebook/mms-tts-quz", | |
"qu_Cajamarca-facebook-mms VITS": "facebook/mms-tts-qvc", | |
"qu_Eastern_Apurímac-facebook-mms VITS": "facebook/mms-tts-qve", | |
"qu_Huamalíes_Dos_de_Mayo_Huánuco-facebook-mms VITS": "facebook/mms-tts-qvh", | |
"qu_Margos_Yarowilca_Lauricocha-facebook-mms VITS": "facebook/mms-tts-qvm", | |
"qu_North_Junín-facebook-mms VITS": "facebook/mms-tts-qvn", | |
"qu_Napo-facebook-mms VITS": "facebook/mms-tts-qvo", | |
"qu_San_Martín-facebook-mms VITS": "facebook/mms-tts-qvs", | |
"qu_Huaylla_Wanca-facebook-mms VITS": "facebook/mms-tts-qvw", | |
"qu_Northern_Pastaza-facebook-mms VITS": "facebook/mms-tts-qvz", | |
"qu_Huaylas_Ancash-facebook-mms VITS": "facebook/mms-tts-qwh", | |
"qu_Panao-facebook-mms VITS": "facebook/mms-tts-qxh", | |
"qu_Salasaca_Highland-facebook-mms VITS": "facebook/mms-tts-qxl", | |
"qu_Northern_Conchucos_Ancash-facebook-mms VITS": "facebook/mms-tts-qxn", | |
"qu_Southern_Conchucos-facebook-mms VITS": "facebook/mms-tts-qxo", | |
"qu_Cañar_Highland-facebook-mms VITS": "facebook/mms-tts-qxr", | |
"sm-facebook-mms VITS": "facebook/mms-tts-smo", | |
"ti-facebook-mms VITS": "facebook/mms-tts-tir", | |
"ts-facebook-mms VITS": "facebook/mms-tts-tso", | |
"ak-facebook-mms VITS": "facebook/mms-tts-aka", | |
"ug_script_arabic-facebook-mms VITS": "facebook/mms-tts-uig-script_arabic", | |
"ug_script_cyrillic-facebook-mms VITS": "facebook/mms-tts-uig-script_cyrillic", | |
} | |
OPENAI_TTS_CODES = [ | |
"af", "ar", "hy", "az", "be", "bs", "bg", "ca", "zh", "hr", "cs", "da", | |
"nl", "en", "et", "fi", "fr", "gl", "de", "el", "he", "hi", "hu", "is", | |
"id", "it", "ja", "kn", "kk", "ko", "lv", "lt", "mk", "ms", "mr", "mi", | |
"ne", "no", "fa", "pl", "pt", "ro", "ru", "sr", "sk", "sl", "es", "sw", | |
"sv", "tl", "ta", "th", "tr", "uk", "ur", "vi", "cy", "zh-TW" | |
] | |
OPENAI_TTS_MODELS = [ | |
">alloy OpenAI-TTS", | |
">echo OpenAI-TTS", | |
">fable OpenAI-TTS", | |
">onyx OpenAI-TTS", | |
">nova OpenAI-TTS", | |
">shimmer OpenAI-TTS", | |
">alloy HD OpenAI-TTS", | |
">echo HD OpenAI-TTS", | |
">fable HD OpenAI-TTS", | |
">onyx HD OpenAI-TTS", | |
">nova HD OpenAI-TTS", | |
">shimmer HD OpenAI-TTS" | |
] | |
LANGUAGE_CODE_IN_THREE_LETTERS = { | |
"Automatic detection": "aut", | |
"ar": "ara", | |
"zh": "chi", | |
"cs": "cze", | |
"da": "dan", | |
"nl": "dut", | |
"en": "eng", | |
"fi": "fin", | |
"fr": "fre", | |
"de": "ger", | |
"el": "gre", | |
"he": "heb", | |
"hu": "hun", | |
"it": "ita", | |
"ja": "jpn", | |
"ko": "kor", | |
"fa": "per", | |
"pl": "pol", | |
"pt": "por", | |
"ru": "rus", | |
"es": "spa", | |
"tr": "tur", | |
"uk": "ukr", | |
"ur": "urd", | |
"vi": "vie", | |
"hi": "hin", | |
"id": "ind", | |
"bn": "ben", | |
"te": "tel", | |
"mr": "mar", | |
"ta": "tam", | |
"jw": "jav", | |
"ca": "cat", | |
"ne": "nep", | |
"th": "tha", | |
"sv": "swe", | |
"am": "amh", | |
"cy": "cym", | |
"et": "est", | |
"hr": "hrv", | |
"is": "isl", | |
"km": "khm", | |
"sk": "slk", | |
"sq": "sqi", | |
"sr": "srp", | |
} | |