Spaces:
Running
Running
| from .logging_setup import logger | |
# (English name, language code) pairs for the "unidirectional" language set.
# The UI label of each entry is derived as "<name> (<code>)".
_UNIDIRECTIONAL_NAME_CODE_PAIRS = (
    ("Aymara", "ay"),
    ("Bambara", "bm"),
    ("Cebuano", "ceb"),
    ("Chichewa", "ny"),
    ("Divehi", "dv"),
    ("Dogri", "doi"),
    ("Ewe", "ee"),
    ("Guarani", "gn"),
    ("Iloko", "ilo"),
    ("Kinyarwanda", "rw"),
    ("Krio", "kri"),
    ("Kurdish", "ku"),
    ("Kirghiz", "ky"),
    ("Ganda", "lg"),
    ("Maithili", "mai"),
    ("Oriya", "or"),
    ("Oromo", "om"),
    ("Quechua", "qu"),
    ("Samoan", "sm"),
    ("Tigrinya", "ti"),
    ("Tsonga", "ts"),
    ("Akan", "ak"),
    ("Uighur", "ug"),
)

# Display label -> language code, in the order listed above.
LANGUAGES_UNIDIRECTIONAL = {
    f"{name} ({code})": code
    for name, code in _UNIDIRECTIONAL_NAME_CODE_PAIRS
}

# Live keys view over the labels (not a list copy).
UNIDIRECTIONAL_L_LIST = LANGUAGES_UNIDIRECTIONAL.keys()
# Display label -> language code for every selectable language.
# The first entry is the auto-detect sentinel, which maps to itself.
# Trailing comments are per-language caveats carried over from the
# original table ("no aux gTTS", alignment-model errors).
LANGUAGES = {
    "Automatic detection": "Automatic detection",
    "Arabic (ar)": "ar",
    "Chinese - Simplified (zh-CN)": "zh",
    "Czech (cs)": "cs",
    "Danish (da)": "da",
    "Dutch (nl)": "nl",
    "English (en)": "en",
    "Finnish (fi)": "fi",
    "French (fr)": "fr",
    "German (de)": "de",
    "Greek (el)": "el",
    "Hebrew (he)": "he",
    "Hungarian (hu)": "hu",
    "Italian (it)": "it",
    "Japanese (ja)": "ja",
    "Korean (ko)": "ko",
    "Persian (fa)": "fa",  # no aux gTTS
    "Polish (pl)": "pl",
    "Portuguese (pt)": "pt",
    "Russian (ru)": "ru",
    "Spanish (es)": "es",
    "Turkish (tr)": "tr",
    "Ukrainian (uk)": "uk",
    "Urdu (ur)": "ur",
    "Vietnamese (vi)": "vi",
    "Hindi (hi)": "hi",
    "Indonesian (id)": "id",
    "Bengali (bn)": "bn",
    "Telugu (te)": "te",
    "Marathi (mr)": "mr",
    "Tamil (ta)": "ta",
    "Javanese (jw|jv)": "jw",
    "Catalan (ca)": "ca",
    "Nepali (ne)": "ne",
    "Thai (th)": "th",
    "Swedish (sv)": "sv",
    "Amharic (am)": "am",
    "Welsh (cy)": "cy",  # no aux gTTS
    "Estonian (et)": "et",
    "Croatian (hr)": "hr",
    "Icelandic (is)": "is",
    "Georgian (ka)": "ka",  # no aux gTTS
    "Khmer (km)": "km",
    "Slovak (sk)": "sk",
    "Albanian (sq)": "sq",
    "Serbian (sr)": "sr",
    "Azerbaijani (az)": "az",  # no aux gTTS
    "Bulgarian (bg)": "bg",
    "Galician (gl)": "gl",  # no aux gTTS
    "Gujarati (gu)": "gu",
    "Kazakh (kk)": "kk",  # no aux gTTS
    "Kannada (kn)": "kn",
    "Lithuanian (lt)": "lt",  # no aux gTTS
    "Latvian (lv)": "lv",
    "Macedonian (mk)": "mk",  # no aux gTTS; error getting align model
    "Malayalam (ml)": "ml",
    "Malay (ms)": "ms",  # error getting align model
    "Romanian (ro)": "ro",
    "Sinhala (si)": "si",
    "Sundanese (su)": "su",
    "Swahili (sw)": "sw",  # align error
    "Afrikaans (af)": "af",
    "Bosnian (bs)": "bs",
    "Latin (la)": "la",
    "Myanmar Burmese (my)": "my",
    "Norwegian (no|nb)": "no",
    "Chinese - Traditional (zh-TW)": "zh-TW",
    "Assamese (as)": "as",
    "Basque (eu)": "eu",
    "Hausa (ha)": "ha",
    "Haitian Creole (ht)": "ht",
    "Armenian (hy)": "hy",
    "Lao (lo)": "lo",
    "Malagasy (mg)": "mg",
    "Mongolian (mn)": "mn",
    "Maltese (mt)": "mt",
    "Punjabi (pa)": "pa",
    "Pashto (ps)": "ps",
    "Slovenian (sl)": "sl",
    "Shona (sn)": "sn",
    "Somali (so)": "so",
    "Tajik (tg)": "tg",
    "Turkmen (tk)": "tk",
    "Tatar (tt)": "tt",
    "Uzbek (uz)": "uz",
    "Yoruba (yo)": "yo",
    # The unidirectional languages are appended after the main set.
    **LANGUAGES_UNIDIRECTIONAL,
}
# Live keys view over the display labels, in insertion order.
BASE_L_LIST = LANGUAGES.keys()

# Keep the first label (the auto-detect entry) on top and sort every
# other label alphabetically beneath it.
_labels_in_order = list(BASE_L_LIST)
LANGUAGES_LIST = [_labels_in_order[0]] + sorted(_labels_in_order[1:])

# Reverse lookup: language code -> display label.
INVERTED_LANGUAGES = {code: label for label, code in LANGUAGES.items()}
| EXTRA_ALIGN = { | |
| "id": "indonesian-nlp/wav2vec2-large-xlsr-indonesian", | |
| "bn": "arijitx/wav2vec2-large-xlsr-bengali", | |
| "mr": "sumedh/wav2vec2-large-xlsr-marathi", | |
| "ta": "Amrrs/wav2vec2-large-xlsr-53-tamil", | |
| "jw": "cahya/wav2vec2-large-xlsr-javanese", | |
| "ne": "shniranjan/wav2vec2-large-xlsr-300m-nepali", | |
| "th": "sakares/wav2vec2-large-xlsr-thai-demo", | |
| "sv": "KBLab/wav2vec2-large-voxrex-swedish", | |
| "am": "agkphysics/wav2vec2-large-xlsr-53-amharic", | |
| "cy": "Srulikbdd/Wav2Vec2-large-xlsr-welsh", | |
| "et": "anton-l/wav2vec2-large-xlsr-53-estonian", | |
| "hr": "classla/wav2vec2-xls-r-parlaspeech-hr", | |
| "is": "carlosdanielhernandezmena/wav2vec2-large-xlsr-53-icelandic-ep10-1000h", | |
| "ka": "MehdiHosseiniMoghadam/wav2vec2-large-xlsr-53-Georgian", | |
| "km": "vitouphy/wav2vec2-xls-r-300m-khmer", | |
| "sk": "infinitejoy/wav2vec2-large-xls-r-300m-slovak", | |
| "sq": "Alimzhan/wav2vec2-large-xls-r-300m-albanian-colab", | |
| "sr": "dnikolic/wav2vec2-xlsr-530-serbian-colab", | |
| "az": "nijatzeynalov/wav2vec2-large-mms-1b-azerbaijani-common_voice15.0", | |
| "bg": "infinitejoy/wav2vec2-large-xls-r-300m-bulgarian", | |
| "gl": "ifrz/wav2vec2-large-xlsr-galician", | |
| "gu": "Harveenchadha/vakyansh-wav2vec2-gujarati-gnm-100", | |
| "kk": "aismlv/wav2vec2-large-xlsr-kazakh", | |
| "kn": "Harveenchadha/vakyansh-wav2vec2-kannada-knm-560", | |
| "lt": "DeividasM/wav2vec2-large-xlsr-53-lithuanian", | |
| "lv": "anton-l/wav2vec2-large-xlsr-53-latvian", | |
| "mk": "", # Konstantin-Bogdanoski/wav2vec2-macedonian-base | |
| "ml": "gvs/wav2vec2-large-xlsr-malayalam", | |
| "ms": "", # Duy/wav2vec2_malay | |
| "ro": "anton-l/wav2vec2-large-xlsr-53-romanian", | |
| "si": "IAmNotAnanth/wav2vec2-large-xls-r-300m-sinhala", | |
| "su": "cahya/wav2vec2-large-xlsr-sundanese", | |
| "sw": "", # Lians/fine-tune-wav2vec2-large-swahili | |
| "af": "", # ylacombe/wav2vec2-common_voice-af-demo | |
| "bs": "", | |
| "la": "", | |
| "my": "", | |
| "no": "NbAiLab/wav2vec2-xlsr-300m-norwegian", | |
| "zh-TW": "jonatasgrosman/wav2vec2-large-xlsr-53-chinese-zh-cn", | |
| "as": "", | |
| "eu": "", # cahya/wav2vec2-large-xlsr-basque # verify | |
| "ha": "infinitejoy/wav2vec2-large-xls-r-300m-hausa", | |
| "ht": "", | |
| "hy": "infinitejoy/wav2vec2-large-xls-r-300m-armenian", # no (.) | |
| "lo": "", | |
| "mg": "", | |
| "mn": "tugstugi/wav2vec2-large-xlsr-53-mongolian", | |
| "mt": "carlosdanielhernandezmena/wav2vec2-large-xlsr-53-maltese-64h", | |
| "pa": "kingabzpro/wav2vec2-large-xlsr-53-punjabi", | |
| "ps": "aamirhs/wav2vec2-large-xls-r-300m-pashto-colab", | |
| "sl": "anton-l/wav2vec2-large-xlsr-53-slovenian", | |
| "sn": "", | |
| "so": "", | |
| "tg": "", | |
| "tk": "", # Ragav/wav2vec2-tk | |
| "tt": "anton-l/wav2vec2-large-xlsr-53-tatar", | |
| "uz": "", # Mekhriddin/wav2vec2-large-xls-r-300m-uzbek-colab | |
| "yo": "ogbi/wav2vec2-large-mms-1b-yoruba-test", | |
| } | |
def fix_code_language(translate_to, syntax="google"):
    """Translate a language code into the spelling a backend expects.

    Args:
        translate_to: Language code to normalise (e.g. "zh", "he").
        syntax: Which code convention to target. "google" applies the
            google-translator / gTTS replacements, "coqui" the coqui-xtts
            ones. Any other value applies no replacement.

    Returns:
        The replacement code when one is defined for ``translate_to`` under
        the chosen ``syntax``; otherwise ``translate_to`` unchanged.
    """
    replacements_by_syntax = {
        # google-translator, gTTS
        "google": {"zh": "zh-CN", "he": "iw", "zh-cn": "zh-CN"},
        # coqui-xtts
        "coqui": {"zh": "zh-cn", "zh-CN": "zh-cn", "zh-TW": "zh-cn"},
    }
    # Fall back to an empty table for an unrecognised syntax: previously the
    # mapping was left unbound and the lookup raised UnboundLocalError.
    replace_lang_code = replacements_by_syntax.get(syntax, {})

    new_code_lang = replace_lang_code.get(translate_to, translate_to)
    logger.debug(f"Fix code {translate_to} -> {new_code_lang}")
    return new_code_lang
| BARK_VOICES_LIST = { | |
| "de_speaker_0-Male BARK": "v2/de_speaker_0", | |
| "de_speaker_1-Male BARK": "v2/de_speaker_1", | |
| "de_speaker_2-Male BARK": "v2/de_speaker_2", | |
| "de_speaker_3-Female BARK": "v2/de_speaker_3", | |
| "de_speaker_4-Male BARK": "v2/de_speaker_4", | |
| "de_speaker_5-Male BARK": "v2/de_speaker_5", | |
| "de_speaker_6-Male BARK": "v2/de_speaker_6", | |
| "de_speaker_7-Male BARK": "v2/de_speaker_7", | |
| "de_speaker_8-Female BARK": "v2/de_speaker_8", | |
| "de_speaker_9-Male BARK": "v2/de_speaker_9", | |
| "en_speaker_0-Male BARK": "v2/en_speaker_0", | |
| "en_speaker_1-Male BARK": "v2/en_speaker_1", | |
| "en_speaker_2-Male BARK": "v2/en_speaker_2", | |
| "en_speaker_3-Male BARK": "v2/en_speaker_3", | |
| "en_speaker_4-Male BARK": "v2/en_speaker_4", | |
| "en_speaker_5-Male BARK": "v2/en_speaker_5", | |
| "en_speaker_6-Male BARK": "v2/en_speaker_6", | |
| "en_speaker_7-Male BARK": "v2/en_speaker_7", | |
| "en_speaker_8-Male BARK": "v2/en_speaker_8", | |
| "en_speaker_9-Female BARK": "v2/en_speaker_9", | |
| "es_speaker_0-Male BARK": "v2/es_speaker_0", | |
| "es_speaker_1-Male BARK": "v2/es_speaker_1", | |
| "es_speaker_2-Male BARK": "v2/es_speaker_2", | |
| "es_speaker_3-Male BARK": "v2/es_speaker_3", | |
| "es_speaker_4-Male BARK": "v2/es_speaker_4", | |
| "es_speaker_5-Male BARK": "v2/es_speaker_5", | |
| "es_speaker_6-Male BARK": "v2/es_speaker_6", | |
| "es_speaker_7-Male BARK": "v2/es_speaker_7", | |
| "es_speaker_8-Female BARK": "v2/es_speaker_8", | |
| "es_speaker_9-Female BARK": "v2/es_speaker_9", | |
| "fr_speaker_0-Male BARK": "v2/fr_speaker_0", | |
| "fr_speaker_1-Female BARK": "v2/fr_speaker_1", | |
| "fr_speaker_2-Female BARK": "v2/fr_speaker_2", | |
| "fr_speaker_3-Male BARK": "v2/fr_speaker_3", | |
| "fr_speaker_4-Male BARK": "v2/fr_speaker_4", | |
| "fr_speaker_5-Female BARK": "v2/fr_speaker_5", | |
| "fr_speaker_6-Male BARK": "v2/fr_speaker_6", | |
| "fr_speaker_7-Male BARK": "v2/fr_speaker_7", | |
| "fr_speaker_8-Male BARK": "v2/fr_speaker_8", | |
| "fr_speaker_9-Male BARK": "v2/fr_speaker_9", | |
| "hi_speaker_0-Female BARK": "v2/hi_speaker_0", | |
| "hi_speaker_1-Female BARK": "v2/hi_speaker_1", | |
| "hi_speaker_2-Male BARK": "v2/hi_speaker_2", | |
| "hi_speaker_3-Female BARK": "v2/hi_speaker_3", | |
| "hi_speaker_4-Female BARK": "v2/hi_speaker_4", | |
| "hi_speaker_5-Male BARK": "v2/hi_speaker_5", | |
| "hi_speaker_6-Male BARK": "v2/hi_speaker_6", | |
| "hi_speaker_7-Male BARK": "v2/hi_speaker_7", | |
| "hi_speaker_8-Male BARK": "v2/hi_speaker_8", | |
| "hi_speaker_9-Female BARK": "v2/hi_speaker_9", | |
| "it_speaker_0-Male BARK": "v2/it_speaker_0", | |
| "it_speaker_1-Male BARK": "v2/it_speaker_1", | |
| "it_speaker_2-Female BARK": "v2/it_speaker_2", | |
| "it_speaker_3-Male BARK": "v2/it_speaker_3", | |
| "it_speaker_4-Male BARK": "v2/it_speaker_4", | |
| "it_speaker_5-Male BARK": "v2/it_speaker_5", | |
| "it_speaker_6-Male BARK": "v2/it_speaker_6", | |
| "it_speaker_7-Female BARK": "v2/it_speaker_7", | |
| "it_speaker_8-Male BARK": "v2/it_speaker_8", | |
| "it_speaker_9-Female BARK": "v2/it_speaker_9", | |
| "ja_speaker_0-Female BARK": "v2/ja_speaker_0", | |
| "ja_speaker_1-Female BARK": "v2/ja_speaker_1", | |
| "ja_speaker_2-Male BARK": "v2/ja_speaker_2", | |
| "ja_speaker_3-Female BARK": "v2/ja_speaker_3", | |
| "ja_speaker_4-Female BARK": "v2/ja_speaker_4", | |
| "ja_speaker_5-Female BARK": "v2/ja_speaker_5", | |
| "ja_speaker_6-Male BARK": "v2/ja_speaker_6", | |
| "ja_speaker_7-Female BARK": "v2/ja_speaker_7", | |
| "ja_speaker_8-Female BARK": "v2/ja_speaker_8", | |
| "ja_speaker_9-Female BARK": "v2/ja_speaker_9", | |
| "ko_speaker_0-Female BARK": "v2/ko_speaker_0", | |
| "ko_speaker_1-Male BARK": "v2/ko_speaker_1", | |
| "ko_speaker_2-Male BARK": "v2/ko_speaker_2", | |
| "ko_speaker_3-Male BARK": "v2/ko_speaker_3", | |
| "ko_speaker_4-Male BARK": "v2/ko_speaker_4", | |
| "ko_speaker_5-Male BARK": "v2/ko_speaker_5", | |
| "ko_speaker_6-Male BARK": "v2/ko_speaker_6", | |
| "ko_speaker_7-Male BARK": "v2/ko_speaker_7", | |
| "ko_speaker_8-Male BARK": "v2/ko_speaker_8", | |
| "ko_speaker_9-Male BARK": "v2/ko_speaker_9", | |
| "pl_speaker_0-Male BARK": "v2/pl_speaker_0", | |
| "pl_speaker_1-Male BARK": "v2/pl_speaker_1", | |
| "pl_speaker_2-Male BARK": "v2/pl_speaker_2", | |
| "pl_speaker_3-Male BARK": "v2/pl_speaker_3", | |
| "pl_speaker_4-Female BARK": "v2/pl_speaker_4", | |
| "pl_speaker_5-Male BARK": "v2/pl_speaker_5", | |
| "pl_speaker_6-Female BARK": "v2/pl_speaker_6", | |
| "pl_speaker_7-Male BARK": "v2/pl_speaker_7", | |
| "pl_speaker_8-Male BARK": "v2/pl_speaker_8", | |
| "pl_speaker_9-Female BARK": "v2/pl_speaker_9", | |
| "pt_speaker_0-Male BARK": "v2/pt_speaker_0", | |
| "pt_speaker_1-Male BARK": "v2/pt_speaker_1", | |
| "pt_speaker_2-Male BARK": "v2/pt_speaker_2", | |
| "pt_speaker_3-Male BARK": "v2/pt_speaker_3", | |
| "pt_speaker_4-Male BARK": "v2/pt_speaker_4", | |
| "pt_speaker_5-Male BARK": "v2/pt_speaker_5", | |
| "pt_speaker_6-Male BARK": "v2/pt_speaker_6", | |
| "pt_speaker_7-Male BARK": "v2/pt_speaker_7", | |
| "pt_speaker_8-Male BARK": "v2/pt_speaker_8", | |
| "pt_speaker_9-Male BARK": "v2/pt_speaker_9", | |
| "ru_speaker_0-Male BARK": "v2/ru_speaker_0", | |
| "ru_speaker_1-Male BARK": "v2/ru_speaker_1", | |
| "ru_speaker_2-Male BARK": "v2/ru_speaker_2", | |
| "ru_speaker_3-Male BARK": "v2/ru_speaker_3", | |
| "ru_speaker_4-Male BARK": "v2/ru_speaker_4", | |
| "ru_speaker_5-Female BARK": "v2/ru_speaker_5", | |
| "ru_speaker_6-Female BARK": "v2/ru_speaker_6", | |
| "ru_speaker_7-Male BARK": "v2/ru_speaker_7", | |
| "ru_speaker_8-Male BARK": "v2/ru_speaker_8", | |
| "ru_speaker_9-Female BARK": "v2/ru_speaker_9", | |
| "tr_speaker_0-Male BARK": "v2/tr_speaker_0", | |
| "tr_speaker_1-Male BARK": "v2/tr_speaker_1", | |
| "tr_speaker_2-Male BARK": "v2/tr_speaker_2", | |
| "tr_speaker_3-Male BARK": "v2/tr_speaker_3", | |
| "tr_speaker_4-Female BARK": "v2/tr_speaker_4", | |
| "tr_speaker_5-Female BARK": "v2/tr_speaker_5", | |
| "tr_speaker_6-Male BARK": "v2/tr_speaker_6", | |
| "tr_speaker_7-Male BARK": "v2/tr_speaker_7", | |
| "tr_speaker_8-Male BARK": "v2/tr_speaker_8", | |
| "tr_speaker_9-Male BARK": "v2/tr_speaker_9", | |
| "zh_speaker_0-Male BARK": "v2/zh_speaker_0", | |
| "zh_speaker_1-Male BARK": "v2/zh_speaker_1", | |
| "zh_speaker_2-Male BARK": "v2/zh_speaker_2", | |
| "zh_speaker_3-Male BARK": "v2/zh_speaker_3", | |
| "zh_speaker_4-Female BARK": "v2/zh_speaker_4", | |
| "zh_speaker_5-Male BARK": "v2/zh_speaker_5", | |
| "zh_speaker_6-Female BARK": "v2/zh_speaker_6", | |
| "zh_speaker_7-Female BARK": "v2/zh_speaker_7", | |
| "zh_speaker_8-Male BARK": "v2/zh_speaker_8", | |
| "zh_speaker_9-Female BARK": "v2/zh_speaker_9", | |
| } | |
# Display label -> VITS text-to-speech model id (MMS checkpoints).
# The label prefix is the language code, optionally followed by a variant
# or script suffix. Commented-out rows are voices that are currently
# disabled; they are kept for reference.
VITS_VOICES_LIST = {
    "ar-facebook-mms VITS": "facebook/mms-tts-ara",
    # "zh-facebook-mms VITS": "facebook/mms-tts-cmn",
    "zh_Hakka-facebook-mms VITS": "facebook/mms-tts-hak",
    "zh_MinNan-facebook-mms VITS": "facebook/mms-tts-nan",
    # "cs-facebook-mms VITS": "facebook/mms-tts-ces",
    # "da-facebook-mms VITS": "facebook/mms-tts-dan",
    "nl-facebook-mms VITS": "facebook/mms-tts-nld",
    "en-facebook-mms VITS": "facebook/mms-tts-eng",
    "fi-facebook-mms VITS": "facebook/mms-tts-fin",
    "fr-facebook-mms VITS": "facebook/mms-tts-fra",
    "de-facebook-mms VITS": "facebook/mms-tts-deu",
    "el-facebook-mms VITS": "facebook/mms-tts-ell",
    "el_Ancient-facebook-mms VITS": "facebook/mms-tts-grc",
    "he-facebook-mms VITS": "facebook/mms-tts-heb",
    "hu-facebook-mms VITS": "facebook/mms-tts-hun",
    # "it-facebook-mms VITS": "facebook/mms-tts-ita",
    # "ja-facebook-mms VITS": "facebook/mms-tts-jpn",
    "ko-facebook-mms VITS": "facebook/mms-tts-kor",
    "fa-facebook-mms VITS": "facebook/mms-tts-fas",
    "pl-facebook-mms VITS": "facebook/mms-tts-pol",
    "pt-facebook-mms VITS": "facebook/mms-tts-por",
    "ru-facebook-mms VITS": "facebook/mms-tts-rus",
    "es-facebook-mms VITS": "facebook/mms-tts-spa",
    "tr-facebook-mms VITS": "facebook/mms-tts-tur",
    "uk-facebook-mms VITS": "facebook/mms-tts-ukr",
    "ur_arabic-facebook-mms VITS": "facebook/mms-tts-urd-script_arabic",
    "ur_devanagari-facebook-mms VITS": "facebook/mms-tts-urd-script_devanagari",
    "ur_latin-facebook-mms VITS": "facebook/mms-tts-urd-script_latin",
    "vi-facebook-mms VITS": "facebook/mms-tts-vie",
    "hi-facebook-mms VITS": "facebook/mms-tts-hin",
    "hi_Fiji-facebook-mms VITS": "facebook/mms-tts-hif",
    "id-facebook-mms VITS": "facebook/mms-tts-ind",
    "bn-facebook-mms VITS": "facebook/mms-tts-ben",
    "te-facebook-mms VITS": "facebook/mms-tts-tel",
    "mr-facebook-mms VITS": "facebook/mms-tts-mar",
    "ta-facebook-mms VITS": "facebook/mms-tts-tam",
    "jw-facebook-mms VITS": "facebook/mms-tts-jav",
    "jw_Suriname-facebook-mms VITS": "facebook/mms-tts-jvn",
    "ca-facebook-mms VITS": "facebook/mms-tts-cat",
    "ne-facebook-mms VITS": "facebook/mms-tts-nep",
    "th-facebook-mms VITS": "facebook/mms-tts-tha",
    "th_Northern-facebook-mms VITS": "facebook/mms-tts-nod",
    "sv-facebook-mms VITS": "facebook/mms-tts-swe",
    "am-facebook-mms VITS": "facebook/mms-tts-amh",
    "cy-facebook-mms VITS": "facebook/mms-tts-cym",
    # "et-facebook-mms VITS": "facebook/mms-tts-est",
    # "ht-facebook-mms VITS": "facebook/mms-tts-hrv",  # hrv is Croatian; label says "ht"
    "is-facebook-mms VITS": "facebook/mms-tts-isl",
    "km-facebook-mms VITS": "facebook/mms-tts-khm",
    "km_Northern-facebook-mms VITS": "facebook/mms-tts-kxm",
    # "sk-facebook-mms VITS": "facebook/mms-tts-slk",
    "sq_Northern-facebook-mms VITS": "facebook/mms-tts-sqi",
    "az_South-facebook-mms VITS": "facebook/mms-tts-azb",
    "az_North_script_cyrillic-facebook-mms VITS": "facebook/mms-tts-azj-script_cyrillic",
    "az_North_script_latin-facebook-mms VITS": "facebook/mms-tts-azj-script_latin",
    "bg-facebook-mms VITS": "facebook/mms-tts-bul",
    # "gl-facebook-mms VITS": "facebook/mms-tts-glg",
    "gu-facebook-mms VITS": "facebook/mms-tts-guj",
    "kk-facebook-mms VITS": "facebook/mms-tts-kaz",
    "kn-facebook-mms VITS": "facebook/mms-tts-kan",
    # "lt-facebook-mms VITS": "facebook/mms-tts-lit",
    "lv-facebook-mms VITS": "facebook/mms-tts-lav",
    # "mk-facebook-mms VITS": "facebook/mms-tts-mkd",
    "ml-facebook-mms VITS": "facebook/mms-tts-mal",
    "ms-facebook-mms VITS": "facebook/mms-tts-zlm",
    "ms_Central-facebook-mms VITS": "facebook/mms-tts-pse",
    "ms_Manado-facebook-mms VITS": "facebook/mms-tts-xmm",
    "ro-facebook-mms VITS": "facebook/mms-tts-ron",
    # "si-facebook-mms VITS": "facebook/mms-tts-sin",
    "sw-facebook-mms VITS": "facebook/mms-tts-swh",
    # "af-facebook-mms VITS": "facebook/mms-tts-afr",
    # "bs-facebook-mms VITS": "facebook/mms-tts-bos",
    "la-facebook-mms VITS": "facebook/mms-tts-lat",
    "my-facebook-mms VITS": "facebook/mms-tts-mya",
    # "no_Bokmål-facebook-mms VITS": "thomasht86/mms-tts-nob",  # verify
    "as-facebook-mms VITS": "facebook/mms-tts-asm",
    "as_Nagamese-facebook-mms VITS": "facebook/mms-tts-nag",
    "eu-facebook-mms VITS": "facebook/mms-tts-eus",
    "ha-facebook-mms VITS": "facebook/mms-tts-hau",
    "ht-facebook-mms VITS": "facebook/mms-tts-hat",
    "hy_Western-facebook-mms VITS": "facebook/mms-tts-hyw",
    "lo-facebook-mms VITS": "facebook/mms-tts-lao",
    "mg-facebook-mms VITS": "facebook/mms-tts-mlg",
    "mn-facebook-mms VITS": "facebook/mms-tts-mon",
    # "mt-facebook-mms VITS": "facebook/mms-tts-mlt",
    "pa_Eastern-facebook-mms VITS": "facebook/mms-tts-pan",
    # "pa_Western-facebook-mms VITS": "facebook/mms-tts-pnb",
    # "ps-facebook-mms VITS": "facebook/mms-tts-pus",
    # "sl-facebook-mms VITS": "facebook/mms-tts-slv",
    "sn-facebook-mms VITS": "facebook/mms-tts-sna",
    # NOTE(review): ISO 639-3 for Somali is "som"; "son" may be a typo --
    # confirm that this model id exists before relying on it.
    "so-facebook-mms VITS": "facebook/mms-tts-son",
    "tg-facebook-mms VITS": "facebook/mms-tts-tgk",
    "tk_script_arabic-facebook-mms VITS": "facebook/mms-tts-tuk-script_arabic",
    "tk_script_latin-facebook-mms VITS": "facebook/mms-tts-tuk-script_latin",
    "tt-facebook-mms VITS": "facebook/mms-tts-tat",
    "tt_Crimean-facebook-mms VITS": "facebook/mms-tts-crh",
    "uz_script_cyrillic-facebook-mms VITS": "facebook/mms-tts-uzb-script_cyrillic",
    "yo-facebook-mms VITS": "facebook/mms-tts-yor",
    "ay-facebook-mms VITS": "facebook/mms-tts-ayr",
    "bm-facebook-mms VITS": "facebook/mms-tts-bam",
    "ceb-facebook-mms VITS": "facebook/mms-tts-ceb",
    "ny-facebook-mms VITS": "facebook/mms-tts-nya",
    "dv-facebook-mms VITS": "facebook/mms-tts-div",
    "doi-facebook-mms VITS": "facebook/mms-tts-dgo",
    "ee-facebook-mms VITS": "facebook/mms-tts-ewe",
    "gn-facebook-mms VITS": "facebook/mms-tts-grn",
    "ilo-facebook-mms VITS": "facebook/mms-tts-ilo",
    "rw-facebook-mms VITS": "facebook/mms-tts-kin",
    "kri-facebook-mms VITS": "facebook/mms-tts-kri",
    "ku_script_arabic-facebook-mms VITS": "facebook/mms-tts-kmr-script_arabic",
    "ku_script_cyrillic-facebook-mms VITS": "facebook/mms-tts-kmr-script_cyrillic",
    "ku_script_latin-facebook-mms VITS": "facebook/mms-tts-kmr-script_latin",
    # Community checkpoint rather than a facebook/ one; still to be verified.
    "ckb-facebook-mms VITS": "razhan/mms-tts-ckb",
    "ky-facebook-mms VITS": "facebook/mms-tts-kir",
    "lg-facebook-mms VITS": "facebook/mms-tts-lug",
    "mai-facebook-mms VITS": "facebook/mms-tts-mai",
    "or-facebook-mms VITS": "facebook/mms-tts-ory",
    "om-facebook-mms VITS": "facebook/mms-tts-orm",
    "qu_Huallaga-facebook-mms VITS": "facebook/mms-tts-qub",
    "qu_Lambayeque-facebook-mms VITS": "facebook/mms-tts-quf",
    "qu_South_Bolivian-facebook-mms VITS": "facebook/mms-tts-quh",
    "qu_North_Bolivian-facebook-mms VITS": "facebook/mms-tts-qul",
    "qu_Tena_Lowland-facebook-mms VITS": "facebook/mms-tts-quw",
    "qu_Ayacucho-facebook-mms VITS": "facebook/mms-tts-quy",
    "qu_Cusco-facebook-mms VITS": "facebook/mms-tts-quz",
    "qu_Cajamarca-facebook-mms VITS": "facebook/mms-tts-qvc",
    "qu_Eastern_Apurímac-facebook-mms VITS": "facebook/mms-tts-qve",
    "qu_Huamalíes_Dos_de_Mayo_Huánuco-facebook-mms VITS": "facebook/mms-tts-qvh",
    "qu_Margos_Yarowilca_Lauricocha-facebook-mms VITS": "facebook/mms-tts-qvm",
    "qu_North_Junín-facebook-mms VITS": "facebook/mms-tts-qvn",
    "qu_Napo-facebook-mms VITS": "facebook/mms-tts-qvo",
    "qu_San_Martín-facebook-mms VITS": "facebook/mms-tts-qvs",
    "qu_Huaylla_Wanca-facebook-mms VITS": "facebook/mms-tts-qvw",
    "qu_Northern_Pastaza-facebook-mms VITS": "facebook/mms-tts-qvz",
    "qu_Huaylas_Ancash-facebook-mms VITS": "facebook/mms-tts-qwh",
    "qu_Panao-facebook-mms VITS": "facebook/mms-tts-qxh",
    "qu_Salasaca_Highland-facebook-mms VITS": "facebook/mms-tts-qxl",
    "qu_Northern_Conchucos_Ancash-facebook-mms VITS": "facebook/mms-tts-qxn",
    "qu_Southern_Conchucos-facebook-mms VITS": "facebook/mms-tts-qxo",
    "qu_Cañar_Highland-facebook-mms VITS": "facebook/mms-tts-qxr",
    "sm-facebook-mms VITS": "facebook/mms-tts-smo",
    "ti-facebook-mms VITS": "facebook/mms-tts-tir",
    "ts-facebook-mms VITS": "facebook/mms-tts-tso",
    "ak-facebook-mms VITS": "facebook/mms-tts-aka",
    "ug_script_arabic-facebook-mms VITS": "facebook/mms-tts-uig-script_arabic",
    "ug_script_cyrillic-facebook-mms VITS": "facebook/mms-tts-uig-script_cyrillic",
}
# Language codes accepted for the OpenAI-TTS voices, in their original order.
OPENAI_TTS_CODES = [
    "af", "ar", "hy", "az", "be", "bs",
    "bg", "ca", "zh", "hr", "cs", "da",
    "nl", "en", "et", "fi", "fr", "gl",
    "de", "el", "he", "hi", "hu", "is",
    "id", "it", "ja", "kn", "kk", "ko",
    "lv", "lt", "mk", "ms", "mr", "mi",
    "ne", "no", "fa", "pl", "pt", "ro",
    "ru", "sr", "sk", "sl", "es", "sw",
    "sv", "tl", "ta", "th", "tr", "uk",
    "ur", "vi", "cy", "zh-TW",
]
# Voice names offered by OpenAI-TTS, in display order.
_OPENAI_TTS_VOICE_NAMES = ("alloy", "echo", "fable", "onyx", "nova", "shimmer")

# Display labels for the OpenAI-TTS voices: all standard voices first,
# then the same voices again with the " HD" marker.
OPENAI_TTS_MODELS = [
    f">{voice}{quality} OpenAI-TTS"
    for quality in ("", " HD")
    for voice in _OPENAI_TTS_VOICE_NAMES
]
# Language code (as used in LANGUAGES values) -> three-letter code.
# The auto-detect sentinel maps to the placeholder "aut".
# NOTE(review): the table mixes ISO 639-2 bibliographic codes (e.g. "chi",
# "ger", "fre") with terminologic ones (e.g. "cym", "slk", "sqi", "isl");
# confirm which form consumers expect before normalising.
LANGUAGE_CODE_IN_THREE_LETTERS = {
    "Automatic detection": "aut",
    "ar": "ara",
    "zh": "chi",
    "cs": "cze",
    "da": "dan",
    "nl": "dut",
    "en": "eng",
    "fi": "fin",
    "fr": "fre",
    "de": "ger",
    "el": "gre",
    "he": "heb",
    "hu": "hun",
    "it": "ita",
    "ja": "jpn",
    "ko": "kor",
    "fa": "per",
    "pl": "pol",
    "pt": "por",
    "ru": "rus",
    "es": "spa",
    "tr": "tur",
    "uk": "ukr",
    "ur": "urd",
    "vi": "vie",
    "hi": "hin",
    "id": "ind",
    "bn": "ben",
    "te": "tel",
    "mr": "mar",
    "ta": "tam",
    "jw": "jav",
    "ca": "cat",
    "ne": "nep",
    "th": "tha",
    "sv": "swe",
    "am": "amh",
    "cy": "cym",
    "et": "est",
    "hr": "hrv",
    "is": "isl",
    "km": "khm",
    "sk": "slk",
    "sq": "sqi",
    "sr": "srp",
}