Yuyang2022 committed on
Commit
ac54435
1 Parent(s): 115a88e

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +214 -1
app.py CHANGED
@@ -5,7 +5,7 @@ from neon_tts_plugin_coqui import CoquiTTS
5
  import os
6
  import time
7
  from transformers import AutoTokenizer, AutoModelForSeq2SeqLM, pipeline
8
- from flores200_codes import flores_codes
9
 
10
  pipe = pipeline(model="Yuyang2022/yue") # change to "your-username/the-name-you-picked"
11
  LANGUAGES = list(CoquiTTS.langs.keys())
@@ -76,6 +76,219 @@ if __name__ == "__main__":
76
 
77
  model_dict = load_models()
78
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
79
  lang_codes = list(flores_codes.keys())
80
 
81
  # define gradio demo
 
5
  import os
6
  import time
7
  from transformers import AutoTokenizer, AutoModelForSeq2SeqLM, pipeline
8
+ #from flores200_codes import flores_codes
9
 
10
  pipe = pipeline(model="Yuyang2022/yue") # change to "your-username/the-name-you-picked"
11
  LANGUAGES = list(CoquiTTS.langs.keys())
 
76
 
77
  model_dict = load_models()
78
 
79
# FLORES-200 language table, one entry per line:
#   "<display name><whitespace><language code>"
# Display names may contain spaces and parentheses; the code is always the
# last whitespace-delimited token on the line.
codes_as_string = '''Acehnese (Arabic script) ace_Arab
Acehnese (Latin script) ace_Latn
Mesopotamian Arabic acm_Arab
Ta’izzi-Adeni Arabic acq_Arab
Tunisian Arabic aeb_Arab
Afrikaans afr_Latn
South Levantine Arabic ajp_Arab
Akan aka_Latn
Amharic amh_Ethi
North Levantine Arabic apc_Arab
Modern Standard Arabic arb_Arab
Modern Standard Arabic (Romanized) arb_Latn
Najdi Arabic ars_Arab
Moroccan Arabic ary_Arab
Egyptian Arabic arz_Arab
Assamese asm_Beng
Asturian ast_Latn
Awadhi awa_Deva
Central Aymara ayr_Latn
South Azerbaijani azb_Arab
North Azerbaijani azj_Latn
Bashkir bak_Cyrl
Bambara bam_Latn
Balinese ban_Latn
Belarusian bel_Cyrl
Bemba bem_Latn
Bengali ben_Beng
Bhojpuri bho_Deva
Banjar (Arabic script) bjn_Arab
Banjar (Latin script) bjn_Latn
Standard Tibetan bod_Tibt
Bosnian bos_Latn
Buginese bug_Latn
Bulgarian bul_Cyrl
Catalan cat_Latn
Cebuano ceb_Latn
Czech ces_Latn
Chokwe cjk_Latn
Central Kurdish ckb_Arab
Crimean Tatar crh_Latn
Welsh cym_Latn
Danish dan_Latn
German deu_Latn
Southwestern Dinka dik_Latn
Dyula dyu_Latn
Dzongkha dzo_Tibt
Greek ell_Grek
English eng_Latn
Esperanto epo_Latn
Estonian est_Latn
Basque eus_Latn
Ewe ewe_Latn
Faroese fao_Latn
Fijian fij_Latn
Finnish fin_Latn
Fon fon_Latn
French fra_Latn
Friulian fur_Latn
Nigerian Fulfulde fuv_Latn
Scottish Gaelic gla_Latn
Irish gle_Latn
Galician glg_Latn
Guarani grn_Latn
Gujarati guj_Gujr
Haitian Creole hat_Latn
Hausa hau_Latn
Hebrew heb_Hebr
Hindi hin_Deva
Chhattisgarhi hne_Deva
Croatian hrv_Latn
Hungarian hun_Latn
Armenian hye_Armn
Igbo ibo_Latn
Ilocano ilo_Latn
Indonesian ind_Latn
Icelandic isl_Latn
Italian ita_Latn
Javanese jav_Latn
Japanese jpn_Jpan
Kabyle kab_Latn
Jingpho kac_Latn
Kamba kam_Latn
Kannada kan_Knda
Kashmiri (Arabic script) kas_Arab
Kashmiri (Devanagari script) kas_Deva
Georgian kat_Geor
Central Kanuri (Arabic script) knc_Arab
Central Kanuri (Latin script) knc_Latn
Kazakh kaz_Cyrl
Kabiyè kbp_Latn
Kabuverdianu kea_Latn
Khmer khm_Khmr
Kikuyu kik_Latn
Kinyarwanda kin_Latn
Kyrgyz kir_Cyrl
Kimbundu kmb_Latn
Northern Kurdish kmr_Latn
Kikongo kon_Latn
Korean kor_Hang
Lao lao_Laoo
Ligurian lij_Latn
Limburgish lim_Latn
Lingala lin_Latn
Lithuanian lit_Latn
Lombard lmo_Latn
Latgalian ltg_Latn
Luxembourgish ltz_Latn
Luba-Kasai lua_Latn
Ganda lug_Latn
Luo luo_Latn
Mizo lus_Latn
Standard Latvian lvs_Latn
Magahi mag_Deva
Maithili mai_Deva
Malayalam mal_Mlym
Marathi mar_Deva
Minangkabau (Arabic script) min_Arab
Minangkabau (Latin script) min_Latn
Macedonian mkd_Cyrl
Plateau Malagasy plt_Latn
Maltese mlt_Latn
Meitei (Bengali script) mni_Beng
Halh Mongolian khk_Cyrl
Mossi mos_Latn
Maori mri_Latn
Burmese mya_Mymr
Dutch nld_Latn
Norwegian Nynorsk nno_Latn
Norwegian Bokmål nob_Latn
Nepali npi_Deva
Northern Sotho nso_Latn
Nuer nus_Latn
Nyanja nya_Latn
Occitan oci_Latn
West Central Oromo gaz_Latn
Odia ory_Orya
Pangasinan pag_Latn
Eastern Panjabi pan_Guru
Papiamento pap_Latn
Western Persian pes_Arab
Polish pol_Latn
Portuguese por_Latn
Dari prs_Arab
Southern Pashto pbt_Arab
Ayacucho Quechua quy_Latn
Romanian ron_Latn
Rundi run_Latn
Russian rus_Cyrl
Sango sag_Latn
Sanskrit san_Deva
Santali sat_Olck
Sicilian scn_Latn
Shan shn_Mymr
Sinhala sin_Sinh
Slovak slk_Latn
Slovenian slv_Latn
Samoan smo_Latn
Shona sna_Latn
Sindhi snd_Arab
Somali som_Latn
Southern Sotho sot_Latn
Spanish spa_Latn
Tosk Albanian als_Latn
Sardinian srd_Latn
Serbian srp_Cyrl
Swati ssw_Latn
Sundanese sun_Latn
Swedish swe_Latn
Swahili swh_Latn
Silesian szl_Latn
Tamil tam_Taml
Tatar tat_Cyrl
Telugu tel_Telu
Tajik tgk_Cyrl
Tagalog tgl_Latn
Thai tha_Thai
Tigrinya tir_Ethi
Tamasheq (Latin script) taq_Latn
Tamasheq (Tifinagh script) taq_Tfng
Tok Pisin tpi_Latn
Tswana tsn_Latn
Tsonga tso_Latn
Turkmen tuk_Latn
Tumbuka tum_Latn
Turkish tur_Latn
Twi twi_Latn
Central Atlas Tamazight tzm_Tfng
Uyghur uig_Arab
Ukrainian ukr_Cyrl
Umbundu umb_Latn
Urdu urd_Arab
Northern Uzbek uzn_Latn
Venetian vec_Latn
Vietnamese vie_Latn
Waray war_Latn
Wolof wol_Latn
Xhosa xho_Latn
Eastern Yiddish ydd_Hebr
Yoruba yor_Latn
Yue Chinese yue_Hant
Chinese (Simplified) zho_Hans
Chinese (Traditional) zho_Hant
Standard Malay zsm_Latn
Zulu zul_Latn'''

# The name is deliberately rebound from the raw text to its list of lines,
# exactly as before, in case code further down the file reads it as a list.
codes_as_string = codes_as_string.split('\n')

# Display name -> language code, e.g. "English" -> "eng_Latn".
flores_codes = {}
for code in codes_as_string:
    # Tolerate blank lines (e.g. a trailing newline added to the table).
    if not code.strip():
        continue
    # Split on the LAST run of whitespace instead of a literal tab: names
    # contain spaces but codes never do, so this parses both tab- and
    # space-separated tables. A line with a single token still raises
    # ValueError, so a malformed entry fails loudly rather than silently.
    lang, lang_code = code.rsplit(None, 1)
    flores_codes[lang] = lang_code
290
+
291
+
292
  lang_codes = list(flores_codes.keys())
293
 
294
  # define gradio demo