Ardha committed on
Commit
2c019ff
1 Parent(s): 2be9bdd
Files changed (1) hide show
  1. app.py +4 -57
app.py CHANGED
@@ -219,17 +219,12 @@ print("rmvpe model loaded.")
219
  initial_md = """
220
  # RVC text-to-speech demo
221
 
222
- This is a text-to-speech demo of RVC moe models of [rvc_okiba](https://huggingface.co/litagin/rvc_okiba) using [edge-tts](https://github.com/rany2/edge-tts).
223
-
224
  Input text ➡[(edge-tts)](https://github.com/rany2/edge-tts)➡ Speech mp3 file ➡[(RVC)](https://github.com/RVC-Project/Retrieval-based-Voice-Conversion-WebUI)➡ Final output
225
 
226
  This runs on the 🤗 server's cpu, so it may be slow.
227
 
228
- Although the models are trained on Japanese voices and intended for Japanese text, they can also be used with other languages with the corresponding edge-tts speaker (but possibly with a Japanese accent).
229
-
230
  Input characters are limited to 280 characters, and the speech audio is limited to 20 seconds in this 🤗 space.
231
 
232
- [Visit this GitHub repo](https://github.com/litagin02/rvc-tts-webui) for running locally with your models and GPU!
233
  """
234
 
235
  app = gr.Blocks()
@@ -238,7 +233,7 @@ with app:
238
  with gr.Row():
239
  with gr.Column():
240
  model_name = gr.Dropdown(
241
- label="Model (all models except man-_ are girl models)",
242
  choices=models,
243
  value=models[0],
244
  )
@@ -257,7 +252,7 @@ with app:
257
  minimum=0,
258
  maximum=1,
259
  label="Index rate",
260
- value=1,
261
  interactive=True,
262
  )
263
  protect0 = gr.Slider(
@@ -310,56 +305,8 @@ with app:
310
  examples_per_page=100,
311
  examples=[
312
  ["これは日本語テキストから音声への変換デモです。", "ja-JP-NanamiNeural-Female"],
313
- [
314
- "This is an English text to speech conversation demo.",
315
- "en-US-AriaNeural-Female",
316
- ],
317
- ["这是一个中文文本到语音的转换演示。", "zh-CN-XiaoxiaoNeural-Female"],
318
- ["한국어 텍스트에서 음성으로 변환하는 데모입니다.", "ko-KR-SunHiNeural-Female"],
319
- [
320
- "Il s'agit d'une démo de conversion du texte français à la parole.",
321
- "fr-FR-DeniseNeural-Female",
322
- ],
323
- [
324
- "Dies ist eine Demo zur Umwandlung von Deutsch in Sprache.",
325
- "de-DE-AmalaNeural-Female",
326
- ],
327
- [
328
- "Tämä on suomenkielinen tekstistä puheeksi -esittely.",
329
- "fi-FI-NooraNeural-Female",
330
- ],
331
- [
332
- "Это демонстрационный пример преобразования русского текста в речь.",
333
- "ru-RU-SvetlanaNeural-Female",
334
- ],
335
- [
336
- "Αυτή είναι μια επίδειξη μετατροπής ελληνικού κειμένου σε ομιλία.",
337
- "el-GR-AthinaNeural-Female",
338
- ],
339
- [
340
- "Esta es una demostración de conversión de texto a voz en español.",
341
- "es-ES-ElviraNeural-Female",
342
- ],
343
- [
344
- "Questa è una dimostrazione di sintesi vocale in italiano.",
345
- "it-IT-ElsaNeural-Female",
346
- ],
347
- [
348
- "Esta é uma demonstração de conversão de texto em fala em português.",
349
- "pt-PT-RaquelNeural-Female",
350
- ],
351
- [
352
- "Це демонстрація тексту до мовлення українською мовою.",
353
- "uk-UA-PolinaNeural-Female",
354
- ],
355
- [
356
- "هذا عرض توضيحي عربي لتحويل النص إلى كلام.",
357
- "ar-EG-SalmaNeural-Female",
358
- ],
359
- [
360
- "இது தமிழ் உரையிலிருந்து பேச்சு மாற்ற டெமோ.",
361
- "ta-IN-PallaviNeural-Female",
362
- ],
363
  ],
364
  inputs=[tts_text, tts_voice],
365
  )
 
219
  initial_md = """
220
  # RVC text-to-speech demo
221
 
 
 
222
  Input text ➡[(edge-tts)](https://github.com/rany2/edge-tts)➡ Speech mp3 file ➡[(RVC)](https://github.com/RVC-Project/Retrieval-based-Voice-Conversion-WebUI)➡ Final output
223
 
224
  This runs on the 🤗 server's cpu, so it may be slow.
225
 
 
 
226
  Input characters are limited to 280 characters, and the speech audio is limited to 20 seconds in this 🤗 space.
227
 
 
228
  """
229
 
230
  app = gr.Blocks()
 
233
  with gr.Row():
234
  with gr.Column():
235
  model_name = gr.Dropdown(
236
+ label="Model",
237
  choices=models,
238
  value=models[0],
239
  )
 
252
  minimum=0,
253
  maximum=1,
254
  label="Index rate",
255
+ value=0.5,
256
  interactive=True,
257
  )
258
  protect0 = gr.Slider(
 
305
  examples_per_page=100,
306
  examples=[
307
  ["これは日本語テキストから音声への変換デモです。", "ja-JP-NanamiNeural-Female"],
308
+ ["This is an English text to speech conversation demo.", "en-GB-MaisieNeural-Female"],
309
+ ["Ini adalah teks percobaan menggunakan Bahasa Indonesia", "id-ID-GadisNeural-Female"],
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
310
  ],
311
  inputs=[tts_text, tts_voice],
312
  )