XTTS_V1_CPU_working

Running

Vaibhav Srivastav committed on Sep 14, 2023

Commit

33e0dc8

•

1 Parent(s): 194fffd

up

Files changed (2) hide show

app.py CHANGED Viewed

@@ -3,12 +3,12 @@ from TTS.api import TTS
 tts = TTS("tts_models/multilingual/multi-dataset/xtts_v1", gpu=True)
-def predict(prompt, audio_file_pth):
     tts.tts_to_file(text=prompt,
                 file_path="output.wav",
                 speaker_wav=audio_file_pth,
-                language="en")
     return gr.make_waveform(audio="output.wav",)
@@ -19,6 +19,7 @@ gr.Interface(
     fn=predict,
     inputs=[
         gr.Textbox(label="Prompt", info = "One or two sentences at a time is better* (max: 10)", placeholder = "It took me quite a long time to develop a voice, and now that I have it I'm not going to be silent.",),
         gr.Audio(label="Upload Speaker WAV", type="filepath"),
     ],
     outputs=[

 tts = TTS("tts_models/multilingual/multi-dataset/xtts_v1", gpu=True)
+def predict(prompt, language, audio_file_pth):
     tts.tts_to_file(text=prompt,
                 file_path="output.wav",
                 speaker_wav=audio_file_pth,
+                language=language)
     return gr.make_waveform(audio="output.wav",)
     fn=predict,
     inputs=[
         gr.Textbox(label="Prompt", info = "One or two sentences at a time is better* (max: 10)", placeholder = "It took me quite a long time to develop a voice, and now that I have it I'm not going to be silent.",),
+        gr.Dropdown(choices=["en", "es", "fr", "de", "it", "pt", "pl", "tr", "ru", "nl", "cz", "ar", "zh"], max_choices=1),
         gr.Audio(label="Upload Speaker WAV", type="filepath"),
     ],
     outputs=[

requirements.txt CHANGED Viewed

	@@ -0,0 +1 @@


1	+ TTS