Spaces:

aurelben
/

parlons-nous

Sleeping

aurelben committed on Apr 28

Commit

419feaa

•

1 Parent(s): c451935

change whisper version

Files changed (1) hide show

app.py CHANGED Viewed

@@ -7,6 +7,9 @@ from groq import Groq
 from transformers import pipeline
 from TTS.api import TTS
 MODEL_NAME = "openai/whisper-large-v3"
 BATCH_SIZE = 8
 FILE_LIMIT_MB = 1000
@@ -75,7 +78,7 @@ def process_audio(input_audio, new_chunk):
     stream, transcription = transcribe(input_audio, new_chunk)
     text = autocomplete(transcription)
     print (transcription, text)
-    api = TTS("tts_models/multilingual/multi-dataset/xtts_v2", gpu=True)
     api.tts_to_file(text, file_path="output.wav", speaker="Ana Florence",language="fr", split_sentences=True)
     audio = "./output.wav"
     return stream, text, audio

 from transformers import pipeline
 from TTS.api import TTS
+# Get device
+device = "cuda" if torch.cuda.is_available() else "cpu"
 MODEL_NAME = "openai/whisper-large-v3"
 BATCH_SIZE = 8
 FILE_LIMIT_MB = 1000
     stream, transcription = transcribe(input_audio, new_chunk)
     text = autocomplete(transcription)
     print (transcription, text)
+    api = TTS("tts_models/de/thorsten/tacotron2-DDC").to(device)
     api.tts_to_file(text, file_path="output.wav", speaker="Ana Florence",language="fr", split_sentences=True)
     audio = "./output.wav"
     return stream, text, audio