Spaces:

gitgato
/

gitgato-tr-xtts

Runtime error

App Files Community

gitgato committed on Jun 24, 2024

Commit

cb4e037

verified ·

1 Parent(s): 11ed18a

Update app.py

Browse files

Files changed (1) hide show

app.py +6 -8

app.py CHANGED Viewed

@@ -3,15 +3,15 @@ import torch
 from datasets import load_dataset
 from transformers import pipeline, SpeechT5Processor, SpeechT5HifiGan, SpeechT5ForTextToSpeech
-model_id = "gitgato/tr-xtts"  # update with your model id
-# pipe = pipeline("automatic-speech-recognition", model=model_id)
 model = SpeechT5ForTextToSpeech.from_pretrained(model_id)
 vocoder = SpeechT5HifiGan.from_pretrained("microsoft/speecht5_hifigan")
 embeddings_dataset = load_dataset("Matthijs/cmu-arctic-xvectors", split="validation")
 speaker_embeddings = torch.tensor(embeddings_dataset[7440]["xvector"]).unsqueeze(0)
 # checkpoint = "microsoft/speecht5_tts"
-processor = SpeechT5Processor.from_pretrained(model_id)
 replacements = [
     ("à", "a"),
@@ -30,7 +30,7 @@ replacements = [
 title = "Text-to-Speech"
 description = """
-Demo for text-to-speech translation in French. Demo uses [Sandiago21/speecht5_finetuned_facebook_voxpopuli_french](https://huggingface.co/Sandiago21/speecht5_finetuned_facebook_voxpopuli_french) checkpoint, which is based on Microsoft's
 [SpeechT5 TTS](https://huggingface.co/microsoft/speecht5_tts) model and is fine-tuned in French Audio dataset
 ![Text-to-Speech (TTS)"](https://geekflare.com/wp-content/uploads/2021/07/texttospeech-1200x385.png "Diagram of Text-to-Speech (TTS)")
 """
@@ -53,9 +53,7 @@ syntesize_speech_gradio = gr.Interface(
     synthesize_speech,
     inputs = gr.Textbox(label="Text", placeholder="Type something here..."),
     outputs=gr.Audio(),
-    examples=["Hola, probando audio."],
     title=title,
     description=description,
-).launch()

 from datasets import load_dataset
 from transformers import pipeline, SpeechT5Processor, SpeechT5HifiGan, SpeechT5ForTextToSpeech
+model_id = "gitgato/tr-tts"  # update with your model id
+pipe = pipeline("text-to-speech", model="gitgato/tr-xtts")
 model = SpeechT5ForTextToSpeech.from_pretrained(model_id)
 vocoder = SpeechT5HifiGan.from_pretrained("microsoft/speecht5_hifigan")
 embeddings_dataset = load_dataset("Matthijs/cmu-arctic-xvectors", split="validation")
 speaker_embeddings = torch.tensor(embeddings_dataset[7440]["xvector"]).unsqueeze(0)
 # checkpoint = "microsoft/speecht5_tts"
+processor = AutoProcessor.from_pretrained("gitgato/tr-xtts")
 replacements = [
     ("à", "a"),
 title = "Text-to-Speech"
 description = """
+Demo for text-to-speech translation in French. Demo uses [gitgato/trtts](https://huggingface.co) checkpoint, which is based on Microsoft's
 [SpeechT5 TTS](https://huggingface.co/microsoft/speecht5_tts) model and is fine-tuned in French Audio dataset
 ![Text-to-Speech (TTS)"](https://geekflare.com/wp-content/uploads/2021/07/texttospeech-1200x385.png "Diagram of Text-to-Speech (TTS)")
 """
     synthesize_speech,
     inputs = gr.Textbox(label="Text", placeholder="Type something here..."),
     outputs=gr.Audio(),
+    examples=["Je n'entrerai pas dans les détails, mais je profiterai des secondes qui me restent pour exposer la position ALDE sur le marquage CE, un des points cruciaux de ce rapport."],
     title=title,
     description=description,
+).launch()