AudreyMireille commited on
Commit
5378644
1 Parent(s): 07d7c03

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +9 -13
app.py CHANGED
@@ -1,17 +1,13 @@
1
- from transformers import pipeline
2
- from datasets import load_dataset
3
- import soundfile as sf
4
  import torch
5
- synthetiser =pipeline('text-to-speech', model='microsoft/speecht5_tts')
6
- embeddings_dataset = load_dataset("Matthijs/cmu-arctic-xvectors", split="validation")
7
- speaker_embedding = torch.tensor(embeddings_dataset[7306]["xvector"]).unsqueeze(0)
8
- speech = synthetiser("Hello everyone!", forward_params={"speaker_embeddings": speaker_embedding})
9
- sf.write("speech.wav", speech["audio"], samplerate=speech["sampling_rate"])
10
 
11
- import gradio as gr
12
- def text_to_speech(text):
13
- speech = synthetiser(text)
14
- return(speech['audio'])
15
 
 
 
 
 
 
16
  demo_text_to_speech = gr.Interface(text_to_speech, title="Text to speech converter", description="Enter a text here!", inputs='text', outputs='audio')
17
- demo_text_to_speech.launch()
 
1
+ from transformers import VitsModel, AutoTokenizer
 
 
2
  import torch
 
 
 
 
 
3
 
4
+ model = VitsModel.from_pretrained("facebook/mms-tts-eng")
5
+ tokenizer = AutoTokenizer.from_pretrained("facebook/mms-tts-eng")
 
 
6
 
7
+ def generate_waveform(text):
8
+ inputs = tokenizer(text, return_tensors="pt")
9
+ with torch.no_grad():
10
+ output = model(**inputs).waveform
11
+ return (output)
12
  demo_text_to_speech = gr.Interface(text_to_speech, title="Text to speech converter", description="Enter a text here!", inputs='text', outputs='audio')
13
+ demo_text_to_speech.launch()