File size: 556 Bytes
5378644
7e5800b
c56c850
7e5800b
5378644
 
7e5800b
5378644
 
 
 
 
7e5800b
5378644
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
from transformers import VitsModel, AutoTokenizer
import torch
import gradio as gr

# Single source of truth for the checkpoint so the model and its tokenizer
# are always loaded from the same repository and cannot drift apart.
MODEL_ID = "facebook/mms-tts-eng"

# Loaded once at import time and shared by every request.
model = VitsModel.from_pretrained(MODEL_ID)
tokenizer = AutoTokenizer.from_pretrained(MODEL_ID)

def generate_waveform(text):
    """Synthesize speech for ``text`` using the module-level VITS model.

    Args:
        text: The text to convert to speech.

    Returns:
        A ``(sample_rate, samples)`` tuple, where ``samples`` is a 1-D NumPy
        array, which is the format Gradio's audio output accepts. Returns
        ``None`` when ``text`` is empty or only whitespace, so nothing is
        synthesized or rendered.
    """
    # Nothing to say: skip tokenization/inference instead of feeding the
    # model an empty sequence.
    if not text or not text.strip():
        return None

    inputs = tokenizer(text, return_tensors="pt")
    with torch.no_grad():
        waveform = model(**inputs).waveform

    # The model output is batched (one row per input text); a single string
    # yields one row. Gradio cannot render a torch tensor, so hand it the
    # sampling rate together with a plain 1-D NumPy array.
    samples = waveform[0].cpu().numpy()
    return model.config.sampling_rate, samples
# Build the web UI: a text box in, an audio player out.
# NOTE: the callback must be `generate_waveform`, the synthesis function
# defined in this file; the previous `text_to_speech` name does not exist
# and raised NameError as soon as the script was started.
demo_text_to_speech = gr.Interface(
    fn=generate_waveform,
    title="Text to speech converter",
    description="Enter a text here!",
    inputs='text',
    outputs='audio',
)
demo_text_to_speech.launch()