mars5_space

Paused

App Files Files Community

arnavmehta7 committed on Jun 8

Commit

0b5b973

•

1 Parent(s): 6ae1eee

added the code

Browse files

Files changed (2) hide show

app.py +47 -4
requirements.txt +36 -0

app.py CHANGED Viewed

@@ -1,7 +1,50 @@
 import gradio as gr
-def greet(name):
-    return "Hello " + name + "!!"
-demo = gr.Interface(fn=greet, inputs="text", outputs="text")
-demo.launch()

 import gradio as gr
+import torch
+import librosa
+import IPython.display as ipd
+from pathlib import Path
+import tempfile, torchaudio
+# Load the MARS5 model via torch.hub from the 'Camb-ai/mars5-tts' repo using
+# its 'mars5_english' entry point. The call returns two objects: the model
+# (`mars5`) and a class used below to build per-request inference configs
+# (`config_class`). This runs once, at module import time.
+# NOTE(review): trust_repo=True presumably skips torch.hub's interactive
+# trust prompt for this repo — confirm this is intended for deployment.
+mars5, config_class = torch.hub.load('Camb-ai/mars5-tts', 'mars5_english', trust_repo=True)
+# Default reference audio and transcript
+# default_audio_path = "example.wav"
+# default_transcript = "We actually haven't managed to meet demand."
+# Function to process the text and audio input and generate the synthesized output
+def synthesize(text, audio_file, transcript):
+    # Load the reference audio
+    wav, sr = librosa.load(audio_file, sr=mars5.sr, mono=True)
+    wav = torch.from_numpy(wav)
+    # Define the configuration for the TTS model
+    deep_clone = True
+    cfg = config_class(deep_clone=deep_clone, rep_penalty_window=100, top_k=100, temperature=0.7, freq_penalty=3)
+    # Generate the synthesized audio
+    ar_codes, wav_out = mars5.tts(text, wav, transcript, cfg=cfg)
+    # Save the synthesized audio to a temporary file
+    output_path = Path(tempfile.mktemp(suffix=".wav"))
+    torchaudio.save(output_path, wav_out.unsqueeze(0), mars5.sr)
+    return str(output_path)
+# Create the Gradio interface
+interface = gr.Interface(
+    fn=synthesize,
+    inputs=[
+        gr.Textbox(label="Text to synthesize"),
+        gr.Audio(label="Audio file to clone from", type="filepath"),
+        gr.Textbox(label="Uploaded audio file transcript"),
+    ],
+    outputs=gr.Audio(label="Synthesized Audio"),
+    title="MARS5 TTS Demo",
+    description="Enter text and upload an audio file to clone the voice and generate synthesized speech using MARS5 TTS."
+)
+# Launch the Gradio app
+interface.launch()

requirements.txt ADDED Viewed

	@@ -0,0 +1,36 @@

+ffmpeg-python
+python-dotenv
+pysrt
+pydub
+torchserve
+torch-model-archiver
+torch-workflow-archiver
+portalocker
+tenacity
+httpx
+python-Levenshtein
+nvgpu
+torch
+torchvision
+torchtext
+torchaudio
+speechtokenizer
+matplotlib
+pandas
+numpy
+ToJyutping
+pypinyin
+phonemizer
+gruut-ipa
+dateparser~=1.1.8
+langcodes
+language-data
+vocos
+einops
+scipy
+onnxruntime
+unidecode
+encodec
+faster-whisper
+tiktoken
+librosa