arnavmehta7 committed on
Commit
9f8a599
1 Parent(s): 779952a

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +5 -14
app.py CHANGED
@@ -5,7 +5,6 @@ import librosa
5
  from pathlib import Path
6
  import tempfile, torchaudio
7
  from transformers import pipeline
8
- from uuid import uuid4
9
 
10
  # Load the MARS5 model
11
  mars5, config_class = torch.hub.load('Camb-ai/mars5-tts', 'mars5_english', trust_repo=True)
@@ -24,16 +23,6 @@ def transcribe_file(f: str) -> str:
24
  # Function to process the text and audio input and generate the synthesized output
25
  def synthesize(text, audio_file, transcript, kwargs_dict):
26
  print(f">>>>>>> Kwargs dict: {kwargs_dict}")
27
- # audio_file = Path(audio_file)
28
- # temp_file = f"{uuid4()}.{audio_file.suffix}"
29
-
30
- # # copying the audio_file
31
- # with open(audio_file, 'rb') as src, open(temp_file, 'wb') as dst:
32
- # dst.write(src.read())
33
-
34
- # audio_file = temp_file
35
-
36
- print(f">>>>> synthesizing! audio_file: {audio_file}")
37
  if not transcript:
38
  transcript = transcribe_file(audio_file)
39
 
@@ -67,7 +56,9 @@ defaults = {
67
 
68
 
69
  with gr.Blocks() as demo:
70
- gr.Markdown("## MARS5 TTS Demo\nEnter text and upload an audio file to clone the voice and generate synthesized speech using MARS5 TTS.")
 
 
71
  text = gr.Textbox(label="Text to synthesize")
72
  audio_file = gr.Audio(label="Audio file to clone from", type="filepath")
73
 
@@ -143,8 +134,8 @@ with gr.Blocks() as demo:
143
  # Add examples
144
  defaults = [0.8, -1, 0.2, 1.0, 2.6, 0.4, 100, 3, True]
145
  examples = [
146
- ["Today is a wonderful day!", "female_speaker_1.flac", "People look, but no one ever finds it.", *defaults],
147
- ["You guys need to figure this out.", "male_speaker_1.flac", "Ask her to bring these things with her from the store.", *defaults]
148
  ]
149
 
150
  gr.Examples(
 
5
  from pathlib import Path
6
  import tempfile, torchaudio
7
  from transformers import pipeline
 
8
 
9
  # Load the MARS5 model
10
  mars5, config_class = torch.hub.load('Camb-ai/mars5-tts', 'mars5_english', trust_repo=True)
 
23
  # Function to process the text and audio input and generate the synthesized output
24
  def synthesize(text, audio_file, transcript, kwargs_dict):
25
  print(f">>>>>>> Kwargs dict: {kwargs_dict}")
 
 
 
 
 
 
 
 
 
 
26
  if not transcript:
27
  transcript = transcribe_file(audio_file)
28
 
 
56
 
57
 
58
  with gr.Blocks() as demo:
59
+ link = "https://github.com/Camb-ai/MARS5-TTS"
60
+ gr.Markdown(f"## MARS5 TTS Demo\nEnter text and upload an audio file to clone the voice and generate synthesized speech using **[MARS5-TTS]({link})**")
61
+
62
  text = gr.Textbox(label="Text to synthesize")
63
  audio_file = gr.Audio(label="Audio file to clone from", type="filepath")
64
 
 
134
  # Add examples
135
  defaults = [0.8, -1, 0.2, 1.0, 2.6, 0.4, 100, 3, True]
136
  examples = [
137
+ ["Can you please go there and figure it out?", "female_speaker_1.flac", "People look, but no one ever finds it.", *defaults],
138
+ ["Hey, do you need my help?", "male_speaker_1.flac", "Ask her to bring these things with her from the store.", *defaults]
139
  ]
140
 
141
  gr.Examples(