Moore-Language-Space-ZeroGPU

Sleeping

App Files Community

ANYANTUDRE committed on Oct 22, 2024

Commit

f0dafb8

1 Parent(s): 5966f2d

fixed small bugs

Browse files

Files changed (4) hide show

app.py +7 -4
goai_helpers/goai_stt2.py +1 -1
goai_helpers/goai_tts.py +1 -1
goai_helpers/goai_ttt_tts_pipeline.py +1 -1

app.py CHANGED Viewed

@@ -11,7 +11,7 @@ login(token=auth_token)
 # list all files in the ./audios directory for the dropdown
 AUDIO_FILES = [f for f in os.listdir('./exples_voix') if os.path.isfile(os.path.join('./exples_voix', f))]
-MODELES_TTS = ["ArissBandoss/coqui-tts-moore-V1", "ArissBandoss/mms-tts-mos-V18"]
 MODELES_ASR = ["ArissBandoss/whisper-small-mos", "openai/whisper-large-v3-turbo"]
 LANGUAGES   = ["Automatic Detection"]
@@ -113,7 +113,7 @@ goai_ttt_tts_pipeline_if = gr.Interface(
               ["Ils achetèrent des troupeaux, firent construire des cases, parcoururent tout le pays pour offrir à leur mère et à leurs femmes les plus beaux bijoux, les plus belles étoffes.", "exple_voix_feminine.wav", None]
              ],
     cache_examples=False,
-    title="Démo des Modèles pour le Mooré: Traduction (Text-to-Text) et Synthèse Vocale (Text-to-Speech)",
     description=DESCRIPTION,
 )
@@ -137,14 +137,17 @@ goai_stt_ttt_pipeline_if = gr.Interface(
         gr.Slider(label="Chunk Length (s)", minimum=1, maximum=60, value=17.5, step=0.1),
         gr.Slider(label="Stride Length (s)", minimum=1, maximum=30, value=1, step=0.1),
     ],
-    outputs=[gr.Textbox(label="Output"), gr.File(label="Download Files")],
     examples=[["./audios/example1.mp3", "a ye ligdi"],
               ["./audios/example2.mp3", "zoe nimbãanega"],
               ["./audios/example3.mp3", "zãng-zãnga"],
               ["./audios/example4.mp3", "yõk foto"]
              ],
     cache_examples=False,
-    title="Mooré ASR",
     description=DESCRIPTION,
     flagging_mode="auto",
 )

 # list all files in the ./audios directory for the dropdown
 AUDIO_FILES = [f for f in os.listdir('./exples_voix') if os.path.isfile(os.path.join('./exples_voix', f))]
+MODELES_TTS = ["ArissBandoss/coqui-tts-moore-V1", "ArissBandoss/mms-tts-mos-male-17-V5"]
 MODELES_ASR = ["ArissBandoss/whisper-small-mos", "openai/whisper-large-v3-turbo"]
 LANGUAGES   = ["Automatic Detection"]
               ["Ils achetèrent des troupeaux, firent construire des cases, parcoururent tout le pays pour offrir à leur mère et à leurs femmes les plus beaux bijoux, les plus belles étoffes.", "exple_voix_feminine.wav", None]
              ],
     cache_examples=False,
+    title="Mooré TTS & Traduction",
     description=DESCRIPTION,
 )
         gr.Slider(label="Chunk Length (s)", minimum=1, maximum=60, value=17.5, step=0.1),
         gr.Slider(label="Stride Length (s)", minimum=1, maximum=30, value=1, step=0.1),
     ],
+    outputs=[
+        gr.Textbox(label="Texte Mooré"),
+        gr.Textbox(label="Texte Francais"),
+    ],
     examples=[["./audios/example1.mp3", "a ye ligdi"],
               ["./audios/example2.mp3", "zoe nimbãanega"],
               ["./audios/example3.mp3", "zãng-zãnga"],
               ["./audios/example4.mp3", "yõk foto"]
              ],
     cache_examples=False,
+    title="Mooré ASR & Traduction",
     description=DESCRIPTION,
     flagging_mode="auto",
 )

goai_helpers/goai_stt2.py CHANGED Viewed

@@ -51,7 +51,7 @@ def transcribe(
     if forced_decoder_ids:
         generate_kwargs["forced_decoder_ids"] = forced_decoder_ids
-    output = pipe(inputs, batch_size=batch_size, **generate_kwargs)
     transcription_text = output['text']

     if forced_decoder_ids:
         generate_kwargs["forced_decoder_ids"] = forced_decoder_ids
+    output = pipe(inputs, batch_size=batch_size, padding=True, truncation=True, **generate_kwargs)
     transcription_text = output['text']

goai_helpers/goai_tts.py CHANGED Viewed

@@ -32,7 +32,7 @@ def goai_tts(texte):
     start_time = time.time()
     # Charger le modèle TTS avec le token d'authentification
-    model_id = "ArissBandoss/mms-tts-mos-V18"
     synthesiser = pipeline("text-to-speech", model_id, device=device)
     # Inférence

     start_time = time.time()
     # Charger le modèle TTS avec le token d'authentification
+    model_id = "ArissBandoss/mms-tts-mos-male-17-V5"
     synthesiser = pipeline("text-to-speech", model_id, device=device)
     # Inférence

goai_helpers/goai_ttt_tts_pipeline.py CHANGED Viewed

@@ -34,7 +34,7 @@ def goai_many_tts(
         return sampling_rate, audio_array.numpy()
-    elif tts_model == "ArissBandoss/mms-tts-mos-V18":
         sample_rate, audio_data = goai_tts(text)
         return sample_rate, audio_data

         return sampling_rate, audio_array.numpy()
+    elif tts_model == "ArissBandoss/mms-tts-mos-male-17-V5":
         sample_rate, audio_data = goai_tts(text)
         return sample_rate, audio_data