SeamlessOnDevice

Running

Tonic committed on Nov 20, 2023

Commit

b293439

•

1 Parent(s): 09d6d8c

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -38,29 +38,25 @@ def speech_to_text(audio_data, tgt_lang):
     audio_input, _ = torchaudio.load(file_path)
     s2t_model = torch.jit.load("unity_on_device.ptl")
     with torch.no_grad():
-        text = s2t_model(audio_input, tgt_lang=languages[tgt_lang])
-    # Print the model's output for debugging
-    print("Speech to Text Model Output:", text)
-    return text
 def speech_to_speech_translation(audio_data, tgt_lang):
     file_path = save_audio(audio_data)
     audio_input, _ = torchaudio.load(file_path)
     s2st_model = torch.jit.load("unity_on_device.ptl")
     with torch.no_grad():
-        text, units, waveform = s2st_model(audio_input, tgt_lang=languages[tgt_lang])
-    # Print the model's output for debugging (optional)
-    print("Translated Text:", text)
     print("Units:", units)
     print("Waveform Shape:", waveform.shape)
-    output_file = "/tmp/result.wav"
-    torchaudio.save(output_file, waveform.unsqueeze(0), sample_rate=16000)
-    return text, output_file
 def create_interface():

     audio_input, _ = torchaudio.load(file_path)
     s2t_model = torch.jit.load("unity_on_device.ptl")
     with torch.no_grad():
+        model_output = s2t_model(audio_input, tgt_lang=languages[tgt_lang])
+    transcribed_text = model_output[0] if model_output else ""
+    print("Speech to Text Model Output:", transcribed_text)
+    return transcribed_text
 def speech_to_speech_translation(audio_data, tgt_lang):
     file_path = save_audio(audio_data)
     audio_input, _ = torchaudio.load(file_path)
     s2st_model = torch.jit.load("unity_on_device.ptl")
     with torch.no_grad():
+        translated_text, units, waveform = s2st_model(audio_input, tgt_lang=languages[tgt_lang])
+    output_file = "/tmp/result.wav"
+    torchaudio.save(output_file, waveform.unsqueeze(0), sample_rate=16000)
+    print("Translated Text:", translated_text)
     print("Units:", units)
     print("Waveform Shape:", waveform.shape)
+    return translated_text, output_file
 def create_interface():