sanchit-gandhi HF staff committed on
Commit
f805e49
1 Parent(s): 4666f0a

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +12 -0
app.py CHANGED
@@ -39,10 +39,22 @@ def speech_to_speech_translation(audio):
39
  return 16000, synthesised_speech
40
 
41
 
 
 
 
 
 
 
 
 
 
 
42
  demo = gr.Interface(
43
  fn=speech_to_speech_translation,
44
  inputs=gr.Audio(type="filepath"),
45
  outputs=gr.Audio(label="Generated Speech", type="numpy"),
46
  examples=[["./example.wav"]],
 
 
47
  )
48
  demo.launch()
 
39
  return 16000, synthesised_speech
40
 
41
 
42
+ title = "Cascaded STST"
43
+ description = """
44
+ Demo for cascaded speech-to-speech translation (STST), mapping from source speech in any language to target speech in English:
45
+
46
+ ![Cascaded STST](https://huggingface.co/datasets/huggingface-course/audio-course-images/resolve/main/s2st_cascaded.png "Diagram of cascaded speech to speech translation")
47
+
48
+ Demo uses OpenAI's [Whisper Base](https://huggingface.co/openai/whisper-base) model for speech translation, and Microsoft's
49
+ [SpeechT5 TTS](https://huggingface.co/microsoft/speecht5_tts) model for text-to-speech.
50
+ """
51
+
52
  demo = gr.Interface(
53
  fn=speech_to_speech_translation,
54
  inputs=gr.Audio(type="filepath"),
55
  outputs=gr.Audio(label="Generated Speech", type="numpy"),
56
  examples=[["./example.wav"]],
57
+ title=title,
58
+ description=description,
59
  )
60
  demo.launch()