cotxetj committed on
Commit
58cb1a8
1 Parent(s): 1eac7b5

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +11 -10
app.py CHANGED
@@ -33,18 +33,18 @@ pipe = pipeline("automatic-speech-recognition",
33
  )
34
 
35
  # Load the model checkpoint and tokenizer
36
- #model = VitsModel.from_pretrained("Matthijs/mms-tts-fra")
37
- #tokenizer = VitsTokenizer.from_pretrained("Matthijs/mms-tts-fra")
38
- model2 = VitsModel.from_pretrained("facebook/mms-tts-fra")
39
- tokenizer = VitsTokenizer.from_pretrained("facebook/mms-tts-fra")
40
 
41
 
42
  # Define a function to translate an audio, in english here
43
  def translate(audio):
44
- return inference(audio)
45
- # outputs = pipe(audio, max_new_tokens=256,
46
- # generate_kwargs={"task": "transcribe", "language": "english"})
47
- # return outputs["text"]
48
 
49
 
50
  # Define function to generate the waveform output
@@ -70,7 +70,7 @@ def predict(transType, language, audio, audio_mic = None):
70
  print("debug1:", audio,"debug2", audio_mic)
71
  if not audio and audio_mic:
72
  audio = audio_mic
73
-
74
  if transType == "Text":
75
  return translate(audio), None
76
  if transType == "Audio":
@@ -95,7 +95,8 @@ demo = gr.Interface(
95
  inputs=[
96
  gr.Radio(label="Choose your output format", choices=transTypes),
97
  gr.Radio(label="Choose a source language", choices=supportLangs, value="Swedish"),
98
- gr.Audio(label="Import an audio", sources="upload", type="filepath"),
 
99
  gr.Audio(label="Record an audio", sources="microphone", type="filepath"),
100
  ],
101
  outputs=[
 
33
  )
34
 
35
  # Load the model checkpoint and tokenizer
36
+ #model = VitsModel.from_pretrained("Matthijs/mms-tts-eng")
37
+ #tokenizer = VitsTokenizer.from_pretrained("Matthijs/mms-tts-eng")
38
+ model2 = VitsModel.from_pretrained("facebook/mms-tts-eng")
39
+ tokenizer = VitsTokenizer.from_pretrained("facebook/mms-tts-eng")
40
 
41
 
42
  # Define a function to translate an audio, in english here
43
  def translate(audio):
44
+ # return inference(audio)
45
+ outputs = pipe(audio, max_new_tokens=256,
46
+ generate_kwargs={"task": "translate", "language": "swedish"})
47
+ return outputs["text"]
48
 
49
 
50
  # Define function to generate the waveform output
 
70
  print("debug1:", audio,"debug2", audio_mic)
71
  if not audio and audio_mic:
72
  audio = audio_mic
73
+ audio = audio[1]
74
  if transType == "Text":
75
  return translate(audio), None
76
  if transType == "Audio":
 
95
  inputs=[
96
  gr.Radio(label="Choose your output format", choices=transTypes),
97
  gr.Radio(label="Choose a source language", choices=supportLangs, value="Swedish"),
98
+ #gr.Audio(label="Import an audio", sources="upload", type="filepath"),
99
+ gr.Audio(label="Import an audio", sources="upload", type="numpy"),
100
  gr.Audio(label="Record an audio", sources="microphone", type="filepath"),
101
  ],
102
  outputs=[