Merlintxu committed on
Commit
1851c8f
1 Parent(s): df609a3

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +5 -6
app.py CHANGED
@@ -12,7 +12,6 @@ from transformers import logging
12
  warnings.filterwarnings("ignore")
13
  logging.set_verbosity_error()
14
 
15
-
16
  # Updated models by language
17
  MODELS = {
18
  "es": [
@@ -23,7 +22,7 @@ MODELS = {
23
  "en": [
24
  "openai/whisper-large-v3",
25
  "facebook/wav2vec2-large-960h",
26
- "microsoft/wav2vec2-base-960"
27
  ],
28
  "pt": [
29
  "facebook/wav2vec2-large-xlsr-53-portuguese",
@@ -103,18 +102,18 @@ def combined_interface(audio):
103
  language, model_options = detect_and_select_model(audio)
104
  selected_model = model_options[0]
105
 
106
- yield language, gr.Dropdown.update(choices=model_options, value=selected_model), selected_model, ""
107
 
108
  full_transcription = ""
109
  for partial_transcription in transcribe_audio_stream(audio, selected_model):
110
  full_transcription += partial_transcription + " "
111
- yield language, gr.Dropdown.update(choices=model_options, value=selected_model), selected_model, full_transcription.strip()
112
 
113
  # Clean up temporary files
114
  os.remove("converted_audio.wav")
115
 
116
  except Exception as e:
117
- yield str(e), gr.Dropdown.update(choices=[]), "", "An error occurred during processing."
118
 
119
  iface = gr.Interface(
120
  fn=combined_interface,
@@ -126,7 +125,7 @@ iface = gr.Interface(
126
  gr.Textbox(label="Transcription", lines=10)
127
  ],
128
  title="Multilingual Audio Transcriber with Real-time Display",
129
- description="Upload an audio file to detect the language, select the transcription model, and get the transcription in real-time. Optimized for Spanish and English.",
130
  live=True
131
  )
132
 
 
12
  warnings.filterwarnings("ignore")
13
  logging.set_verbosity_error()
14
 
 
15
  # Updated models by language
16
  MODELS = {
17
  "es": [
 
22
  "en": [
23
  "openai/whisper-large-v3",
24
  "facebook/wav2vec2-large-960h",
25
+ "microsoft/wav2vec2-base-960h"
26
  ],
27
  "pt": [
28
  "facebook/wav2vec2-large-xlsr-53-portuguese",
 
102
  language, model_options = detect_and_select_model(audio)
103
  selected_model = model_options[0]
104
 
105
+ yield language, model_options, selected_model, ""
106
 
107
  full_transcription = ""
108
  for partial_transcription in transcribe_audio_stream(audio, selected_model):
109
  full_transcription += partial_transcription + " "
110
+ yield language, model_options, selected_model, full_transcription.strip()
111
 
112
  # Clean up temporary files
113
  os.remove("converted_audio.wav")
114
 
115
  except Exception as e:
116
+ yield str(e), [], "", "An error occurred during processing."
117
 
118
  iface = gr.Interface(
119
  fn=combined_interface,
 
125
  gr.Textbox(label="Transcription", lines=10)
126
  ],
127
  title="Multilingual Audio Transcriber with Real-time Display",
128
+ description="Upload an audio file to detect the language, select the transcription model, and get the transcription in real-time. Optimized for Spanish, English, and Portuguese.",
129
  live=True
130
  )
131