qanastek committed on
Commit
2bc0b29
•
1 Parent(s): 535f2ec
Files changed (1) hide show
  1. app.py +10 -5
app.py CHANGED
@@ -28,6 +28,11 @@ models_paths = {
28
  "el-GR": "jonatasgrosman/wav2vec2-large-xlsr-53-greek",
29
  }
30
 
 
 
 
 
 
31
  # Classifier Intent
32
  model_name = 'qanastek/XLMRoberta-Alexa-Intents-Classification'
33
  tokenizer_intent = AutoTokenizer.from_pretrained(model_name)
@@ -53,11 +58,6 @@ examples = [[e, e.split("=")[0].split("/")[-1]] for e in examples]
53
  def transcribe(audio_path, lang_code):
54
 
55
  speech_array, sampling_rate = librosa.load(audio_path, sr=16_000)
56
-
57
- if lang_code not in models:
58
- models[lang_code] = {}
59
- models[lang_code]["processor"] = Wav2Vec2Processor.from_pretrained(models_paths[lang_code])
60
- models[lang_code]["model"] = Wav2Vec2ForCTC.from_pretrained(models_paths[lang_code])
61
 
62
  # Load model
63
  processor_asr = models[lang_code]["processor"]
@@ -94,6 +94,11 @@ def getUniform(text):
94
 
95
 
96
  def predict(wav_file, lang_code):
 
 
 
 
 
97
 
98
  text = transcribe(wav_file, lang_code).replace("apizza","a pizza")
99
 
 
28
  "el-GR": "jonatasgrosman/wav2vec2-large-xlsr-53-greek",
29
  }
30
 
31
+ for lang_code in models_paths.keys():
32
+ models[lang_code] = {}
33
+ models[lang_code]["processor"] = Wav2Vec2Processor.from_pretrained(models_paths[lang_code])
34
+ models[lang_code]["model"] = Wav2Vec2ForCTC.from_pretrained(models_paths[lang_code])
35
+
36
  # Classifier Intent
37
  model_name = 'qanastek/XLMRoberta-Alexa-Intents-Classification'
38
  tokenizer_intent = AutoTokenizer.from_pretrained(model_name)
 
58
  def transcribe(audio_path, lang_code):
59
 
60
  speech_array, sampling_rate = librosa.load(audio_path, sr=16_000)
 
 
 
 
 
61
 
62
  # Load model
63
  processor_asr = models[lang_code]["processor"]
 
94
 
95
 
96
  def predict(wav_file, lang_code):
97
+
98
+ if lang_code not in models_paths.keys():
99
+ return {
100
+ "The language code is unknown!"
101
+ }
102
 
103
  text = transcribe(wav_file, lang_code).replace("apizza","a pizza")
104