Spaces:
Running
Running
Update
Browse files
app.py
CHANGED
@@ -28,6 +28,11 @@ models_paths = {
|
|
28 |
"el-GR": "jonatasgrosman/wav2vec2-large-xlsr-53-greek",
|
29 |
}
|
30 |
|
|
|
|
|
|
|
|
|
|
|
31 |
# Classifier Intent
|
32 |
model_name = 'qanastek/XLMRoberta-Alexa-Intents-Classification'
|
33 |
tokenizer_intent = AutoTokenizer.from_pretrained(model_name)
|
@@ -53,11 +58,6 @@ examples = [[e, e.split("=")[0].split("/")[-1]] for e in examples]
|
|
53 |
def transcribe(audio_path, lang_code):
|
54 |
|
55 |
speech_array, sampling_rate = librosa.load(audio_path, sr=16_000)
|
56 |
-
|
57 |
-
if lang_code not in models:
|
58 |
-
models[lang_code] = {}
|
59 |
-
models[lang_code]["processor"] = Wav2Vec2Processor.from_pretrained(models_paths[lang_code])
|
60 |
-
models[lang_code]["model"] = Wav2Vec2ForCTC.from_pretrained(models_paths[lang_code])
|
61 |
|
62 |
# Load model
|
63 |
processor_asr = models[lang_code]["processor"]
|
@@ -94,6 +94,11 @@ def getUniform(text):
|
|
94 |
|
95 |
|
96 |
def predict(wav_file, lang_code):
|
|
|
|
|
|
|
|
|
|
|
97 |
|
98 |
text = transcribe(wav_file, lang_code).replace("apizza","a pizza")
|
99 |
|
|
|
28 |
"el-GR": "jonatasgrosman/wav2vec2-large-xlsr-53-greek",
|
29 |
}
|
30 |
|
31 |
+
for lang_code in models_paths.keys():
|
32 |
+
models[lang_code] = {}
|
33 |
+
models[lang_code]["processor"] = Wav2Vec2Processor.from_pretrained(models_paths[lang_code])
|
34 |
+
models[lang_code]["model"] = Wav2Vec2ForCTC.from_pretrained(models_paths[lang_code])
|
35 |
+
|
36 |
# Classifier Intent
|
37 |
model_name = 'qanastek/XLMRoberta-Alexa-Intents-Classification'
|
38 |
tokenizer_intent = AutoTokenizer.from_pretrained(model_name)
|
|
|
58 |
def transcribe(audio_path, lang_code):
|
59 |
|
60 |
speech_array, sampling_rate = librosa.load(audio_path, sr=16_000)
|
|
|
|
|
|
|
|
|
|
|
61 |
|
62 |
# Load model
|
63 |
processor_asr = models[lang_code]["processor"]
|
|
|
94 |
|
95 |
|
96 |
def predict(wav_file, lang_code):
|
97 |
+
|
98 |
+
if lang_code not in models_paths.keys():
|
99 |
+
return {
|
100 |
+
"The language code is unknown!"
|
101 |
+
}
|
102 |
|
103 |
text = transcribe(wav_file, lang_code).replace("apizza","a pizza")
|
104 |
|