Spaces:
Runtime error
Runtime error
jaekookang
committed on
Commit
•
5058a94
1
Parent(s):
48d2b64
updated audio reading module
Browse files
gradio_asr_en_libri100_word_vs_bpe.py
CHANGED
@@ -8,7 +8,9 @@ import os
|
|
8 |
from difflib import Differ
|
9 |
from glob import glob
|
10 |
from loguru import logger
|
11 |
-
import librosa
|
|
|
|
|
12 |
import gradio as gr
|
13 |
|
14 |
from espnet2.bin.asr_inference import Speech2Text
|
@@ -43,7 +45,11 @@ logger.info('model loaded')
|
|
43 |
def predict(wav_file):
|
44 |
logger.info('wav file loaded')
|
45 |
# Load audio
|
46 |
-
speech, rate = librosa.load(wav_file, sr=16000)
|
|
|
|
|
|
|
|
|
47 |
# Run inference
|
48 |
W = model_word(speech)[0]
|
49 |
B = model_bpe(speech)[0]
|
|
|
8 |
from difflib import Differ
|
9 |
from glob import glob
|
10 |
from loguru import logger
|
11 |
+
# import librosa
|
12 |
+
from scipy.io import wavfile
|
13 |
+
import scipy.signal as sps
|
14 |
import gradio as gr
|
15 |
|
16 |
from espnet2.bin.asr_inference import Speech2Text
|
|
|
45 |
def predict(wav_file):
|
46 |
logger.info('wav file loaded')
|
47 |
# Load audio
|
48 |
+
# speech, rate = librosa.load(wav_file, sr=16000)
|
49 |
+
rate, speech_raw = wavfile.read(wav_file)
|
50 |
+
number_of_samples = round(len(speech_raw) * float(16000) / rate)
|
51 |
+
speech = sps.resample(speech_raw, number_of_samples)
|
52 |
+
|
53 |
# Run inference
|
54 |
W = model_word(speech)[0]
|
55 |
B = model_bpe(speech)[0]
|
requirements.txt
CHANGED
@@ -1,6 +1,6 @@
|
|
1 |
espnet==0.10.6
|
2 |
espnet_model_zoo==0.1.7
|
3 |
-
gradio
|
4 |
loguru==0.6.0
|
5 |
librosa
|
6 |
soundfile
|
|
|
1 |
espnet==0.10.6
|
2 |
espnet_model_zoo==0.1.7
|
3 |
+
gradio
|
4 |
loguru==0.6.0
|
5 |
librosa
|
6 |
soundfile
|