jaekookang committed on
Commit
5058a94
1 Parent(s): 48d2b64

updated audio reading module

Browse files
gradio_asr_en_libri100_word_vs_bpe.py CHANGED
@@ -8,7 +8,9 @@ import os
8
  from difflib import Differ
9
  from glob import glob
10
  from loguru import logger
11
- import librosa
 
 
12
  import gradio as gr
13
 
14
  from espnet2.bin.asr_inference import Speech2Text
@@ -43,7 +45,11 @@ logger.info('model loaded')
43
  def predict(wav_file):
44
  logger.info('wav file loaded')
45
  # Load audio
46
- speech, rate = librosa.load(wav_file, sr=16000)
 
 
 
 
47
  # Run inference
48
  W = model_word(speech)[0]
49
  B = model_bpe(speech)[0]
 
8
  from difflib import Differ
9
  from glob import glob
10
  from loguru import logger
11
+ # import librosa
12
+ from scipy.io import wavfile
13
+ import scipy.signal as sps
14
  import gradio as gr
15
 
16
  from espnet2.bin.asr_inference import Speech2Text
 
45
  def predict(wav_file):
46
  logger.info('wav file loaded')
47
  # Load audio
48
+ # speech, rate = librosa.load(wav_file, sr=16000)
49
+ rate, speech_raw = wavfile.read(wav_file)
50
+ number_of_samples = round(len(speech_raw) * float(16000) / rate)
51
+ speech = sps.resample(speech_raw, number_of_samples)
52
+
53
  # Run inference
54
  W = model_word(speech)[0]
55
  B = model_bpe(speech)[0]
requirements.txt CHANGED
@@ -1,6 +1,6 @@
1
  espnet==0.10.6
2
  espnet_model_zoo==0.1.7
3
- gradio==2.7.5.2
4
  loguru==0.6.0
5
  librosa
6
  soundfile
 
1
  espnet==0.10.6
2
  espnet_model_zoo==0.1.7
3
+ gradio
4
  loguru==0.6.0
5
  librosa
6
  soundfile