SheldonYC committed on
Commit
6560c3d
1 Parent(s): 70ae40c

update asr model

Browse files
Files changed (3) hide show
  1. app.py +6 -6
  2. packages.txt +2 -0
  3. requirements.txt +3 -1
app.py CHANGED
@@ -1,8 +1,8 @@
1
- import os
2
- os.system("""
3
- apt-get update && apt-get install -y libsndfile1 ffmpeg
4
- pip install Cython
5
- pip install nemo_toolkit['all']""")
6
 
7
  import nemo.collections.asr as nemo_asr
8
  from transformers import pipeline
@@ -22,7 +22,7 @@ def transcribe(audio):
22
  resampled_audio = librosa.resample(y=y.astype("float"), orig_sr=sr, target_sr=16000)
23
  write(audio_name, 16000, resampled_audio)
24
  result = asr_model.transcribe([f"./{audio_name}"])
25
- return result
26
 
27
  asr_model = nemo_asr.models.EncDecCTCModel.from_pretrained(model_name="nvidia/parakeet-ctc-0.6b")
28
 
 
1
+ # import os
2
+ # os.system("""
3
+ # apt-get update && apt-get install -y libsndfile1 ffmpeg
4
+ # pip install Cython
5
+ # pip install nemo_toolkit['all']""")
6
 
7
  import nemo.collections.asr as nemo_asr
8
  from transformers import pipeline
 
22
  resampled_audio = librosa.resample(y=y.astype("float"), orig_sr=sr, target_sr=16000)
23
  write(audio_name, 16000, resampled_audio)
24
  result = asr_model.transcribe([f"./{audio_name}"])
25
+ return result[0]
26
 
27
  asr_model = nemo_asr.models.EncDecCTCModel.from_pretrained(model_name="nvidia/parakeet-ctc-0.6b")
28
 
packages.txt ADDED
@@ -0,0 +1,2 @@
 
 
 
1
+ libsndfile1
2
+ ffmpeg
requirements.txt CHANGED
@@ -2,4 +2,6 @@ torch
2
  transformers
3
  numpy
4
  librosa
5
- scipy
 
 
 
2
  transformers
3
  numpy
4
  librosa
5
+ scipy
6
+ Cython
7
+ nemo_toolkit[all]