renatotn7 committed on
Commit
ca52925
1 Parent(s): 9fc089f

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +3 -2
app.py CHANGED
@@ -34,7 +34,7 @@ if 'processor' not in locals():
34
  #text = st.text_area('entre com algum texto')
35
  #st.title("Wav a ser transcrito ")
36
 
37
- wav_up = st.file_uploader("Upload",type=['wav'])
38
  if wav_up is not None:
39
  file_details = {"FileName":wav_up.name,"FileType":wav_up.type}
40
  st.write(file_details)
@@ -54,7 +54,8 @@ if st.button('Processa'):
54
  # audio,
55
  # language = None
56
  # )
57
- input_features = processor(wav_up.getbuffer() , return_tensors="pt").input_features
 
58
  forced_decoder_ids = processor.get_decoder_prompt_ids(language = None, task = "transcribe")
59
 
60
  predicted_ids = model.generate(input_features, forced_decoder_ids = forced_decoder_ids)
 
34
  #text = st.text_area('entre com algum texto')
35
  #st.title("Wav a ser transcrito ")
36
 
37
+ wav_up = st.file_uploader("Upload",type=['wav','ogg','mp3'])
38
  if wav_up is not None:
39
  file_details = {"FileName":wav_up.name,"FileType":wav_up.type}
40
  st.write(file_details)
 
54
  # audio,
55
  # language = None
56
  # )
57
+ processado=np.frombuffer(wav_up.getbuffer(), np.int16).flatten().astype(np.float32) / 32768.0
58
+ input_features = processor(processado , return_tensors="pt").input_features
59
  forced_decoder_ids = processor.get_decoder_prompt_ids(language = None, task = "transcribe")
60
 
61
  predicted_ids = model.generate(input_features, forced_decoder_ids = forced_decoder_ids)