roman committed on
Commit
7d4b95e
·
1 Parent(s): 7a12d83

audio_input fix

Browse files
Files changed (1) hide show
  1. app.py +3 -0
app.py CHANGED
@@ -58,6 +58,9 @@ if uploaded_file is not None:
58
  audio_input = AudioSegment.from_file(temp_wav_path).set_frame_rate(16000).set_channels(1)
59
  audio_input = np.array(audio_input.get_array_of_samples())
60
 
 
 
 
61
  # Process the audio
62
  input_features = processor(audio_input, return_tensors="pt", sampling_rate=16000).input_values
63
 
 
58
  audio_input = AudioSegment.from_file(temp_wav_path).set_frame_rate(16000).set_channels(1)
59
  audio_input = np.array(audio_input.get_array_of_samples())
60
 
61
+ # Normalize audio
62
+ audio_input = (audio_input - np.mean(audio_input)) / np.std(audio_input)
63
+
64
  # Process the audio
65
  input_features = processor(audio_input, return_tensors="pt", sampling_rate=16000).input_values
66