Spaces:

phuntshowangdi
/

Automatic_sound_recognition

Sleeping

phuntshowangdi committed on Apr 16

Commit

2330d2b

•

1 Parent(s): 0fd1932

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -32,11 +32,14 @@ def transcribe_audio(audio_file):
             # Read the content of the uploaded file
             audio_content = audio_file.read()
-            # Convert the content to torch tensor with single channel
-            waveform, sample_rate = torchaudio.load(BytesIO(audio_content), channels_first=True)
-            waveform = waveform.mean(dim=0, keepdim=True)  # Downmix stereo to mono
-            # Convert the torch tensor to a numpy array
             waveform_np = waveform.numpy()
             # Transcribe the audio

             # Read the content of the uploaded file
             audio_content = audio_file.read()
+            # Load the audio using torchaudio.load
+            waveform, sample_rate = torchaudio.load(BytesIO(audio_content))
+            # Convert to mono if stereo
+            if waveform.shape[0] > 1:
+                waveform = torch.mean(waveform, dim=0, keepdim=True)
+            # Convert the waveform to numpy array
             waveform_np = waveform.numpy()
             # Transcribe the audio