Spaces:

Baghdad99
/

ha-en

Sleeping

Baghdad99 committed on Dec 20, 2023

Commit

47453aa

•

1 Parent(s): 952235c

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -21,8 +21,14 @@ def translate_speech(audio_data_tuple):
     # Print the shape and type of the audio data
     print(f"Audio data type: {type(audio_data)}, Audio data shape: {audio_data.shape}")
     # Use the speech recognition pipeline to transcribe the audio
-    output = pipe(audio_data.astype(np.float64))  # Convert to Double
     print(f"Output: {output}")  # Print the output to see what it contains

     # Print the shape and type of the audio data
     print(f"Audio data type: {type(audio_data)}, Audio data shape: {audio_data.shape}")
+    # Normalize the audio data to the range [-1, 1]
+    audio_data_normalized = audio_data / np.iinfo(audio_data.dtype).max
+    # Convert the normalized audio data to float64
+    audio_data_float64 = audio_data_normalized.astype(np.float64)
     # Use the speech recognition pipeline to transcribe the audio
+    output = pipe(audio_data_float64)
     print(f"Output: {output}")  # Print the output to see what it contains