Spaces:

musdfakoc
/

local_intelligence

Sleeping

musdfakoc committed on Sep 30, 2024

Commit

6deab9e

verified ·

1 Parent(s): 3e00b11

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -178,10 +178,18 @@ def generate_audio_from_image(image):
     # Transpose to (samples, channels) for stereo
     generated_audio = generated_audio.T
     # Return the audio and the sample rate (ensure sample rate is an integer)
     return generated_audio, int(sample_rate)
 # Gradio Interface
 def main():
     global generator  # Declare the generator object globally

     # Transpose to (samples, channels) for stereo
     generated_audio = generated_audio.T
+    # Ensure that the audio is a 2D array (for stereo)
+    if generated_audio.ndim == 1:
+        generated_audio = np.expand_dims(generated_audio, axis=-1)  # Add channel dimension for mono
+    # Debug: Print the shape and type of the generated audio
+    print(f"Generated audio shape after processing: {generated_audio.shape}, type: {generated_audio.dtype}")
     # Return the audio and the sample rate (ensure sample rate is an integer)
     return generated_audio, int(sample_rate)
 # Gradio Interface
 def main():
     global generator  # Declare the generator object globally