Spaces:
Sleeping
Sleeping
Update app.py
Browse files
app.py
CHANGED
@@ -178,10 +178,18 @@ def generate_audio_from_image(image):
|
|
178 |
# Transpose to (samples, channels) for stereo
|
179 |
generated_audio = generated_audio.T
|
180 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
181 |
# Return the audio and the sample rate (ensure sample rate is an integer)
|
182 |
return generated_audio, int(sample_rate)
|
183 |
|
184 |
|
|
|
185 |
# Gradio Interface
|
186 |
def main():
|
187 |
global generator # Declare the generator object globally
|
|
|
178 |
# Transpose to (samples, channels) for stereo
|
179 |
generated_audio = generated_audio.T
|
180 |
|
181 |
+
# Ensure the audio is a 2D (samples, channels) array, even when the output is mono (1D)
|
182 |
+
if generated_audio.ndim == 1:
|
183 |
+
generated_audio = np.expand_dims(generated_audio, axis=-1) # Add channel dimension for mono
|
184 |
+
|
185 |
+
# Debug: Print the shape and dtype of the generated audio
|
186 |
+
print(f"Generated audio shape after processing: {generated_audio.shape}, type: {generated_audio.dtype}")
|
187 |
+
|
188 |
# Return the audio and the sample rate (ensure sample rate is an integer)
|
189 |
return generated_audio, int(sample_rate)
|
190 |
|
191 |
|
192 |
+
|
193 |
# Gradio Interface
|
194 |
def main():
|
195 |
global generator # Declare the generator object globally
|