# Mel_2_Wav / app.py
# nakas's picture
# Update app.py
# a443433
import gradio as gr
import numpy as np
import librosa
from scipy.io.wavfile import write
# librosa (imported above) is used to convert a Mel spectrogram image to audio
def mel_to_audio(mel_spectrogram):
    """Invert a Mel spectrogram image to audio and save it as a WAV file.

    Args:
        mel_spectrogram: Array-like image. Either a 2-D array read as
            (n_mels, frames), or a 3-D array read as
            (height, width, channels) whose colour channels are averaged
            into a single grayscale plane before inversion.
            NOTE(review): Gradio's "image" input normally supplies an
            (height, width, 3) array - confirm against the Gradio version
            in use.

    Returns:
        The path of the WAV file that was written ('output.wav').

    Raises:
        ValueError: If no image is supplied, or if the array is neither
            2-D nor 3-D.
    """
    if mel_spectrogram is None:
        raise ValueError("No Mel spectrogram image was provided.")

    # Work in float64 so librosa does not hit a same_kind casting error on
    # integer pixel data.
    mel = np.asarray(mel_spectrogram, dtype=np.float64)

    if mel.ndim == 3:
        # Collapse the colour channels (ignoring an alpha channel, if any) to a
        # single grayscale plane; librosa would otherwise interpret the leading
        # axis as independent audio channels.
        mel = mel[..., :3].mean(axis=-1)
    if mel.ndim != 2:
        raise ValueError(
            f"Expected a 2-D or 3-D image array, got {mel.ndim} dimension(s)."
        )

    # NOTE(review): row 0 of the image is used as the lowest Mel band.
    # Spectrogram pictures are often drawn with low frequencies at the bottom;
    # confirm whether the image needs a vertical flip before inversion.

    output = 'output.wav'
    sample = 44100

    # Invert with the same sample rate that is written to the WAV header;
    # librosa otherwise assumes its default of 22050 Hz and the file would
    # play back at the wrong speed and pitch.
    audio = librosa.feature.inverse.mel_to_audio(
        mel, sr=sample, dtype=np.float64
    )

    # Save the audio to a file
    print(output)
    write(output, sample, np.asarray(audio, dtype=np.float64))
    return output
# Build the Gradio interface: an "image" input is passed to mel_to_audio and
# the result is shown through an "audio" output.
app = gr.Interface(
    fn=mel_to_audio,
    inputs="image",
    outputs="audio",
)

# Start serving the interface.
app.launch()