Spaces:
Running
on
Zero
Running
on
Zero
import gradio as gr | |
from musiclib import musicgen | |
from io import BytesIO | |
import midi_util | |
from midi_util import VocabConfig | |
import tempfile | |
from glob import glob | |
import soundfile as sf | |
from midi2audio import FluidSynth | |
fs = FluidSynth() | |
def gen(piano_only, length): | |
midi = '' | |
for item in musicgen(piano_only=piano_only, length=length): | |
midi = item | |
yield item, None, None | |
bio = BytesIO() | |
cfg = VocabConfig.from_json('./vocab_config.json') | |
text = midi.strip() | |
mid = midi_util.convert_str_to_midi(cfg, text) | |
with tempfile.NamedTemporaryFile(suffix='.midi', delete=False) as tmp, tempfile.NamedTemporaryFile(suffix='.wav', delete=False) as aud: | |
mid.save(tmp.name) | |
fs.midi_to_audio(tmp.name, aud.name) | |
yield midi, tmp.name, aud.name | |
with gr.Blocks() as demo: | |
gr.Markdown("# RWKV 4 Music (MIDI)\n\nThis demo uses the RWKV 4 MIDI model available [here](https://huggingface.co/BlinkDL/rwkv-4-music/blob/main/RWKV-4-MIDI-560M-v1-20230717-ctx4096.pth). Details may be found [here](https://huggingface.co/BlinkDL/rwkv-4-music). The music generation code may be found [here](https://github.com/BlinkDL/ChatRWKV/tree/main/music). The MIDI Tokenizer may be found [here](https://github.com/briansemrau/MIDI-LLM-tokenizer).\n\nNot sure how to play MIDI files? I recommend using the open source [VLC Media Player](https://www.videolan.org/vlc/) with can play MIDI files using FluidSynth.") | |
piano_only = gr.Checkbox(label="Piano Only") | |
length = gr.Slider(label="Max Length (in tokens)", minimum=4, maximum=4096, step=1, value=4096, info="The audio may still be shorter than this") | |
synth = gr.Button("Synthesize") | |
txtout = gr.Textbox(interactive=False, label="MIDI Tokens") | |
fileout = gr.File(interactive=False, label="MIDI File", type="binary") | |
audioout = gr.Audio(interactive=False, label="Audio") | |
synth.click(gen, inputs=[piano_only, length], outputs=[txtout, fileout, audioout]) | |
with gr.Accordion("Samples", open=False): | |
for i, audpath in enumerate(glob("*.wav")): | |
sr, dat = sf.read(audpath) | |
gr.Audio(interactive=False, value=(sr,dat,), label=f'Sample {i + 1}') | |
demo.queue(api_open=False).launch(show_api=False) |