rwkv-music / app.py
mrfakename's picture
Update app.py
14cc068 verified
raw
history blame
2.23 kB
import gradio as gr
from musiclib import musicgen
from io import BytesIO
import midi_util
from midi_util import VocabConfig
import tempfile
from glob import glob
import soundfile as sf
from midi2audio import FluidSynth
# Module-level FluidSynth wrapper (from midi2audio), created once at import
# time with the library's default arguments. gen() uses it to render the
# generated MIDI file to an audio file.
fs = FluidSynth()
def gen(piano_only, length):
    """Stream generated MIDI tokens, then yield the rendered MIDI and audio files.

    This is a generator meant to be used as a Gradio event handler with three
    outputs (token text, MIDI file, audio).

    Args:
        piano_only: Forwarded to ``musicgen`` as ``piano_only``.
        length: Forwarded to ``musicgen`` as ``length``.

    Yields:
        ``(tokens, None, None)`` for every item produced by ``musicgen`` while
        generation is in progress, followed by one final
        ``(tokens, midi_path, audio_path)`` tuple once the last item has been
        converted to a MIDI file and rendered to a WAV file.
    """
    midi = ''
    for item in musicgen(piano_only=piano_only, length=length):
        # Keep the most recent item: it is what gets converted below.
        midi = item
        yield item, None, None

    cfg = VocabConfig.from_json('./vocab_config.json')
    mid = midi_util.convert_str_to_midi(cfg, midi.strip())

    # Only reserve unique paths here and close the handles right away:
    # both files are (re)written by name below, and reopening a
    # NamedTemporaryFile by name while it is still open is not portable.
    # delete=False keeps the files on disk so the paths yielded to the UI
    # stay valid; nothing in this function removes them afterwards.
    with tempfile.NamedTemporaryFile(suffix='.midi', delete=False) as tmp:
        midi_path = tmp.name
    with tempfile.NamedTemporaryFile(suffix='.wav', delete=False) as aud:
        audio_path = aud.name

    mid.save(midi_path)
    fs.midi_to_audio(midi_path, audio_path)
    yield midi, midi_path, audio_path
# Build the Gradio UI: generation controls, the three outputs fed by gen(),
# and a collapsed accordion with any bundled sample recordings.
with gr.Blocks() as demo:
    gr.Markdown("# RWKV 4 Music (MIDI)\n\nThis demo uses the RWKV 4 MIDI model available [here](https://huggingface.co/BlinkDL/rwkv-4-music/blob/main/RWKV-4-MIDI-560M-v1-20230717-ctx4096.pth). Details may be found [here](https://huggingface.co/BlinkDL/rwkv-4-music). The music generation code may be found [here](https://github.com/BlinkDL/ChatRWKV/tree/main/music). The MIDI Tokenizer may be found [here](https://github.com/briansemrau/MIDI-LLM-tokenizer).\n\nNot sure how to play MIDI files? I recommend using the open source [VLC Media Player](https://www.videolan.org/vlc/) with can play MIDI files using FluidSynth.")
    piano_only = gr.Checkbox(label="Piano Only")
    length = gr.Slider(label="Max Length (in tokens)", minimum=4, maximum=4096, step=1, value=4096, info="The audio may still be shorter than this")
    synth = gr.Button("Synthesize")
    txtout = gr.Textbox(interactive=False, label="MIDI Tokens")
    fileout = gr.File(interactive=False, label="MIDI File", type="binary")
    audioout = gr.Audio(interactive=False, label="Audio")
    # gen() is a generator, so the outputs update as it yields.
    synth.click(gen, inputs=[piano_only, length], outputs=[txtout, fileout, audioout])
    with gr.Accordion("Samples", open=False):
        # glob() returns paths in arbitrary order; sort them so the
        # "Sample N" numbering is stable between runs.
        for i, audpath in enumerate(sorted(glob("*.wav"))):
            # soundfile.read returns (data, samplerate), whereas gr.Audio
            # expects its value as (sample_rate, data).
            dat, sr = sf.read(audpath)
            gr.Audio(interactive=False, value=(sr, dat), label=f'Sample {i + 1}')

# Enable the request queue, keep the API closed and hidden, and start serving.
demo.queue(api_open=False).launch(show_api=False)