lauraibnz committed on
Commit
5a472ab
1 Parent(s): 4f3a930

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +6 -4
app.py CHANGED
@@ -64,9 +64,13 @@ with gr.Blocks(title="🎹 MIDI-AudioLDM", theme=gr.themes.Base(text_size=gr.the
64
  """)
65
  with gr.Column(variant='panel'):
66
  midi = gr.File(label="midi file", file_types=[".mid"])
67
- midi_synth = gr.Audio(label="synthesized midi")
68
- midi.upload(synthesize, midi, midi_synth)
69
  prompt = gr.Textbox(label="prompt", info="Enter a descriptive text prompt to guide the audio generation.")
 
 
 
 
 
 
70
  with gr.Accordion("Advanced Settings", open=False):
71
  duration = gr.Slider(0, 30, value=10, step=2.5, label="duration", info="Modify the duration in seconds of the output audio file.")
72
  inf = gr.Slider(0, 50, value=20, step=1, label="inference steps", info="Edit the number of denoising steps. A larger number usually leads to higher quality but slower results.")
@@ -75,8 +79,6 @@ with gr.Blocks(title="🎹 MIDI-AudioLDM", theme=gr.themes.Base(text_size=gr.the
75
  seed = gr.Number(value=25, label="random seed", info="Change the random seed for a different generation result.")
76
  cond = gr.Slider(0.0, 1.0, value=1.0, step=0.1, label="conditioning scale", info="Choose a value between 0 and 1. The larger the more it will take the conditioning into account. Lower values are recommended for more creative prompts.")
77
  guess = gr.Checkbox(label="guess mode", info="Optionally select guess mode. If so, the model will try to recognize the content of the MIDI without the need of a text prompt.")
78
- with gr.Column(variant='panel'):
79
- audio = gr.Audio(label="generated audio")
80
  btn = gr.Button("Generate")
81
  btn.click(predict, inputs=[midi, prompt, neg_prompt, duration, seed, cond, inf, guidance_scale, guess], outputs=[audio])
82
  gr.Examples(examples=[["S00.mid", "piano", "", 10, 25, 1.0, 20, 2.5, False], ["S00.mid", "violin", "", 10, 25, 1.0, 20, 2.5, False], ["S00.mid", "woman singing, studio recording", "noise", 10, 25, 1.0, 20, 2.5, False], ["S00.mid", "jazz band, clean", "noise", 10, 25, 0.8, 20, 2.5, False], ["S00.mid", "choir", "noise, percussion", 10, 25, 0.7, 20, 2.5, False]], inputs=[midi, prompt, neg_prompt, duration, seed, cond, inf, guidance_scale, guess], fn=run_example, outputs=[midi_synth, audio], cache_examples=True)
 
64
  """)
65
  with gr.Column(variant='panel'):
66
  midi = gr.File(label="midi file", file_types=[".mid"])
 
 
67
  prompt = gr.Textbox(label="prompt", info="Enter a descriptive text prompt to guide the audio generation.")
68
+ with gr.Row():
69
+ with gr.Column():
70
+ midi_synth = gr.Audio(label="synthesized midi")
71
+ midi.upload(synthesize, midi, midi_synth)
72
+ with gr.Column():
73
+ audio = gr.Audio(label="generated audio")
74
  with gr.Accordion("Advanced Settings", open=False):
75
  duration = gr.Slider(0, 30, value=10, step=2.5, label="duration", info="Modify the duration in seconds of the output audio file.")
76
  inf = gr.Slider(0, 50, value=20, step=1, label="inference steps", info="Edit the number of denoising steps. A larger number usually leads to higher quality but slower results.")
 
79
  seed = gr.Number(value=25, label="random seed", info="Change the random seed for a different generation result.")
80
  cond = gr.Slider(0.0, 1.0, value=1.0, step=0.1, label="conditioning scale", info="Choose a value between 0 and 1. The larger the more it will take the conditioning into account. Lower values are recommended for more creative prompts.")
81
  guess = gr.Checkbox(label="guess mode", info="Optionally select guess mode. If so, the model will try to recognize the content of the MIDI without the need of a text prompt.")
 
 
82
  btn = gr.Button("Generate")
83
  btn.click(predict, inputs=[midi, prompt, neg_prompt, duration, seed, cond, inf, guidance_scale, guess], outputs=[audio])
84
  gr.Examples(examples=[["S00.mid", "piano", "", 10, 25, 1.0, 20, 2.5, False], ["S00.mid", "violin", "", 10, 25, 1.0, 20, 2.5, False], ["S00.mid", "woman singing, studio recording", "noise", 10, 25, 1.0, 20, 2.5, False], ["S00.mid", "jazz band, clean", "noise", 10, 25, 0.8, 20, 2.5, False], ["S00.mid", "choir", "noise, percussion", 10, 25, 0.7, 20, 2.5, False]], inputs=[midi, prompt, neg_prompt, duration, seed, cond, inf, guidance_scale, guess], fn=run_example, outputs=[midi_synth, audio], cache_examples=True)