add examples
app.py
CHANGED
@@ -173,22 +173,26 @@ with gr.Blocks() as demo:
     gr.Markdown("Interactive demo of Inference Time Optimization (ITO) for Music Mastering Style Transfer. \
                 The mastering style transfer is performed by a differentiable audio processing model, and the predicted parameters are shown as the output. \
                 Perform mastering style transfer with an input source audio and a reference mastering style audio. On top of this result, you can perform ITO to optimize the reference embedding $z_{ref}$ to further gain control over the output mastering style.")
-    gr.Image("ito_snow.png", width=
+    gr.Image("ito_snow.png", width=300, height=200, label="ITO pipeline")
 
     gr.Markdown("## Step 1: Mastering Style Transfer")
 
     with gr.Tab("Upload Audio"):
         with gr.Row():
-
-
-
+            use_example_files = gr.Checkbox(label="Use Example Files", value=False)
+
+        with gr.Row():
+            input_audio = gr.Audio(label="Source Audio $x_{in}$", interactive=not use_example_files.value)
+            reference_audio = gr.Audio(label="Reference Style Audio $x_{ref}$", interactive=not use_example_files.value)
+
         # Dropdowns for selecting example files
         with gr.Row():
-            input_example_dropdown = gr.Dropdown(label="Select Input Example", choices=input_examples)
-            reference_example_dropdown = gr.Dropdown(label="Select Reference Example", choices=reference_examples)
+            input_example_dropdown = gr.Dropdown(label="Select Input Example", choices=input_examples, interactive=use_example_files.value)
+            reference_example_dropdown = gr.Dropdown(label="Select Reference Example", choices=reference_examples, interactive=use_example_files.value)
 
         process_button = gr.Button("Process Mastering Style Transfer")
         gr.Markdown('<span style="color: lightgray; font-style: italic;">all output samples are normalized to -12dB</span>')
+        gr.Markdown("all output samples are normalized to -12dB")
 
         with gr.Row():
             with gr.Column():
@@ -196,19 +200,27 @@ with gr.Blocks() as demo:
                 normalized_input = gr.Audio(label="Normalized Source Audio", type='numpy')
                 param_output = gr.Textbox(label="Predicted Parameters", lines=5)
 
-        def process_audio_with_examples(input_audio, reference_audio, input_example, reference_example):
-            if
-
-
-
+        def process_audio_with_examples(input_audio, reference_audio, input_example, reference_example, use_examples):
+            if use_examples:
+                if input_example:
+                    input_audio = sf.read(os.path.join(EXAMPLES_DIR, input_example))[0]
+                if reference_example:
+                    reference_audio = sf.read(os.path.join(EXAMPLES_DIR, reference_example))[0]
             return process_audio(input_audio, reference_audio)
 
         process_button.click(
             process_audio_with_examples,
-            inputs=[input_audio, reference_audio, input_example_dropdown, reference_example_dropdown],
+            inputs=[input_audio, reference_audio, input_example_dropdown, reference_example_dropdown, use_example_files],
             outputs=[output_audio, param_output, normalized_input]
         )
 
+        # Update the interactivity of the audio inputs and dropdowns based on the checkbox
+        use_example_files.change(
+            lambda use_examples: (not use_examples, not use_examples),
+            inputs=[use_example_files],
+            outputs=[input_audio, reference_audio]
+        )
+
     with gr.Tab("YouTube Audio"):
         with gr.Row():
            input_youtube_url = gr.Textbox(label="Input YouTube URL")
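A note on the `use_example_files.change` handler added above: it returns plain booleans to the two `gr.Audio` outputs. In current Gradio releases, the usual way to flip a property such as `interactive` from an event handler is to return component updates rather than raw values. Below is a minimal, self-contained sketch of that pattern, not the Space's actual code; it reuses the component names from the diff and assumes a Gradio version where `gr.update` is available.

import gradio as gr

with gr.Blocks() as sketch:
    use_example_files = gr.Checkbox(label="Use Example Files", value=False)
    input_audio = gr.Audio(label="Source Audio")
    reference_audio = gr.Audio(label="Reference Style Audio")

    def toggle_uploads(use_examples):
        # Return gr.update objects so Gradio changes the components'
        # interactive flag instead of treating the booleans as audio data.
        update = gr.update(interactive=not use_examples)
        return update, update

    use_example_files.change(
        toggle_uploads,
        inputs=[use_example_files],
        outputs=[input_audio, reference_audio],
    )

If the dropdowns should follow the checkbox as well, as the comment in the diff suggests, they would simply be appended to `outputs` with two more updates returned.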
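A second hedged sketch, around the example-loading branch of `process_audio_with_examples`: `soundfile.read` returns a `(data, samplerate)` tuple, whereas Gradio audio components with `type='numpy'` pass values as `(sample_rate, data)`. If `process_audio` expects the Gradio-style tuple (an assumption, since its definition is outside this diff), loading an example file could look like the helper below; `EXAMPLES_DIR` is taken from the diff, and `load_example_as_gradio_audio` is a hypothetical name.

import os
import soundfile as sf

EXAMPLES_DIR = "examples"  # assumed path; the diff only references the name

def load_example_as_gradio_audio(filename):
    # soundfile.read returns (data, samplerate); Gradio's numpy audio
    # convention is the reversed tuple (sample_rate, data).
    data, sample_rate = sf.read(os.path.join(EXAMPLES_DIR, filename))
    return sample_rate, data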