"""Gradio demo app for Music Mixing Style Transfer."""

import argparse
import copy
import json
import os
import warnings
from typing import Optional, Tuple

import gradio as gr
import librosa
import librosa.display
import matplotlib.pyplot as plt
import numpy as np
import pyloudnorm as pyln
import pytube as pt
import soundfile as sf
import torch
import tqdm
from dotmap import DotMap
from pytube.exceptions import VideoUnavailable

from models import load_model_with_args
from separate_func import (
    conv_tasnet_separate,
)
from utils import db2linear, mp3_write, normalize

# Directory that receives audio downloaded from YouTube links. It is created
# lazily (on the first download) so importing this module touches no files.
yt_video_dir = os.path.join(".", "yt_dir")


def get_audio_from_yt_video(yt_link: str) -> Tuple[Optional[str], Optional[str]]:
    """Download the first audio-only stream of a YouTube video.

    Args:
        yt_link: URL of the YouTube video entered by the user.

    Returns:
        The path of the downloaded file, twice -- this callback is wired to
        two Gradio output components (the preview player and the upload
        slot). ``(None, None)`` is returned when the link is blank, the video
        is unavailable, or the video exposes no audio-only stream.
    """
    if not yt_link or not yt_link.strip():
        warnings.warn("No YouTube link provided")
        return None, None

    filename = None
    try:
        # ``first()`` yields None instead of raising when no stream matches.
        audio_stream = pt.YouTube(yt_link).streams.filter(only_audio=True).first()
        if audio_stream is None:
            warnings.warn(f"No audio-only stream found at {yt_link}")
        else:
            os.makedirs(yt_video_dir, exist_ok=True)
            # A random name keeps concurrent downloads from clobbering each other.
            # NOTE(review): the file is given a ".wav" suffix regardless of the
            # stream's real container -- confirm downstream loaders sniff the
            # content rather than trusting the extension.
            target = os.path.join(yt_video_dir, os.urandom(8).hex() + ".wav")
            audio_stream.download(filename=target)
            filename = target
    except VideoUnavailable as e:
        warnings.warn(f"Video Not Found at {yt_link} ({e})")
        filename = None

    return filename, filename


def inference(file_uploaded_in, file_uploaded_ref):
    """Placeholder for the mixing style transfer step.

    Args:
        file_uploaded_in: Value of the input-track audio component.
        file_uploaded_ref: Value of the reference-track audio component.

    Returns:
        Always ``None`` for now; no processing is implemented here.
    """
    output_wav = None
    return output_wav


with gr.Blocks() as demo:
    gr.HTML(
        """

Music Mixing Style Transfer

Hugging Face interactive demo of the paper "Music Mixing Style Transfer: A Contrastive Learning Approach to Disentangle Audio Effects" (ICASSP 2023).
a

"""
    )
    with gr.Group():
        with gr.Column():
            # Input track: direct upload, or fetched from a YouTube link.
            with gr.Blocks():
                with gr.Tab("Input Music"):
                    file_uploaded_in = gr.Audio(
                        label="Input track (mix) to be mixing style transferred",
                        type="filepath",
                    )
                with gr.Tab("YouTube url"):
                    with gr.Row():
                        yt_link_in = gr.Textbox(
                            label="Enter YouTube Link of the Video",
                            autofocus=True,
                            lines=3,
                        )
                        yt_btn_in = gr.Button(
                            "Download Audio from YouTube Link", size="lg"
                        )
                    yt_audio_in = gr.Audio(
                        label="Input Audio Extracted from the YouTube Video",
                        interactive=False,
                    )
                    # The download fills both the preview player and the upload slot.
                    yt_btn_in.click(
                        get_audio_from_yt_video,
                        inputs=[yt_link_in],
                        outputs=[yt_audio_in, file_uploaded_in],
                    )
            # Reference track: same layout as the input track.
            with gr.Blocks():
                with gr.Tab("Reference Music"):
                    file_uploaded_ref = gr.Audio(
                        label="Reference track (mix) to copy mixing style",
                        type="filepath",
                    )
                with gr.Tab("YouTube url"):
                    with gr.Row():
                        yt_link_ref = gr.Textbox(
                            label="Enter YouTube Link of the Video",
                            autofocus=True,
                            lines=3,
                        )
                        yt_btn_ref = gr.Button(
                            "Download Audio from YouTube Link", size="lg"
                        )
                    yt_audio_ref = gr.Audio(
                        label="Reference Audio Extracted from the YouTube Video",
                        interactive=False,
                    )
                    yt_btn_ref.click(
                        get_audio_from_yt_video,
                        inputs=[yt_link_ref],
                        outputs=[yt_audio_ref, file_uploaded_ref],
                    )

    with gr.Group():
        gr.HTML(
            """

Mixing Style Transferred Output.

"""
        )
        # The button that triggers inference; it must exist before its click
        # handler is registered below.
        generate_btn = gr.Button("Run Mixing Style Transfer")
        with gr.Row():
            output_mix = gr.File(label="Download style transferred music track")
        generate_btn.click(
            inference,
            inputs=[file_uploaded_in, file_uploaded_ref],
            outputs=[output_mix],
        )


if __name__ == "__main__":
    demo.launch(debug=True)