JacobLinCool committed on
Commit
3123dc8
1 Parent(s): c212706

Create app.py

Browse files
Files changed (1) hide show
  1. app.py +59 -0
app.py ADDED
@@ -0,0 +1,59 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
import os
import tempfile

import gradio as gr
import soundfile as sf
from gradio_client import Client, handle_file
from joblib import memory
from pydub import AudioSegment
from zerorvc import RVC
7
+
8
# Disk-backed memoization store rooted at ./cache. This rebinds the name
# `memory` from the imported joblib submodule to a Memory instance, which is
# what the `@memory.cache` decorator further down relies on.
memory = memory.Memory(location="cache", verbose=0)

# MODEL_NAME was referenced without ever being defined in this file, which
# raised NameError at import time. Read it from the environment and fail with
# an actionable message when it is missing.
MODEL_NAME = os.environ.get("MODEL_NAME")
if not MODEL_NAME:
    raise RuntimeError(
        "MODEL_NAME is not set; set the MODEL_NAME environment variable to "
        "the RVC model that should be loaded."
    )

# Voice-conversion model shared by every request handled by this process.
rvc = RVC.from_pretrained(MODEL_NAME)
11
+
12
@memory.cache(ignore=["client"])
def split(client, audio):
    """Run the remote ``/separate`` endpoint on *audio*.

    Args:
        client: Object exposing ``predict``; excluded from the cache key via
            ``ignore=["client"]``, so results are memoized on ``audio`` only.
        audio: Value handed to ``handle_file`` before being sent
            (presumably a local file path -- confirm against callers).

    Returns:
        A 2-tuple holding the first and second items of the endpoint result.
        The caller in this file treats them as (vocal, background).
    """
    separated = client.predict(
        param_0=handle_file(audio),
        param_1="BS-RoFormer",
        api_name="/separate",
    )
    first, second = separated[0], separated[1]
    return first, second
20
+
21
def process_audio(client, audio, pitch_modification):
    """Separate *audio*, convert the vocal track, and remix it.

    Args:
        client: Separation client forwarded to ``split``.
        audio: Input audio forwarded to ``split``.
        pitch_modification: Forwarded to ``rvc.convert`` as the keyword
            argument of the same name.

    Returns:
        A 3-tuple of file paths: the remixed MP3, the converted vocal WAV,
        and the background track returned by ``split``.
    """
    vocal_path, bgm = split(client, audio)
    samples = rvc.convert(vocal_path, pitch_modification=pitch_modification)

    # Write into a directory unique to this call. The previous fixed names
    # ("vocal.wav" / "combined.mp3" in the working directory) let concurrent
    # requests overwrite each other's results.
    # NOTE(review): the directory is not removed here because the returned
    # paths must stay readable after this function returns.
    out_dir = tempfile.mkdtemp(prefix="voice-conversion-")
    vocal_out = os.path.join(out_dir, "vocal.wav")
    combined_out = os.path.join(out_dir, "combined.mp3")

    sf.write(vocal_out, samples, rvc.sr)

    converted = AudioSegment.from_wav(vocal_out)
    # Assumes the separation service returns the background as MP3 -- confirm.
    background = AudioSegment.from_mp3(bgm)

    # Lay the converted vocal over the background and encode the mix as MP3.
    mixed = background.overlay(converted)
    mixed.export(combined_out, format="mp3")
    return combined_out, vocal_out, bgm
33
+
34
# Stand-alone Interface wrapper around process_audio.
# NOTE(review): nothing in this file launches `iface`, and it declares two
# inputs while process_audio takes three parameters (client, audio,
# pitch_modification) -- confirm whether this object is still needed.
iface = gr.Interface(
    fn=process_audio,
    inputs=[
        gr.Audio(type="filepath"),
        gr.Slider(minimum=-36, maximum=36, value=0, step=1),
    ],
    outputs=[
        gr.Audio(label="Combined"),
        gr.Audio(label="Vocal"),
        gr.Audio(label="Background"),
    ],
    title="Voice Conversion",
    description="Upload an audio file and process it.",
)
41
+
42
+
43
def set_client_for_session(request: gr.Request):
    """Create the vocal-separation client for one browser session.

    Args:
        request: Incoming Gradio request; only its ``headers`` are read.

    Returns:
        A ``Client`` for "JacobLinCool/vocal-separation". When the request
        carries an ``x-ip-token`` header, its value is forwarded as
        ``X-IP-Token``; otherwise no extra headers are sent.
    """
    # The header can be absent (for example when the app is not served behind
    # the proxy that injects it). Indexing it directly raised KeyError, which
    # left the session without any client at all.
    x_ip_token = request.headers.get("x-ip-token")
    headers = {"X-IP-Token": x_ip_token} if x_ip_token else None
    return Client("JacobLinCool/vocal-separation", headers=headers)
46
+
47
# Blocks UI: one separation client per session, kept in gr.State and filled in
# by set_client_for_session when the page loads.
with gr.Blocks() as demo:
    client = gr.State()
    btn = gr.Button("Run", variant="primary")

    # Components are created in the same order as before so the rendered
    # layout is unchanged; they are only given names for readability.
    audio_input = gr.Audio(type="filepath")
    pitch_input = gr.Slider(minimum=-36, maximum=36, value=0, step=1)
    combined_output = gr.Audio(label="Combined")
    vocal_output = gr.Audio(label="Vocal")
    background_output = gr.Audio(label="Background")

    # gr.Button exposes a `click` listener, not `submit`; calling
    # `btn.submit` raised AttributeError while the UI was being built.
    btn.click(
        process_audio,
        [client, audio_input, pitch_input],
        [combined_output, vocal_output, background_output],
    )

    # Populate the per-session client state on page load.
    demo.load(set_client_for_session, None, client)

demo.launch()