Spaces:

r3gm
/

rvc_zero

Running on Zero

App Files Community

Vgjkmhf committed on Oct 14

Commit

ab6aa32

verified ·

1 Parent(s): 54f012e

Update app.py

Browse files

Files changed (1) hide show

app.py +36 -38

app.py CHANGED Viewed

@@ -66,7 +66,7 @@ for url, filename in zip(test_model.split(", "), test_names):
 title = "<center><strong><font size='7'>RVC⚡ZERO</font></strong></center>"
 description = "This demo is provided for educational and research purposes only. The authors and contributors of this project do not endorse or encourage any misuse or unethical use of this software. Any use of this software for purposes other than those intended is solely at the user's own risk. The authors and contributors shall not be held responsible for any damages or liabilities arising from the use of this demo inappropriately." if IS_ZERO_GPU else ""
-RESOURCES = "- You can also try `RVC⚡ZERO` in Colab’s free tier, which provides free GPU [link](https://github.com/R3gm/rvc_zero_ui?tab=readme-ov-file#rvczero)."
 theme = args.theme
 delete_cache_time = (3200, 3200) if IS_ZERO_GPU else (86400, 86400)
@@ -367,7 +367,7 @@ def run(
     steps,
 ):
     if not audio_files:
-        raise ValueError("The audio pls")
     if isinstance(audio_files, str):
         audio_files = [audio_files]
@@ -411,7 +411,7 @@ def run(
 def audio_conf():
     return gr.File(
-        label="Audio files",
         file_count="multiple",
         type="filepath",
         container=True,
@@ -420,9 +420,10 @@ def audio_conf():
 def model_conf():
     return gr.File(
-        label="Model file",
         type="filepath",
         height=130,
     )
@@ -430,7 +431,7 @@ def pitch_algo_conf():
     return gr.Dropdown(
         PITCH_ALGO_OPT,
         value=PITCH_ALGO_OPT[4],
-        label="Pitch algorithm",
         visible=True,
         interactive=True,
     )
@@ -438,7 +439,7 @@ def pitch_algo_conf():
 def pitch_lvl_conf():
     return gr.Slider(
-        label="Pitch level",
         minimum=-24,
         maximum=24,
         step=1,
@@ -450,9 +451,10 @@ def pitch_lvl_conf():
 def index_conf():
     return gr.File(
-        label="Index file",
         type="filepath",
         height=130,
     )
@@ -460,7 +462,7 @@ def index_inf_conf():
     return gr.Slider(
         minimum=0,
         maximum=1,
-        label="Index influence",
         value=0.75,
     )
@@ -469,7 +471,7 @@ def respiration_filter_conf():
     return gr.Slider(
         minimum=0,
         maximum=7,
-        label="Respiration median filtering",
         value=3,
         step=1,
         interactive=True,
@@ -480,7 +482,7 @@ def envelope_ratio_conf():
     return gr.Slider(
         minimum=0,
         maximum=1,
-        label="Envelope ratio",
         value=0.25,
         interactive=True,
     )
@@ -490,7 +492,7 @@ def consonant_protec_conf():
     return gr.Slider(
         minimum=0,
         maximum=0.5,
-        label="Consonant breath protection",
         value=0.5,
         interactive=True,
     )
@@ -498,14 +500,14 @@ def consonant_protec_conf():
 def button_conf():
     return gr.Button(
-        "Inference",
         variant="primary",
     )
 def output_conf():
     return gr.File(
-        label="Result",
         file_count="multiple",
         interactive=False,
     )
@@ -514,15 +516,14 @@ def output_conf():
 def active_tts_conf():
     return gr.Checkbox(
         False,
-        label="TTS",
-        # info="",
         container=False,
     )
 def tts_voice_conf():
     return gr.Dropdown(
-        label="tts voice",
         choices=voices,
         visible=False,
         value="en-US-EmmaMultilingualNeural-Female",
@@ -532,8 +533,8 @@ def tts_voice_conf():
 def tts_text_conf():
     return gr.Textbox(
         value="",
-        placeholder="Write the text here...",
-        label="Text",
         visible=False,
         lines=3,
     )
@@ -541,7 +542,7 @@ def tts_text_conf():
 def tts_button_conf():
     return gr.Button(
-        "Process TTS",
         variant="secondary",
         visible=False,
     )
@@ -550,8 +551,7 @@ def tts_button_conf():
 def tts_play_conf():
     return gr.Checkbox(
         False,
-        label="Play",
-        # info="",
         container=False,
         visible=False,
     )
@@ -561,7 +561,6 @@ def sound_gui():
     return gr.Audio(
         value=None,
         type="filepath",
-        # format="mp3",
         autoplay=True,
         visible=True,
         interactive=False,
@@ -573,7 +572,7 @@ def steps_conf():
     return gr.Slider(
         minimum=1,
         maximum=3,
-        label="Steps",
         value=1,
         step=1,
         interactive=True,
@@ -582,7 +581,7 @@ def steps_conf():
 def format_output_gui():
     return gr.Dropdown(
-        label="Format output:",
         choices=["wav", "mp3", "flac"],
         value="wav",
     )
@@ -590,8 +589,7 @@ def format_output_gui():
 def denoise_conf():
     return gr.Checkbox(
         False,
-        label="Denoise",
-        # info="",
         container=False,
         visible=True,
     )
@@ -600,8 +598,7 @@ def denoise_conf():
 def effects_conf():
     return gr.Checkbox(
         False,
-        label="Reverb",
-        # info="",
         container=False,
         visible=True,
     )
@@ -636,8 +633,7 @@ def show_components_tts(value_active):
 def down_active_conf():
     return gr.Checkbox(
         False,
-        label="URL-to-Model",
-        # info="",
         container=False,
     )
@@ -645,8 +641,8 @@ def down_active_conf():
 def down_url_conf():
     return gr.Textbox(
         value="",
-        placeholder="Write the url here...",
-        label="Enter URL",
         visible=False,
         lines=1,
     )
@@ -654,7 +650,7 @@ def down_url_conf():
 def down_button_conf():
     return gr.Button(
-        "Process",
         variant="secondary",
         visible=False,
     )
@@ -671,7 +667,7 @@ def show_components_down(value_active):
 CSS = """
 #audio_tts {
-  visibility: hidden;   /* invisible but still takes space */
   height: 0px;
   width: 0px;
   max-width: 0px;
@@ -705,7 +701,6 @@ def get_gui(theme):
         )
         aud = audio_conf()
-        # gr.HTML("<hr>")
         tts_button.click(
             fn=infer_tts_audio,
@@ -713,9 +708,12 @@ def get_gui(theme):
             outputs=[aud, tts_play],
         )
         down_active_gui = down_active_conf()
         down_info = gr.Markdown(
-            f"Provide a link to a zip file, like this one: `https://huggingface.co/MrDawg/ToothBrushing/resolve/main/ToothBrushing.zip?download=true`, or separate links with a comma for the .pth and .index files, like this: `{test_model}`",
             visible=False
         )
         with gr.Row():
@@ -741,7 +739,7 @@ def get_gui(theme):
             [model, indx]
         )
-        with gr.Accordion(label="Advanced settings", open=False):
             algo = pitch_algo_conf()
             algo_lvl = pitch_lvl_conf()
             indx_inf = index_inf_conf()
@@ -853,4 +851,4 @@ if __name__ == "__main__":
         quiet=False,
         debug=IS_COLAB,
         ssr_mode=False,
-    )

 title = "<center><strong><font size='7'>RVC⚡ZERO</font></strong></center>"
 description = "This demo is provided for educational and research purposes only. The authors and contributors of this project do not endorse or encourage any misuse or unethical use of this software. Any use of this software for purposes other than those intended is solely at the user's own risk. The authors and contributors shall not be held responsible for any damages or liabilities arising from the use of this demo inappropriately." if IS_ZERO_GPU else ""
+RESOURCES = "- You can also try `RVC⚡ZERO` in Colab's free tier, which provides free GPU [link](https://github.com/R3gm/rvc_zero_ui?tab=readme-ov-file#rvczero)."
 theme = args.theme
 delete_cache_time = (3200, 3200) if IS_ZERO_GPU else (86400, 86400)
     steps,
 ):
     if not audio_files:
+        raise ValueError("لطفا فایل صوتی آپلود کنید")
     if isinstance(audio_files, str):
         audio_files = [audio_files]
 def audio_conf():
     return gr.File(
+        label="فایل‌های صوتی",
         file_count="multiple",
         type="filepath",
         container=True,
 def model_conf():
     return gr.File(
+        label="آپلود مدل (.pth)",
         type="filepath",
         height=130,
+        file_types=[".pth"],
     )
     return gr.Dropdown(
         PITCH_ALGO_OPT,
         value=PITCH_ALGO_OPT[4],
+        label="الگوریتم پیچ",
         visible=True,
         interactive=True,
     )
 def pitch_lvl_conf():
     return gr.Slider(
+        label="سطح پیچ",
         minimum=-24,
         maximum=24,
         step=1,
 def index_conf():
     return gr.File(
+        label="آپلود فایل ایندکس (.index) - اختیاری",
         type="filepath",
         height=130,
+        file_types=[".index"],
     )
     return gr.Slider(
         minimum=0,
         maximum=1,
+        label="تاثیر ایندکس",
         value=0.75,
     )
     return gr.Slider(
         minimum=0,
         maximum=7,
+        label="فیلتر میانه تنفس",
         value=3,
         step=1,
         interactive=True,
     return gr.Slider(
         minimum=0,
         maximum=1,
+        label="نسبت پوششی",
         value=0.25,
         interactive=True,
     )
     return gr.Slider(
         minimum=0,
         maximum=0.5,
+        label="محافظت تنفس صامت",
         value=0.5,
         interactive=True,
     )
 def button_conf():
     return gr.Button(
+        "اجرای تبدیل صدا",
         variant="primary",
     )
 def output_conf():
     return gr.File(
+        label="نتیجه",
         file_count="multiple",
         interactive=False,
     )
 def active_tts_conf():
     return gr.Checkbox(
         False,
+        label="فعال‌سازی TTS",
         container=False,
     )
 def tts_voice_conf():
     return gr.Dropdown(
+        label="صدای TTS",
         choices=voices,
         visible=False,
         value="en-US-EmmaMultilingualNeural-Female",
 def tts_text_conf():
     return gr.Textbox(
         value="",
+        placeholder="متن خود را اینجا بنویسید...",
+        label="متن",
         visible=False,
         lines=3,
     )
 def tts_button_conf():
     return gr.Button(
+        "تولید TTS",
         variant="secondary",
         visible=False,
     )
 def tts_play_conf():
     return gr.Checkbox(
         False,
+        label="پخش",
         container=False,
         visible=False,
     )
     return gr.Audio(
         value=None,
         type="filepath",
         autoplay=True,
         visible=True,
         interactive=False,
     return gr.Slider(
         minimum=1,
         maximum=3,
+        label="تعداد مراحل",
         value=1,
         step=1,
         interactive=True,
 def format_output_gui():
     return gr.Dropdown(
+        label="فرمت خروجی:",
         choices=["wav", "mp3", "flac"],
         value="wav",
     )
 def denoise_conf():
     return gr.Checkbox(
         False,
+        label="حذف نویز",
         container=False,
         visible=True,
     )
 def effects_conf():
     return gr.Checkbox(
         False,
+        label="افکت‌های صوتی (Reverb)",
         container=False,
         visible=True,
     )
 def down_active_conf():
     return gr.Checkbox(
         False,
+        label="دانلود مدل از URL",
         container=False,
     )
 def down_url_conf():
     return gr.Textbox(
         value="",
+        placeholder="آدرس URL را اینجا وارد کنید...",
+        label="وارد کردن URL",
         visible=False,
         lines=1,
     )
 def down_button_conf():
     return gr.Button(
+        "دانلود مدل",
         variant="secondary",
         visible=False,
     )
 CSS = """
 #audio_tts {
+  visibility: hidden;
   height: 0px;
   width: 0px;
   max-width: 0px;
         )
         aud = audio_conf()
         tts_button.click(
             fn=infer_tts_audio,
             outputs=[aud, tts_play],
         )
+        gr.Markdown("### 📁 آپلود مدل")
+        gr.Markdown("می‌توانید فایل مدل .pth و فایل ایندکس .index را مستقیما آپلود کنید یا از URL دانلود کنید")
         down_active_gui = down_active_conf()
         down_info = gr.Markdown(
+            f"لینک فایل zip مانند: `https://huggingface.co/MrDawg/ToothBrushing/resolve/main/ToothBrushing.zip?download=true` یا لینک‌های جدا شده با کاما برای فایل‌های .pth و .index مانند: `{test_model}`",
             visible=False
         )
         with gr.Row():
             [model, indx]
         )
+        with gr.Accordion(label="تنظیمات پیشرفته", open=False):
             algo = pitch_algo_conf()
             algo_lvl = pitch_lvl_conf()
             indx_inf = index_inf_conf()
         quiet=False,
         debug=IS_COLAB,
         ssr_mode=False,
+    )