Voice-Clone-Multilingual

Running

App Files Community

Nymbo committed 4 days ago

Commit

5f6f95d

verified ·

1 Parent(s): e4511d7

Update app.py

Browse files

Files changed (1) hide show

app.py +38 -7

app.py CHANGED Viewed

@@ -7,6 +7,7 @@ if str(APP_ROOT) not in sys.path:
     sys.path.insert(0, str(APP_ROOT))
 import gradio as gr
 import torch
 from TTS.api import TTS
@@ -22,6 +23,31 @@ except ImportError:
             "Failed to build monotonic_align extension; ensure build dependencies are installed."
         ) from exc
 # Get device
 device = "cuda" if torch.cuda.is_available() else "cpu"
@@ -34,12 +60,17 @@ def voice_clone(text: str, speaker_wav: str, language: str):
     tts.tts_to_file(text=text, speaker_wav=speaker_wav, language=language, file_path="output.wav")
     return "output.wav"
-iface = gr.Interface(fn=voice_clone, theme="Nymbo/Nymbo_Theme",
-                     inputs=[gr.Textbox(lines=2, placeholder="Enter the text...", label="Text"),
-                             gr.Audio(type="filepath", label="Upload audio file"),
-                             gr.Radio(['ru', 'en', 'zh-cn', 'ja', 'de', 'fr', 'it', 'pt', 'pl', 'tr', 'ko', 'nl', 'cs', 'ar', 'es', 'hu'], label="language"),
-                            ],
-                     outputs=gr.Audio(type="filepath", label="Generated audio file"),
-                     title="Voice Cloning")
 iface.launch()

     sys.path.insert(0, str(APP_ROOT))
 import gradio as gr
+import gradio_client.utils as grc_utils
 import torch
 from TTS.api import TTS
             "Failed to build monotonic_align extension; ensure build dependencies are installed."
         ) from exc
+# Patch Gradio schema helpers to guard against boolean schemas until upstream fix lands.
+_ORIG_GET_TYPE = getattr(grc_utils, "get_type", None)
+_ORIG_JSON_TO_PY = getattr(grc_utils, "_json_schema_to_python_type", None)
+def _safe_get_type(schema):  # pragma: no cover - runtime patching
+    if isinstance(schema, bool):
+        return "Any" if schema else "Never"
+    if _ORIG_GET_TYPE is None:
+        raise AttributeError("gradio_client.utils.get_type is unavailable")
+    return _ORIG_GET_TYPE(schema)
+def _safe_json_schema_to_python_type(schema, defs=None):  # pragma: no cover
+    if isinstance(schema, bool):
+        return "Any" if schema else "Never"
+    if _ORIG_JSON_TO_PY is None:
+        raise AttributeError("gradio_client.utils._json_schema_to_python_type is unavailable")
+    return _ORIG_JSON_TO_PY(schema, defs)
+if _ORIG_GET_TYPE is not None:
+    grc_utils.get_type = _safe_get_type
+if _ORIG_JSON_TO_PY is not None:
+    grc_utils._json_schema_to_python_type = _safe_json_schema_to_python_type
 # Get device
 device = "cuda" if torch.cuda.is_available() else "cpu"
     tts.tts_to_file(text=text, speaker_wav=speaker_wav, language=language, file_path="output.wav")
     return "output.wav"
+iface = gr.Interface(
+    fn=voice_clone,
+    theme="Nymbo/Nymbo_Theme",
+    inputs=[
+        gr.Textbox(lines=2, placeholder="Enter the text...", label="Text"),
+        gr.Audio(type="filepath", label="Upload audio file"),
+        gr.Radio(['ru', 'en', 'zh-cn', 'ja', 'de', 'fr', 'it', 'pt', 'pl', 'tr', 'ko', 'nl', 'cs', 'ar', 'es', 'hu'], label="language"),
+    ],
+    outputs=gr.Audio(type="filepath", label="Generated audio file"),
+    title="Voice Cloning",
+    allow_flagging="never",
+)
 iface.launch()