Spaces:

SohomToom
/

TextToVoiceUsingOpenVoice

Running

SohomToom committed 1 day ago

Commit

b1aa671

verified ·

1 Parent(s): 472f8db

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -36,6 +36,22 @@ def clone_and_speak(text, speaker_wav):
     if not speaker_wav:
         return "Please upload a reference .wav file."
     base_name = f"output_{int(time.time())}_{uuid.uuid4().hex[:6]}"
     tmp_melo_path = f"{output_dir}/{base_name}_tmp.wav"
     final_output_path = f"{output_dir}/{base_name}_converted.wav"

     if not speaker_wav:
         return "Please upload a reference .wav file."
+    import melo.text.english as english
+    original_g2p = english.g2p
+    def patched_g2p(text):
+        phones, tones, word2ph = original_g2p(text)
+        # Fix: wrap ints in list to avoid TypeError
+        word2ph_fixed = []
+        for item in word2ph:
+            if isinstance(item, int):
+                word2ph_fixed.append([item])
+            else:
+                word2ph_fixed.append(item)
+        return phones, tones, word2ph_fixed
+    english.g2p = patched_g2p
     base_name = f"output_{int(time.time())}_{uuid.uuid4().hex[:6]}"
     tmp_melo_path = f"{output_dir}/{base_name}_tmp.wav"
     final_output_path = f"{output_dir}/{base_name}_converted.wav"