Update app.py
Browse files
app.py
CHANGED
@@ -36,21 +36,21 @@ def clone_and_speak(text, speaker_wav):
|
|
36 |
if not speaker_wav:
|
37 |
return "Please upload a reference .wav file."
|
38 |
|
39 |
-
import melo.text.english as english
|
40 |
-
original_g2p = english.g2p
|
41 |
|
42 |
-
def patched_g2p(text):
|
43 |
-
|
44 |
-
|
45 |
-
|
46 |
-
|
47 |
-
|
48 |
-
|
49 |
-
|
50 |
-
|
51 |
-
|
52 |
|
53 |
-
english.g2p = patched_g2p
|
54 |
|
55 |
base_name = f"output_{int(time.time())}_{uuid.uuid4().hex[:6]}"
|
56 |
tmp_melo_path = f"{output_dir}/{base_name}_tmp.wav"
|
@@ -62,7 +62,7 @@ def clone_and_speak(text, speaker_wav):
|
|
62 |
default_speaker_id = next(iter(speaker_ids.values()))
|
63 |
|
64 |
# Generate base TTS voice
|
65 |
-
model.tts_to_file(text, default_speaker_id, tmp_melo_path,"1.0")
|
66 |
|
67 |
# Use speaker_wav as reference to extract style embedding
|
68 |
from openvoice import se_extractor
|
|
|
36 |
if not speaker_wav:
|
37 |
return "Please upload a reference .wav file."
|
38 |
|
39 |
+
# import melo.text.english as english
|
40 |
+
# original_g2p = english.g2p
|
41 |
|
42 |
+
# def patched_g2p(text):
|
43 |
+
# phones, tones, word2ph = original_g2p(text)
|
44 |
+
# # Fix: wrap ints in list to avoid TypeError
|
45 |
+
# word2ph_fixed = []
|
46 |
+
# for item in word2ph:
|
47 |
+
# if isinstance(item, int):
|
48 |
+
# word2ph_fixed.append([item])
|
49 |
+
# else:
|
50 |
+
# word2ph_fixed.append(item)
|
51 |
+
# return phones, tones, word2ph_fixed
|
52 |
|
53 |
+
# english.g2p = patched_g2p
|
54 |
|
55 |
base_name = f"output_{int(time.time())}_{uuid.uuid4().hex[:6]}"
|
56 |
tmp_melo_path = f"{output_dir}/{base_name}_tmp.wav"
|
|
|
62 |
default_speaker_id = next(iter(speaker_ids.values()))
|
63 |
|
64 |
# Generate base TTS voice
|
65 |
+
model.tts_to_file(text, default_speaker_id, tmp_melo_path,speed="1.0")
|
66 |
|
67 |
# Use speaker_wav as reference to extract style embedding
|
68 |
from openvoice import se_extractor
|