SohomToom commited on
Commit
a854620
·
verified ·
1 Parent(s): 925b582

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +14 -14
app.py CHANGED
@@ -36,21 +36,21 @@ def clone_and_speak(text, speaker_wav):
36
  if not speaker_wav:
37
  return "Please upload a reference .wav file."
38
 
39
- import melo.text.english as english
40
- original_g2p = english.g2p
41
 
42
- def patched_g2p(text):
43
- phones, tones, word2ph = original_g2p(text)
44
- # Fix: wrap ints in list to avoid TypeError
45
- word2ph_fixed = []
46
- for item in word2ph:
47
- if isinstance(item, int):
48
- word2ph_fixed.append([item])
49
- else:
50
- word2ph_fixed.append(item)
51
- return phones, tones, word2ph_fixed
52
 
53
- english.g2p = patched_g2p
54
 
55
  base_name = f"output_{int(time.time())}_{uuid.uuid4().hex[:6]}"
56
  tmp_melo_path = f"{output_dir}/{base_name}_tmp.wav"
@@ -62,7 +62,7 @@ def clone_and_speak(text, speaker_wav):
62
  default_speaker_id = next(iter(speaker_ids.values()))
63
 
64
  # Generate base TTS voice
65
- model.tts_to_file(text, default_speaker_id, tmp_melo_path,"1.0")
66
 
67
  # Use speaker_wav as reference to extract style embedding
68
  from openvoice import se_extractor
 
36
  if not speaker_wav:
37
  return "Please upload a reference .wav file."
38
 
39
+ # import melo.text.english as english
40
+ # original_g2p = english.g2p
41
 
42
+ # def patched_g2p(text):
43
+ # phones, tones, word2ph = original_g2p(text)
44
+ # # Fix: wrap ints in list to avoid TypeError
45
+ # word2ph_fixed = []
46
+ # for item in word2ph:
47
+ # if isinstance(item, int):
48
+ # word2ph_fixed.append([item])
49
+ # else:
50
+ # word2ph_fixed.append(item)
51
+ # return phones, tones, word2ph_fixed
52
 
53
+ # english.g2p = patched_g2p
54
 
55
  base_name = f"output_{int(time.time())}_{uuid.uuid4().hex[:6]}"
56
  tmp_melo_path = f"{output_dir}/{base_name}_tmp.wav"
 
62
  default_speaker_id = next(iter(speaker_ids.values()))
63
 
64
  # Generate base TTS voice
65
+ model.tts_to_file(text, default_speaker_id, tmp_melo_path,speed="1.0")
66
 
67
  # Use speaker_wav as reference to extract style embedding
68
  from openvoice import se_extractor