Spaces:

kevinwang676
/

OpenVoice

Running

App Files Files Community

kevinwang676 committed on Dec 28, 2023

Commit

39ccbcc

•

1 Parent(s): 7a2bce5

Update app.py

Browse files

Files changed (1) hide show

app.py +41 -1

app.py CHANGED Viewed

@@ -15,6 +15,14 @@ base_speaker_tts.load_ckpt(f'{ckpt_base_en}/checkpoint.pth')
 tone_color_converter = ToneColorConverter(f'{ckpt_converter_en}/config.json', device=device)
 tone_color_converter.load_ckpt(f'{ckpt_converter_en}/checkpoint.pth')
 from tts_voice import tts_order_voice
 import edge_tts
 import gradio as gr
@@ -63,6 +71,26 @@ def vc_en(text, audio_ref, style_mode):
   return "output.wav"
 language_dict = tts_order_voice
 base_speaker = "base_audio.mp3"
@@ -109,11 +137,23 @@ with app:
       with gr.Column():
         out1 = gr.Audio(label="为您合成的专属语音", type="filepath")
     btn1.click(vc_en, [inp1, inp2, inp3], out1)
   with gr.Tab("🌟多语言声音复刻"):
     with gr.Row():
       with gr.Column():
-        inp4 = gr.Textbox(lines=3, label="请输入您想转换的英文文本")
         inp5 = gr.Audio(label="请上传您喜欢的语音文件", type="filepath")
         inp6 = gr.Dropdown(choices=list(language_dict.keys()), value=list(language_dict.keys())[15], label="请选择文本对应的语言")

 tone_color_converter = ToneColorConverter(f'{ckpt_converter_en}/config.json', device=device)
 tone_color_converter.load_ckpt(f'{ckpt_converter_en}/checkpoint.pth')
+# Chinese base speaker: checkpoint directory, TTS model, and default speaker embedding.
+ckpt_base_zh = 'checkpoints/checkpoints/base_speakers/ZH'
+base_speaker_tts_zh = BaseSpeakerTTS(f'{ckpt_base_zh}/config.json', device=device)
+base_speaker_tts_zh.load_ckpt(f'{ckpt_base_zh}/checkpoint.pth')
+# The default Chinese embedding is read from the same ZH directory as the model.
+source_se = torch.load(f'{ckpt_base_zh}/zh_default_se.pth').to(device)
+# NOTE(review): `output_dir` is not defined in the visible part of this file;
+# confirm it exists before this line runs, otherwise importing the app fails.
+save_path = f'{output_dir}/output_chinese.wav'
 from tts_voice import tts_order_voice
 import edge_tts
 import gradio as gr
   return "output.wav"
+def vc_zh(text, audio_ref):
+    """Clone the voice in ``audio_ref`` onto Chinese speech synthesized from ``text``.
+
+    Args:
+        text: Chinese text to synthesize.
+        audio_ref: Path to the reference recording whose tone color is
+            extracted and applied to the synthesized speech.
+
+    Returns:
+        Path of the converted audio file (``"output.wav"``).
+    """
+    # Default Chinese speaker embedding, read from the ZH checkpoint directory.
+    source_se = torch.load(f'{ckpt_base_zh}/zh_default_se.pth').to(device)
+    save_path = "output.wav"
+    src_path = "tmp.wav"
+    # Synthesize with the Chinese base model so the model matches language='Chinese'.
+    base_speaker_tts_zh.tts(text, src_path, speaker='default', language='Chinese', speed=1.0)
+    # Only the embedding is needed; the second return value is unused here.
+    target_se, _ = se_extractor.get_se(audio_ref, tone_color_converter, target_dir='processed', vad=True)
+    # Run the tone color converter.
+    # NOTE(review): `message` is presumably an embedded watermark tag; confirm.
+    tone_color_converter.convert(
+        audio_src_path=src_path,
+        src_se=source_se,
+        tgt_se=target_se,
+        output_path=save_path,
+        message="@MyShell")
+    return save_path
 language_dict = tts_order_voice
 base_speaker = "base_audio.mp3"
       with gr.Column():
         out1 = gr.Audio(label="为您合成的专属语音", type="filepath")
     btn1.click(vc_en, [inp1, inp2, inp3], out1)
+  with gr.Tab("🎶中文声音复刻"):
+    with gr.Row():
+      with gr.Column():
+        inp_zh_1 = gr.Textbox(lines=3, label="请输入您想转换的中文文本")
+        inp_zh_2 = gr.Audio(label="请上传您喜欢的语音文件", type="filepath")
+        btn_zh = gr.Button("开始语音情感真实复刻吧！", variant="primary")
+      with gr.Column():
+        out_zh = gr.Audio(label="为您合成的专属语音", type="filepath")
+    btn_zh.click(vc_zh, [inp_zh_1, inp_zh_2], out_zh)
   with gr.Tab("🌟多语言声音复刻"):
     with gr.Row():
       with gr.Column():
+        inp4 = gr.Textbox(lines=3, label="请输入您想转换的任意语言文本")
         inp5 = gr.Audio(label="请上传您喜欢的语音文件", type="filepath")
         inp6 = gr.Dropdown(choices=list(language_dict.keys()), value=list(language_dict.keys())[15], label="请选择文本对应的语言")