Diana-Bert-VITS2

Running

App Files Files Community

CrawfordZhou committed on Jan 17

Commit

2b7b812

•

1 Parent(s): c23d5e4

Update app.py

Browse files

添加情景语言模式+一些样式调整

Files changed (1) hide show

app.py +17 -15

app.py CHANGED Viewed

@@ -63,10 +63,9 @@ def get_text(text, language_str, hps):
     return bert, phone, tone, language
-def infer(text, key, sdp_ratio, noise_scale, noise_scale_w, length_scale, sid):
     global net_g
-    message = gpt_35_api(key, text)
-    print(message)
     bert, phones, tones, lang_ids = get_text(message, "ZH", hps)
     with torch.no_grad():
         x_tst=phones.to(device).unsqueeze(0)
@@ -81,10 +80,11 @@ def infer(text, key, sdp_ratio, noise_scale, noise_scale_w, length_scale, sid):
         del x_tst, tones, lang_ids, bert, x_tst_lengths, speakers
         return audio
-def tts_fn(text, key, speaker, sdp_ratio, noise_scale, noise_scale_w, length_scale):
     with torch.no_grad():
-        audio = infer(text, key, sdp_ratio=sdp_ratio, noise_scale=noise_scale, noise_scale_w=noise_scale_w, length_scale=length_scale, sid=speaker)
-    return "Success", (hps.data.sampling_rate, audio)
 if __name__ == "__main__":
@@ -127,11 +127,10 @@ if __name__ == "__main__":
         with gr.Row():
             with gr.Column():
                 gr.Markdown(value="""
-                【AI嘉然】在线语音对话版（Bert-Vits2 + gpt）\n
-                （注：转发生成可能较慢，请等待大约2分钟哦！）\n
-                音声作者：Xz乔希 https://space.bilibili.com/5859321\n
-                集成gpt作者：碎语碎念 https://space.bilibili.com/4269384\n
-                声音归属：嘉然今天吃什么 https://space.bilibili.com/672328094\n
                 Bert-VITS2项目：https://github.com/Stardust-minus/Bert-VITS2\n
                 GPT_API_free项目：https://github.com/chatanywhere/GPT_API_free\n
                 本项目中的apiKey可以从https://github.com/chatanywhere/GPT_API_free\n
@@ -141,7 +140,9 @@ if __name__ == "__main__":
                 """)
                 text = gr.TextArea(label="Text", placeholder="Input Text Here",
                                       value="虚拟主播是什么？")
-                key = gr.TextArea(label="GPT Key", placeholder="请输入上面提示中获取的gpt key",
                                    value="izlrijShDu7tp2rIgvYfibcC2J0Eh3uWfdm9ndrxN5nWrL96")
                 speaker = gr.Dropdown(choices=speakers, value=speakers[0], label='Speaker')
                 sdp_ratio = gr.Slider(minimum=0.1, maximum=1, value=0.2, step=0.01, label='SDP/DP混合比')
@@ -151,10 +152,11 @@ if __name__ == "__main__":
                 btn = gr.Button("点击生成", variant="primary")
             with gr.Column():
                 text_output = gr.Textbox(label="Message")
-                audio_output = gr.Audio(label="Output Audio")
         btn.click(tts_fn,
-                inputs=[text, key, speaker, sdp_ratio, noise_scale, noise_scale_w, length_scale],
-                outputs=[text_output, audio_output])
 #    webbrowser.open("http://127.0.0.1:6006")
 #    app.launch(server_port=6006, show_error=True)

     return bert, phone, tone, language
+def infer(text, sdp_ratio, noise_scale, noise_scale_w, length_scale, sid):
     global net_g
+    print(text)
     bert, phones, tones, lang_ids = get_text(message, "ZH", hps)
     with torch.no_grad():
         x_tst=phones.to(device).unsqueeze(0)
         del x_tst, tones, lang_ids, bert, x_tst_lengths, speakers
         return audio
+def tts_fn(text, font, key, speaker, sdp_ratio, noise_scale, noise_scale_w, length_scale):
+    message = gpt_35_api(key, font + text)
     with torch.no_grad():
+        audio = infer(message, sdp_ratio=sdp_ratio, noise_scale=noise_scale, noise_scale_w=noise_scale_w, length_scale=length_scale, sid=speaker)
+    return "Success", (hps.data.sampling_rate, message, audio)
 if __name__ == "__main__":
         with gr.Row():
             with gr.Column():
                 gr.Markdown(value="""
+                #【AI嘉然】在线语音对话版（Bert-Vits2 + gpt）\n
+                ![avatar](https://img2.baidu.com/it/u=624370534,740039074&fm=253&fmt=auto&app=138&f=JPEG?w=200&h=300) \n
+                （注：转发生成可能较慢，请等待大约2分钟哦，目前只支持中文语言的答案，其他语言的支持在开发中捏！）\n
+                作者：[Xz乔希](https://space.bilibili.com/5859321) & [碎语碎念](https://space.bilibili.com/4269384) 声音归属：[嘉然今天吃什么](https://space.bilibili.com/672328094) \n
                 Bert-VITS2项目：https://github.com/Stardust-minus/Bert-VITS2\n
                 GPT_API_free项目：https://github.com/chatanywhere/GPT_API_free\n
                 本项目中的apiKey可以从https://github.com/chatanywhere/GPT_API_free\n
                 """)
                 text = gr.TextArea(label="Text", placeholder="Input Text Here",
                                       value="虚拟主播是什么？")
+                front_text = gr.TextArea(label="请输入情景语言", placeholder="请输入情景语言",
+                              value="你是一个叫嘉然的虚拟主播，")
+                key = gr.Text(label="GPT Key(过期请更换)", placeholder="请输入上面提示中获取的gpt key",
                                    value="izlrijShDu7tp2rIgvYfibcC2J0Eh3uWfdm9ndrxN5nWrL96")
                 speaker = gr.Dropdown(choices=speakers, value=speakers[0], label='Speaker')
                 sdp_ratio = gr.Slider(minimum=0.1, maximum=1, value=0.2, step=0.01, label='SDP/DP混合比')
                 btn = gr.Button("点击生成", variant="primary")
             with gr.Column():
                 text_output = gr.Textbox(label="Message")
+                gpt_output = gr.TextArea(label="嘉然老师的文字回答")
+                audio_output = gr.Audio(label="嘉然老师的语音回答")
         btn.click(tts_fn,
+                inputs=[text, front_text, key, speaker, sdp_ratio, noise_scale, noise_scale_w, length_scale],
+                outputs=[text_output, gpt_output, audio_output])
 #    webbrowser.open("http://127.0.0.1:6006")
 #    app.launch(server_port=6006, show_error=True)