"""Gradio front end that converts text to speech with edge-tts.

The synthesized MP3 is transcoded to WAV with ffmpeg and the WAV path is
handed to the Gradio audio output component.
"""
import asyncio
import contextlib
import os
import tempfile

import anyio  # noqa: F401  (kept from the original module; no longer used here)
import edge_tts
import ffmpeg
import gradio as gr

from tts_voice import tts_order_voice

# Maps the name shown in the dropdown to the edge-tts voice passed to
# ``edge_tts.Communicate``.
language_dict = tts_order_voice

# Position (in ``language_dict`` key order) of the entry pre-selected in the
# dropdown.
_DEFAULT_LANGUAGE_INDEX = 287


def _convert_to_wav(source_path, target_path):
    """Transcode *source_path* to *target_path* with ffmpeg (blocking)."""
    (
        ffmpeg.input(source_path)
        .output(target_path)
        # Without this, ffmpeg prompts on stdin when the target already exists.
        .run(overwrite_output=True)
    )


async def text_to_speech_edge(text, language_code):
    """Synthesize *text* and return the path of the resulting WAV file.

    Args:
        text: The text to speak.
        language_code: A key of ``language_dict``; its value is used as the
            edge-tts voice.

    Returns:
        Path of a WAV file next to the temporary MP3 that was synthesized.
        The file is not deleted by this function.

    Raises:
        KeyError: If *language_code* is not a key of ``language_dict``.
    """
    voice = language_dict[language_code]
    communicate = edge_tts.Communicate(text, voice)

    # Only the unique name is needed; the file is closed again right away so
    # edge-tts can write to the same path.
    with tempfile.NamedTemporaryFile(delete=False, suffix=".mp3") as tmp_file:
        mp3_path = tmp_file.name

    # Swap only the extension; ``str.replace`` would also rewrite any ".mp3"
    # that happens to occur earlier in the path.
    wav_path = os.path.splitext(mp3_path)[0] + ".wav"

    try:
        await communicate.save(mp3_path)
        # ffmpeg's run() blocks until the subprocess exits, so run it in a
        # worker thread rather than stalling the event loop.
        loop = asyncio.get_running_loop()
        await loop.run_in_executor(None, _convert_to_wav, mp3_path, wav_path)
    finally:
        # The intermediate MP3 is never returned to the caller; remove it
        # whether or not synthesis/conversion succeeded.
        with contextlib.suppress(FileNotFoundError):
            os.remove(mp3_path)

    return wav_path


input_text = gr.inputs.Textbox(lines=5, label="輸入文本")
output_audio = gr.outputs.Audio(type="filepath", label="導出文件")

_language_names = list(language_dict.keys())
if len(_language_names) > _DEFAULT_LANGUAGE_INDEX:
    default_language = _language_names[_DEFAULT_LANGUAGE_INDEX]
elif _language_names:
    # Voice table is shorter than expected: fall back to the first entry
    # instead of failing with IndexError at import time.
    default_language = _language_names[0]
else:
    default_language = None

language = gr.inputs.Dropdown(
    choices=_language_names,
    default=default_language,
    label="語言",
)

interface = gr.Interface(
    fn=text_to_speech_edge,
    inputs=[input_text, language],
    outputs=[output_audio],
    title="Edge TTS 文字轉語音",
)


if __name__ == "__main__":
    # ``launch`` is a regular (synchronous) method. Wrapping it in
    # ``anyio.run`` made anyio await its non-awaitable return value once the
    # server shut down, so it is called directly.
    interface.launch()