Spaces:

robinhad
/

ukrainian-tts

Running

ukrainian-tts / app.py

Yurii Paniv

Add female voice in multispeaker model

8812d27 over 2 years ago

4.46 kB

	import tempfile

	import gradio as gr

	from TTS.utils.synthesizer import Synthesizer
	import requests
	from os.path import exists
	from formatter import preprocess_text
	from datetime import datetime
	from enum import Enum
	import torch


	class StressOption(Enum):
	    """Stress-marking modes; each value is the Ukrainian label used as a radio choice."""

	    # The user places the stress marks in the input text.
	    ManualStress = "Наголоси вручну"
	    # Stress marks are requested from the text preprocessor (labelled Beta).
	    AutomaticStress = "Автоматичні наголоси (Beta)"


	class VoiceOption(Enum):
	    """Selectable voices; each value is the Ukrainian label used as a radio choice."""

	    # Male voice label ("Mykyta").
	    MaleVoice = "Микита (чоловічий)"
	    # Female voice label ("Olena").
	    FemaleVoice = "Олена (жіночий)"


	def download(url, file_name, *, timeout=60):
	    """Fetch ``url`` into ``file_name`` unless that file already exists.

	    The payload is streamed to ``<file_name>.part`` and renamed into place
	    only after the transfer finished successfully, so an HTTP error page or
	    an interrupted transfer is never mistaken for a cached file on the next
	    run.

	    Args:
	        url: Address to download from; redirects are followed.
	        file_name: Destination path. If it already exists nothing is fetched.
	        timeout: Seconds passed to ``requests.get`` as its ``timeout``.

	    Raises:
	        requests.HTTPError: If the server answers with an error status.
	        requests.RequestException: On connection problems or timeouts.
	        OSError: If the destination cannot be written.
	    """
	    import os  # local import: the file header only imports `exists` from os.path

	    if exists(file_name):
	        print(f"Found {file_name}. Skipping download...")
	        return

	    print(f"Downloading {file_name}")
	    partial_name = f"{file_name}.part"
	    try:
	        with requests.get(
	            url, allow_redirects=True, stream=True, timeout=timeout
	        ) as r:
	            # Fail loudly instead of saving an error page as the model file.
	            r.raise_for_status()
	            with open(partial_name, "wb") as file:
	                # Stream in 1 MiB chunks rather than holding the body in memory.
	                for chunk in r.iter_content(chunk_size=1 << 20):
	                    file.write(chunk)
	        # Publish the file under its final name only once it is complete.
	        os.replace(partial_name, file_name)
	    finally:
	        # After a successful rename the partial file is gone; otherwise clean up.
	        if exists(partial_name):
	            os.remove(partial_name)


	# Fetch the model artifacts of the pinned GitHub release (skipped when cached).
	print("downloading uk/mykyta/vits-tts")
	release_number = "v2.0.0"
	model_link = f"https://github.com/robinhad/ukrainian-tts/releases/download/{release_number}/model-inference.pth"
	config_link = f"https://github.com/robinhad/ukrainian-tts/releases/download/{release_number}/config.json"
	speakers_link = f"https://github.com/robinhad/ukrainian-tts/releases/download/{release_number}/speakers.pth"

	# Local file names the artifacts are stored under.
	model_path, config_path, speakers_path = "model.pth", "config.json", "speakers.pth"

	# Same order as before: model, config, speakers.
	for _url, _target in zip(
	    (model_link, config_link, speakers_link),
	    (model_path, config_path, speakers_path),
	):
	    download(_url, _target)

	# Visitor-counter image embedded in the interface's article text.
	badge = "https://visitor-badge-reloaded.herokuapp.com/badge?page_id=robinhad.ukrainian-tts"

	# Build the synthesizer once at import time; tts() reuses this instance.
	# NOTE(review): all arguments are positional. The first three are the
	# downloaded model, config and speakers files; which parameters the two
	# trailing None values bind to depends on the installed TTS version — confirm.
	synthesizer = Synthesizer(
	    model_path,
	    config_path,
	    speakers_path,
	    None,
	    None,
	)
	# No `is None` check follows: a constructor call either returns an instance
	# or raises, so such a check could never trigger.


	def tts(text: str, voice: str, stress: str):
	    """Synthesize speech for ``text`` and return the audio path and final text.

	    Args:
	        text: Raw input text from the UI.
	        voice: Voice label. ``VoiceOption.MaleVoice.value`` selects speaker
	            ``"male1"``; any other value selects ``"female3"``.
	        stress: Stress label. ``StressOption.AutomaticStress.value`` enables
	            the autostress flag passed to ``preprocess_text``; any other
	            value disables it.

	    Returns:
	        A ``(wav_path, text)`` tuple: the name of a temporary ``.wav`` file
	        (created with ``delete=False``, so this function does not remove
	        it) and the preprocessed text, cut to at most 1200 characters.
	    """
	    from datetime import timezone  # local import: file header only imports `datetime`

	    print("============================")
	    print("Original text:", text)
	    print("Voice", voice)
	    print("Stress:", stress)
	    # Timezone-aware replacement for the deprecated datetime.utcnow().
	    print("Time:", datetime.now(timezone.utc))

	    autostress = stress == StressOption.AutomaticStress.value
	    speaker_name = "male1" if voice == VoiceOption.MaleVoice.value else "female3"

	    text_limit = 1200
	    # Slicing is a no-op for shorter text; mitigate crashes on hf space.
	    text = preprocess_text(text, autostress)[:text_limit]
	    print("Converted:", text)

	    # Synthesize before creating the output file so that a failing synthesis
	    # does not leave an empty, never-deleted temporary file behind.
	    with torch.no_grad():
	        wavs = synthesizer.tts(text, speaker_name=speaker_name)

	    with tempfile.NamedTemporaryFile(suffix=".wav", delete=False) as fp:
	        synthesizer.save_wav(wavs, fp)
	    return fp.name, text


	# Input widgets, created in the order they appear in the form.
	_text_input = gr.inputs.Textbox(
	    label="Input",
	    default="Введ+іть, б+удь л+аска, сво+є р+ечення.",
	)
	_voice_input = gr.inputs.Radio(
	    label="Голос",
	    choices=[option.value for option in VoiceOption],
	)
	_stress_input = gr.inputs.Radio(
	    label="Наголоси",
	    choices=[option.value for option in StressOption],
	)

	# Output widgets: the audio and the text that was actually synthesized.
	_audio_output = gr.outputs.Audio(label="Output")
	_text_output = gr.outputs.Textbox(label="Наголошений текст")

	# Footer text: support link, repository link and the visitor badge image.
	_article = "".join(
	    (
	        "Якщо вам подобається, підтримайте за посиланням: [SUPPORT LINK](https://send.monobank.ua/jar/48iHq4xAXm), ",
	        "Github: [https://github.com/robinhad/ukrainian-tts](https://github.com/robinhad/ukrainian-tts)",
	        f'<center><img src="{badge}" alt="visitors badge"/></center>',
	    )
	)

	# Example rows as (text, voice, stress); enum members become labels below.
	_example_rows = (
	    ("Введ+іть, б+удь л+аска, сво+є р+ечення.", VoiceOption.FemaleVoice, StressOption.ManualStress),
	    ("Введ+іть, б+удь л+аска, сво+є р+ечення.", VoiceOption.MaleVoice, StressOption.ManualStress),
	    ("Введіть, будь ласка, своє речення.", VoiceOption.MaleVoice, StressOption.ManualStress),
	    ("Привіт, як тебе звати?", VoiceOption.FemaleVoice, StressOption.AutomaticStress),
	    ("Договір підписано 4 квітня 1949 року.", VoiceOption.FemaleVoice, StressOption.AutomaticStress),
	)

	iface = gr.Interface(
	    fn=tts,
	    inputs=[_text_input, _voice_input, _stress_input],
	    outputs=[_audio_output, _text_output],
	    title="🐸💬🇺🇦 - Coqui TTS",
	    theme="huggingface",
	    description="Україномовний🇺🇦 TTS за допомогою Coqui TTS (для наголосу використовуйте + перед голосною)",
	    article=_article,
	    examples=[
	        [sample, voice_choice.value, stress_choice.value]
	        for sample, voice_choice, stress_choice in _example_rows
	    ],
	)
	# Start the app with the same launch flags as before.
	iface.launch(enable_queue=True, prevent_thread_lock=True)