Spaces:

robinhad
/

ukrainian-tts

Running

ukrainian-tts / app.py

Yurii Paniv

Release 3.0.0

3502c7a over 1 year ago

No virus

4.84 kB

	import tempfile

	import gradio as gr

	from TTS.utils.synthesizer import Synthesizer
	import requests
	from os.path import exists
	from formatter import preprocess_text
	from datetime import datetime
	from enum import Enum
	import torch


	class StressOption(Enum):
	    """Stress-placement modes offered in the UI.

	    Each member's value is the exact label shown in the "Наголоси" radio
	    group; ``tts`` compares the submitted label against these values.
	    """

	    # "Automatic stress (by dictionary)"
	    AutomaticStress = "Автоматичні наголоси (за словником) 📖"
	    # "Automatic stress (using a model)"
	    AutomaticStressWithModel = "Автоматичні наголоси (за допомогою моделі) 🧮"


	class VoiceOption(Enum):
	    """Voices offered in the UI.

	    Each member's value is the exact label shown in the "Голос" radio
	    group; ``tts`` maps the submitted label to a speaker name.
	    """

	    # "Olena (female)"
	    Olena = "Олена (жіночий) 👩"
	    # "Mykyta (male)"
	    Mykyta = "Микита (чоловічий) 👨"
	    # "Lada (female)"
	    Lada = "Лада (жіночий) 👩"


	def download(url, file_name):
	    """Download ``url`` to ``file_name`` unless that file already exists.

	    Args:
	        url: HTTP(S) address of the file to fetch; redirects are followed.
	        file_name: Local destination path. If it already exists, nothing is
	            fetched and the file is left untouched.

	    Raises:
	        requests.HTTPError: If the server answers with an error status.
	            Nothing is written to ``file_name`` in that case, so a later
	            run retries instead of treating an error page as the file.
	        requests.RequestException: On connection problems or timeouts.
	    """
	    import os  # local import: only `os.path.exists` is imported at file level

	    if exists(file_name):
	        print(f"Found {file_name}. Skipping download...")
	        return

	    print(f"Downloading {file_name}")
	    # Write to a side file first and rename at the end, so an interrupted
	    # transfer never leaves a truncated `file_name` that the next run would
	    # mistake for a complete download. A leftover ".part" file is simply
	    # overwritten on the next attempt.
	    partial_name = f"{file_name}.part"
	    with requests.get(
	        url, allow_redirects=True, stream=True, timeout=60
	    ) as response:
	        response.raise_for_status()
	        with open(partial_name, "wb") as file:
	            # Stream in 1 MiB chunks instead of holding the whole body in memory.
	            for chunk in response.iter_content(chunk_size=1024 * 1024):
	                file.write(chunk)
	    os.replace(partial_name, file_name)


	# Fetch the model checkpoint, its config and the speakers file from the
	# GitHub release identified by `release_number`, skipping files already on disk.
	print("downloading uk/mykyta/vits-tts")
	release_number = "v3.0.0-alpha"
	release_base_url = (
	    "https://github.com/robinhad/ukrainian-tts/releases/download/" + release_number
	)
	model_link = release_base_url + "/model-inference.pth"
	config_link = release_base_url + "/config.json"
	speakers_link = release_base_url + "/speakers.pth"

	# Local file names the synthesizer is later constructed from.
	model_path, config_path, speakers_path = "model.pth", "config.json", "speakers.pth"

	for _remote_url, _local_path in (
	    (model_link, model_path),
	    (config_link, config_path),
	    (speakers_link, speakers_path),
	):
	    download(_remote_url, _local_path)

	# Visitor-counter badge image URL; embedded as an <img> in the interface's article HTML.
	badge = "https://visitor-badge-reloaded.herokuapp.com/badge?page_id=robinhad.ukrainian-tts"

	# Build the shared synthesizer once at import time from the downloaded files.
	# The first three positional arguments are the checkpoint, config and speakers
	# file; the two trailing `None`s are presumably the optional languages file
	# and vocoder checkpoint - confirm against the installed TTS version.
	synthesizer = Synthesizer(
	    model_path,
	    config_path,
	    speakers_path,
	    None,
	    None,
	)

	# NOTE(review): a successful constructor call normally cannot yield None, so
	# this guard looks unreachable; load failures would surface as exceptions above.
	if synthesizer is None:
	    raise NameError("model not found")


	def tts(text: str, voice: str, stress: str):
	    """Synthesize speech for ``text`` and return the audio file plus the text used.

	    Args:
	        text: Raw user input.
	        voice: Label of the chosen voice (a ``VoiceOption`` value). Any other
	            value falls back to the "mykyta" speaker.
	        stress: Label of the chosen stress mode (a ``StressOption`` value).
	            Only ``AutomaticStressWithModel`` switches model-based stressing
	            on; every other value (presumably including ``None`` when no
	            radio option is selected - confirm) leaves it off.

	    Returns:
	        A ``(wav_path, processed_text)`` tuple: the path of a temporary
	        ``.wav`` file holding the synthesized audio, and the preprocessed,
	        length-limited text that was actually synthesized.
	    """
	    from datetime import timezone  # local import: file level only imports `datetime`

	    print("============================")
	    print("Original text:", text)
	    print("Voice", voice)
	    print("Stress:", stress)
	    # Timezone-aware UTC timestamp; `datetime.utcnow()` is deprecated and naive.
	    print("Time:", datetime.now(timezone.utc))

	    autostress_with_model = stress == StressOption.AutomaticStressWithModel.value

	    # Map UI labels to the model's speaker names; unknown labels use "mykyta".
	    speaker_by_voice = {
	        VoiceOption.Olena.value: "olena",
	        VoiceOption.Lada.value: "lada",
	    }
	    speaker_name = speaker_by_voice.get(voice, "mykyta")

	    text = preprocess_text(text, autostress_with_model)
	    text_limit = 7200
	    # Cap the synthesized text length to mitigate crashes on the HF Space.
	    text = text[:text_limit]
	    print("Converted:", text)

	    # delete=False: the file must outlive this function so the caller can
	    # read the audio from the returned path.
	    with tempfile.NamedTemporaryFile(suffix=".wav", delete=False) as fp:
	        with torch.no_grad():  # inference only, no gradients needed
	            wavs = synthesizer.tts(text, speaker_name=speaker_name)
	            synthesizer.save_wav(wavs, fp)
	    return fp.name, text


	# Reuse the README body as the article shown below the demo.
	with open("README.md", encoding="utf-8") as file:
	    article = file.read()

	# The README presumably opens with a "---"-delimited front-matter header;
	# searching from index 4 skips an opening "---\n" and finds the closing one.
	front_matter_end = article.find("---\n", 4)
	if front_matter_end != -1:
	    # +5 drops the 4-character closing delimiter plus the single character
	    # right after it (presumably the newline of a blank line - confirm).
	    article = article[front_matter_end + 5:]
	# Without a closing delimiter the README is used unchanged, rather than
	# silently losing its first four characters.


	# Input widgets, listed in the positional order of `tts(text, voice, stress)`.
	text_input = gr.inputs.Textbox(
	    label="Input",
	    default="Введіть, будь ласка, своє р+ечення.",
	)
	voice_input = gr.inputs.Radio(
	    label="Голос",
	    choices=[voice.value for voice in VoiceOption],
	    default=VoiceOption.Olena.value,
	)
	# No default is declared for the stress mode.
	stress_input = gr.inputs.Radio(
	    label="Наголоси",
	    choices=[mode.value for mode in StressOption],
	)

	# Output widgets, matching the `(wav_path, processed_text)` pair returned by `tts`.
	audio_output = gr.outputs.Audio(label="Output")
	stressed_text_output = gr.outputs.Textbox(label="Наголошений текст")

	# README body followed by the visitor badge image.
	badge_html = f'\n <center><img src="{badge}" alt="visitors badge"/></center>'

	# Every example uses dictionary-based stressing; only sentence and voice vary.
	example_rows = [
	    [sentence, speaker.value, StressOption.AutomaticStress.value]
	    for sentence, speaker in (
	        ("Введіть, будь ласка, своє речення.", VoiceOption.Olena),
	        ("Введіть, будь ласка, своє речення.", VoiceOption.Mykyta),
	        ("Вв+едіть, будь ласка, св+оє реч+ення.", VoiceOption.Mykyta),
	        ("Привіт, як тебе звати?", VoiceOption.Olena),
	        ("Договір підписано 4 квітня 1949 року.", VoiceOption.Lada),
	    )
	]

	iface = gr.Interface(
	    fn=tts,
	    inputs=[text_input, voice_input, stress_input],
	    outputs=[audio_output, stressed_text_output],
	    title="🐸💬🇺🇦 - Coqui TTS",
	    description="Україномовний🇺🇦 TTS за допомогою Coqui TTS (щоб вручну поставити наголос, використовуйте + перед голосною)",
	    article=article + badge_html,
	    examples=example_rows,
	)
	# Start serving the interface with request queueing enabled.
	# NOTE(review): later Gradio releases deprecate `enable_queue` in favour of
	# calling `iface.queue()` first - confirm against the pinned Gradio version.
	iface.launch(enable_queue=True)