Spaces:

AnnieZzz
/

Quenya-TTS

Sleeping

Quenya-TTS / run_interactive_demo.py

Update app.py and requirements.txt

cd4e2cb verified 3 months ago

1.77 kB

	import os
	import sys
	import warnings

	import torch

	from InferenceInterfaces.ToucanTTSInterface import ToucanTTSInterface
	from Utility.storage_config import MODELS_DIR

	if __name__ == '__main__':
	    # Interactive command-line demo: load a ToucanTTS model once, then
	    # repeatedly prompt for text and hand it to the TTS interface until the
	    # user types 'exit' or closes stdin.
	    warnings.filterwarnings("ignore", category=UserWarning)

	    # --- Configuration (edit these to change what the demo loads) ---
	    PATH_TO_TTS_MODEL = os.path.join(MODELS_DIR, "ToucanTTS_Meta", "best.pt")
	    PATH_TO_VOCODER_MODEL = None  # os.path.join(MODELS_DIR, "BigVGAN", "best.pt")
	    PATH_TO_REFERENCE_SPEAKER = ""  # audios/speaker_references_for_testing/female_high_voice.wav
	    LANGUAGE = "en"
	    device = "cuda" if torch.cuda.is_available() else "cpu"

	    # The faster vocoder is only requested when running on a GPU.
	    tts = ToucanTTSInterface(device=device,
	                             tts_model_path=PATH_TO_TTS_MODEL,
	                             vocoder_model_path=PATH_TO_VOCODER_MODEL,
	                             faster_vocoder=(device == "cuda"))
	    tts.set_language(lang_id=LANGUAGE)

	    # An empty reference path means "no reference audio configured"; a
	    # configured but missing file is reported and otherwise ignored.
	    if PATH_TO_REFERENCE_SPEAKER != "":
	        if os.path.exists(PATH_TO_REFERENCE_SPEAKER):
	            tts.set_utterance_embedding(PATH_TO_REFERENCE_SPEAKER)
	        else:
	            print(f"File {PATH_TO_REFERENCE_SPEAKER} could not be found, please check for typos and re-run. Using default for now.")

	    print("Loading the following configuration:")
	    print(f"\tTTS Model: {PATH_TO_TTS_MODEL}")
	    print(f"\tVocoder Model: {PATH_TO_VOCODER_MODEL}")
	    print(f"\tReference Audio: {PATH_TO_REFERENCE_SPEAKER}")
	    print(f"\tLanguage Used: {LANGUAGE}")
	    print(f"\tDevice Used: {device}")

	    while True:
	        try:
	            text = input("\nWhat should I say? (or 'exit')\n")
	        except EOFError:
	            # stdin was closed (Ctrl-D, or piped input ran out): leave the
	            # demo the same way the 'exit' command does instead of dying
	            # with a traceback.
	            print()
	            sys.exit()
	        if text == "exit":
	            sys.exit()
	        # NOTE(review): the three scaling factors of 1.0 are presumably the
	        # neutral settings, and blocking=False presumably returns before
	        # playback finishes -- confirm against ToucanTTSInterface.read_aloud.
	        tts.read_aloud(text,
	                       view=True,
	                       blocking=False,
	                       duration_scaling_factor=1.0,
	                       energy_variance_scale=1.0,
	                       pitch_variance_scale=1.0)