File size: 610 Bytes
85664f1
 
ee12d4e
85664f1
 
 
 
 
 
1938514
1
2
3
4
5
6
7
8
9
10
import os

# --- Bootstrap: fetch the IMS-Toucan sources into the working directory ---
#
# The imports further down (`run_model_downloader`, `run_gradio_demo`) are
# resolved from the working directory, so the v2.4 checkout is unpacked here
# before they run. Compared to firing the two shell commands blindly, this:
#   * skips the work entirely when the modules are already in place
#     (e.g. the script is started a second time in the same directory),
#   * fails with a clear message when the clone does not succeed, instead of
#     surfacing later as an unrelated-looking ModuleNotFoundError.
_TOUCAN_CHECKOUT_DIR = "toucan_codebase"
_TOUCAN_REQUIRED_MODULES = ("run_model_downloader", "run_gradio_demo")


def _missing_toucan_modules():
    """Return the required module names not yet present in the working directory."""
    return [
        name
        for name in _TOUCAN_REQUIRED_MODULES
        if not (os.path.isfile(name + ".py") or os.path.isdir(name))
    ]


if _missing_toucan_modules():
    # Only clone when there is no earlier checkout; `git clone` refuses to
    # write into an existing non-empty directory.
    if not os.path.isdir(_TOUCAN_CHECKOUT_DIR):
        clone_status = os.system("git clone --branch v2.4 https://github.com/DigitalPhonetics/IMS-Toucan.git toucan_codebase")
        if clone_status != 0:
            raise RuntimeError(
                "Cloning IMS-Toucan v2.4 failed (os.system status "
                + str(clone_status)
                + "); cannot start the demo."
            )

    # The shell glob `*` does not match dotfiles, so hidden entries of the
    # checkout (such as its .git directory) stay behind in toucan_codebase.
    # The exit status of `mv` is intentionally not treated as fatal: what
    # matters is whether the modules needed below actually arrived.
    os.system("mv toucan_codebase/* .")

    _still_missing = _missing_toucan_modules()
    if _still_missing:
        raise RuntimeError(
            "IMS-Toucan sources were not unpacked correctly; missing: "
            + ", ".join(_still_missing)
        )

from run_model_downloader import download_models
from run_gradio_demo import TTSWebUI

# Runs the downloader imported from run_model_downloader before the UI is
# created (presumably fetches the pretrained models -- confirm in IMS-Toucan).
download_models()

# Long description text handed to the web UI as its `article` argument.
demo_article = "We use a GAN to generate a speaker embedding for the TTS to use. The GAN has a control mechanism integrated, so you can directly influence the generated embeddings in multiple intuitive ways! When combining this with a bunch of simple heuristic controls, there's quite a lot that you can edit."

# Instantiate the web UI with the device id set to "cpu".
# NOTE(review): construction alone appears to start the demo; verify against
# run_gradio_demo.TTSWebUI.
TTSWebUI(
    gpu_id="cpu",
    title="Design a Speaker",
    article=demo_article,
)