Flux9665's picture
Update app.py
1938514
raw
history blame
610 Bytes
import os
import subprocess
from pathlib import Path
# Bootstrap: the IMS-Toucan code is not shipped next to this script. It is
# cloned at start-up and its contents are moved into the working directory,
# which is what makes the `run_*` modules imported below resolvable.
TOUCAN_REPO_URL = "https://github.com/DigitalPhonetics/IMS-Toucan.git"
TOUCAN_RELEASE = "v2.4"
TOUCAN_CHECKOUT = Path("toucan_codebase")

# A checkout directory left over from an earlier start makes `git clone`
# refuse to run, so the clone is only attempted when the directory is absent.
if not TOUCAN_CHECKOUT.exists():
    # check=True: a failed clone stops the script here with the git error,
    # instead of surfacing later as an unrelated ModuleNotFoundError.
    subprocess.run(
        ["git", "clone", "--branch", TOUCAN_RELEASE, TOUCAN_REPO_URL, str(TOUCAN_CHECKOUT)],
        check=True,
    )

# Same selection the shell glob `toucan_codebase/*` makes: every entry whose
# name does not start with a dot. `mv` itself is kept so that overwrite
# behaviour for files already present in the working directory is unchanged.
visible_entries = sorted(
    str(entry)
    for entry in TOUCAN_CHECKOUT.iterdir()
    if not entry.name.startswith(".")
)
if visible_entries:  # nothing left to move on a restart
    subprocess.run(["mv", *visible_entries, "."], check=True)

# These modules only exist once the checkout has been unpacked above, so the
# imports cannot be hoisted to the top of the file.
from run_model_downloader import download_models
from run_gradio_demo import TTSWebUI

# NOTE(review): presumably fetches the model files the demo needs; the
# implementation lives in the cloned repository -- confirm there.
download_models()

# gpu_id="cpu" is passed explicitly. Constructing TTSWebUI is the final
# statement of the script; presumably the constructor itself starts the web
# UI -- confirm against run_gradio_demo.
TTSWebUI(
    gpu_id="cpu",
    title="Design a Speaker",
    article=(
        "We use a GAN to generate a speaker embedding for the TTS to use. "
        "The GAN has a control mechanism integrated, so you can directly "
        "influence the generated embeddings in multiple intuitive ways! "
        "When combining this with a bunch of simple heuristic controls, "
        "there's quite a lot that you can edit."
    ),
)