wl-dub / requirements_xtts.txt
r3gm's picture
v0.5.0
b152010
raw
history blame
884 Bytes
# core deps
numpy==1.23.5
cython>=0.29.30
scipy>=1.11.2
torch
torchaudio
soundfile
librosa
scikit-learn
numba
inflect>=5.6.0
tqdm>=4.64.1
anyascii>=0.3.0
pyyaml>=6.0
fsspec>=2023.6.0 # <= 2023.9.1 makes aux tests fail
aiohttp>=3.8.1
packaging>=23.1
# deps for examples
flask>=2.0.1
# deps for inference
pysbd>=0.3.4
# deps for notebooks
umap-learn>=0.5.1
pandas
# deps for training
matplotlib
# coqui stack
trainer>=0.0.32
# config management
coqpit>=0.0.16
# chinese g2p deps
jieba
pypinyin
# deps for korean (romanization)
hangul_romanize
# gruut+supported langs
gruut[de,es,fr]==2.2.3
# deps for korean (g2p)
jamo
nltk
g2pkk>=0.1.1
# deps for bangla
bangla
bnnumerizer
bnunicodenormalizer
# deps for tortoise
einops>=0.6.0
transformers
# deps for bark
encodec>=0.1.1
# deps for XTTS
unidecode>=1.3.2
num2words
spacy[ja]>=3
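# Installation order: install the dependencies listed above first, then
# install TTS itself with --no-deps so pip does not pull in TTS's own
# dependency set over the versions chosen here:
#   pip install -r requirements_xtts.txt
#   pip install TTS==0.21.1 --no-deps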