File size: 954 Bytes
605f8dd
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
# General dependencies
# NOTE(review): beautifulsoup4, tqdm, wget, pyyaml and ml_collections carry no
# version specifier, so installs may resolve to different releases over time.
beautifulsoup4
ffmpeg-python>=0.2.0
numpy==1.23.5
requests==2.31.0
tqdm
wget
six>=1.16
samplerate==0.1.0
pyyaml
ml_collections

# Audio processing
# Each distribution is listed exactly once; praat-parselmouth stays pinned.
faiss-cpu==1.7.3
librosa==0.9.2
pydub==0.25.1
pyworld==0.3.4
praat-parselmouth==0.4.2
resampy==0.4.2
scipy==1.11.1
sounddevice==0.4.6
soundfile==0.12.1
torchaudio==2.1.1
noisereduce
audio_upscaler==0.1.4

# Machine learning
# fairseq and numba are selected per platform via environment markers:
# Linux gets the IAHispano fork and an unpinned numba, Windows gets pinned releases.
git+https://github.com/IAHispano/fairseq; sys_platform == 'linux'
fairseq==0.12.2; sys_platform == 'win32'
numba; sys_platform == 'linux'
numba==0.56.4; sys_platform == 'win32'
# NOTE(review): both the CPU (onnxruntime) and GPU (onnxruntime_gpu) distributions
# are requested and only the GPU one is pinned — confirm installing both is intended.
onnxruntime
onnxruntime_gpu==1.15.1
onnx2torch>=1.5
torch==2.1.1
torchcrepe==0.0.22
torchgen>=0.0.1
torch_directml
torchvision==0.16.1
einops
local-attention
onnx>=1.14

# Visualization
# NOTE(review): tensorboard has no version specifier, unlike matplotlib.
matplotlib==3.7.2
tensorboard

# Miscellaneous
# NOTE(review): tensorboardX has no version specifier; julius and diffq only set lower bounds.
ffmpy==0.3.1
tensorboardX
edge-tts==6.1.9
julius>=0.2
diffq>=0.2

# API
# NOTE(review): none of these entries is version-constrained — consider pinning
# for reproducible installs.
pydantic
fastapi
uvicorn