add vocos config to hub
Browse files
- Dockerfile +2 -0
- config_22khz.yaml +0 -24
- infer_onnx.py +1 -1
Dockerfile
CHANGED
@@ -44,6 +44,8 @@ RUN huggingface-cli download BSC-LT/matcha-tts-cat-onnx matcha_multispeaker_cat_
|
|
44 |
|
45 |
RUN huggingface-cli download BSC-LT/vocos-mel-22khz-onnx mel_spec_22khz_v2.onnx --local-dir $HOME/app/
|
46 |
|
|
|
|
|
47 |
COPY --chown=user . $HOME/app/
|
48 |
|
49 |
# Fix ownership issues
|
|
|
44 |
|
45 |
RUN huggingface-cli download BSC-LT/vocos-mel-22khz-onnx mel_spec_22khz_v2.onnx --local-dir $HOME/app/
|
46 |
|
47 |
+
RUN huggingface-cli download BSC-LT/vocos-mel-22khz-onnx config.yaml --local-dir $HOME/app/
|
48 |
+
|
49 |
COPY --chown=user . $HOME/app/
|
50 |
|
51 |
# Fix ownership issues
|
config_22khz.yaml
DELETED
@@ -1,24 +0,0 @@
|
|
1 |
-
feature_extractor:
|
2 |
-
class_path: vocos.feature_extractors.MelSpectrogramFeatures
|
3 |
-
init_args:
|
4 |
-
sample_rate: 22050
|
5 |
-
n_fft: 1024
|
6 |
-
hop_length: 256
|
7 |
-
n_mels: 80
|
8 |
-
padding: center
|
9 |
-
|
10 |
-
backbone:
|
11 |
-
class_path: vocos.models.VocosBackbone
|
12 |
-
init_args:
|
13 |
-
input_channels: 80
|
14 |
-
dim: 512
|
15 |
-
intermediate_dim: 1536
|
16 |
-
num_layers: 8
|
17 |
-
|
18 |
-
head:
|
19 |
-
class_path: vocos.heads.ISTFTHead
|
20 |
-
init_args:
|
21 |
-
dim: 512
|
22 |
-
n_fft: 1024
|
23 |
-
hop_length: 256
|
24 |
-
padding: center
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
infer_onnx.py
CHANGED
@@ -33,7 +33,7 @@ def process_text(i: int, text: str, device: torch.device):
|
|
33 |
MODEL_PATH_MATCHA_MEL="matcha_multispeaker_cat_opset_15_10_steps_lastwords.onnx"
|
34 |
MODEL_PATH_MATCHA="matcha_hifigan_multispeaker_cat.onnx"
|
35 |
MODEL_PATH_VOCOS="mel_spec_22khz_v2.onnx"
|
36 |
-
CONFIG_PATH="config_22khz.yaml"
|
37 |
SPEAKER_ID_DICT="spk_to_id.json"
|
38 |
|
39 |
sess_options = onnxruntime.SessionOptions()
|
|
|
33 |
MODEL_PATH_MATCHA_MEL="matcha_multispeaker_cat_opset_15_10_steps_lastwords.onnx"
|
34 |
MODEL_PATH_MATCHA="matcha_hifigan_multispeaker_cat.onnx"
|
35 |
MODEL_PATH_VOCOS="mel_spec_22khz_v2.onnx"
|
36 |
+
CONFIG_PATH="config.yaml"
|
37 |
SPEAKER_ID_DICT="spk_to_id.json"
|
38 |
|
39 |
sess_options = onnxruntime.SessionOptions()
|