Spaces:
Running
Running
Tacatron2-TTS
/
pretrained_models
/MelSpectrogramEncoder-834735cd05736696f9a5c70acdba6396
/hyperparams.yaml
sample_rate: 16000 | |
hop_length: 256 | |
win_length: 1024 | |
n_mel_channels: 80 | |
n_fft: 1024 | |
mel_fmin: 0.0 | |
mel_fmax: 8000.0 | |
mel_normalized: False | |
power: 1 | |
norm: "slaney" | |
mel_scale: "slaney" | |
dynamic_range_compression: True | |
# Modules | |
embedding_model: !new:speechbrain.lobes.models.ECAPA_TDNN.ECAPA_TDNN | |
input_size: !ref <n_mel_channels> | |
channels: [1024, 1024, 1024, 1024, 3072] | |
kernel_sizes: [5, 3, 3, 3, 1] | |
dilations: [1, 2, 3, 4, 1] | |
groups: [1, 1, 1, 1, 1] | |
attention_channels: 128 | |
lin_neurons: 192 | |
normalizer: !new:speechbrain.processing.features.InputNormalization | |
norm_type: sentence | |
std_norm: False | |
modules: | |
normalizer: !ref <normalizer> | |
embedding_model: !ref <embedding_model> | |
pretrainer: !new:speechbrain.utils.parameter_transfer.Pretrainer | |
loadables: | |
normalizer: !ref <normalizer> | |
embedding_model: !ref <embedding_model> | |