{
  "_name_or_path": "Bingsu/torchaudio_tacotron2",
  "architectures": [
    "Tacotron2Model"
  ],
  "attention_dropout": 0.1,
  "attention_hidden_dim": 128,
  "attention_location_kernel_size": 31,
  "attention_location_n_filter": 32,
  "attention_rnn_dim": 1024,
  "auto_map": {
    "AutoConfig": "modeling_tacotron2.Tacotron2Config",
    "AutoModel": "modeling_tacotron2.Tacotron2Model",
    "AutoModelForPreTraining": "modeling_tacotron2.Tacotron2ForPreTraining"
  },
  "decoder_dropout": 0.1,
  "decoder_early_stopping": true,
  "decoder_max_step": 2000,
  "decoder_rnn_dim": 1024,
  "encoder_embedding_dim": 512,
  "encoder_kernel_size": 5,
  "encoder_n_convolution": 3,
  "gate_threshold": 0.5,
  "mask_padding": false,
  "n_frames_per_step": 1,
  "n_mels": 80,
  "n_symbol": 392,
  "postnet_embedding_dim": 512,
  "postnet_kernel_size": 5,
  "postnet_n_convolution": 5,
  "prenet_dim": 256,
  "symbol_embedding_dim": 512,
  "torch_dtype": "float32",
  "transformers_version": "4.25.1"
}