{ | |
"base_config": "egs/vocoder/diffusion/exp_config_base.json", | |
"preprocess": { | |
// acoustic features | |
"extract_mel": true, | |
"extract_audio": true, | |
// Features used for model training | |
"use_mel": true, | |
"use_audio": true, | |
}, | |
"model": { | |
"generator": "diffwave", | |
"diffwave": { | |
"residual_channels": 64, | |
"residual_layers": 30, | |
"dilation_cycle_length": 10, | |
"noise_schedule_factors": [1.0e-4, 0.05, 50], | |
"inference_noise_schedule": [0.0001, 0.001, 0.01, 0.05, 0.2, 0.5], | |
"upsample_factors": [16, 16], | |
} | |
}, | |
"inference": { | |
"batch_size": 1, | |
} | |
} | |