# Hyperparameters and object definitions for a DiffWave model, written in
# HyperPyYAML: `!new:<class>` instantiates a class with the indented keys below
# it as constructor arguments, and `!ref <key>` reuses a value defined elsewhere
# in this file.
#
# Nested keys are indented by four spaces. The nesting is significant: without
# it every constructor argument would become a (duplicate) top-level key and
# the objects would be built with no arguments.

# --- Diffusion settings -----------------------------------------------------
# Number of diffusion steps; passed to DiffWave as `total_steps` and to
# DiffWaveDiffusion as `timesteps`.
train_timesteps: 50
# Passed to DiffWaveDiffusion as `beta_start` / `beta_end`.
# NOTE(review): presumably the endpoints of the noise schedule -- confirm.
beta_start: 0.0001
beta_end: 0.05

# --- Network settings (forwarded to DiffWave under the same names) ----------
residual_layers: 30
residual_channels: 64
dilation_cycle_length: 10

# Forwarded to DiffWave as `unconditional`.
unconditional: False

# --- Spectrogram settings ---------------------------------------------------
# Passed to DiffWave as `input_channels`.
spec_n_mels: 80
# Not referenced by any other key in this file.
# NOTE(review): presumably read by the code that loads this file -- confirm.
spec_hop_length: 256

# --- Objects ----------------------------------------------------------------
diffwave: !new:speechbrain.lobes.models.DiffWave.DiffWave
    input_channels: !ref <spec_n_mels>
    residual_layers: !ref <residual_layers>
    residual_channels: !ref <residual_channels>
    dilation_cycle_length: !ref <dilation_cycle_length>
    total_steps: !ref <train_timesteps>
    unconditional: !ref <unconditional>

# Instantiated with no arguments.
noise: !new:speechbrain.nnet.diffusion.GaussianNoise

# Wraps the `diffwave` network together with the `noise` object defined above.
diffusion: !new:speechbrain.lobes.models.DiffWave.DiffWaveDiffusion
    model: !ref <diffwave>
    beta_start: !ref <beta_start>
    beta_end: !ref <beta_end>
    timesteps: !ref <train_timesteps>
    noise: !ref <noise>

# Name -> object mapping exposing the two objects built above.
modules:
    diffwave: !ref <diffwave>
    diffusion: !ref <diffusion>

# Registers `diffwave` as a loadable on the Pretrainer.
# NOTE(review): presumably so pretrained parameters can be loaded into it -- confirm.
pretrainer: !new:speechbrain.utils.parameter_transfer.Pretrainer
    loadables:
        diffwave: !ref <diffwave>