# Hyperparameters for building a DiffWave model and its diffusion wrapper.
#
# This file uses HyperPyYAML tags:
#   !new:<dotted.path>  instantiates the named class with the nested keys
#                       passed as keyword arguments.
#   !ref <key>          reuses the value (or object) defined under <key>.
# Nested keys MUST stay indented under their parent; at top level they would
# collide with the scalar hyperparameters of the same name defined below.

# Diffusion schedule. `train_timesteps` is shared by the network
# (`total_steps`) and by the diffusion wrapper (`timesteps`), so the two
# always agree on the number of steps.
train_timesteps: 50
beta_start: 0.0001
beta_end: 0.05

# Network size, forwarded unchanged to the DiffWave constructor.
residual_layers: 30
residual_channels: 64
dilation_cycle_length: 10

# Forwarded to the DiffWave constructor as `unconditional`.
unconditional: False

# Spectrogram settings. `spec_n_mels` is used as the network's
# `input_channels`.
# NOTE(review): `spec_hop_length` is not referenced anywhere in this file;
# presumably it is read by the code that loads these hparams -- confirm.
spec_n_mels: 80
spec_hop_length: 256

# The DiffWave network.
diffwave: !new:speechbrain.lobes.models.DiffWave.DiffWave
    input_channels: !ref <spec_n_mels>
    residual_layers: !ref <residual_layers>
    residual_channels: !ref <residual_channels>
    dilation_cycle_length: !ref <dilation_cycle_length>
    total_steps: !ref <train_timesteps>
    unconditional: !ref <unconditional>

# Noise object handed to the diffusion wrapper (constructed with no arguments).
noise: !new:speechbrain.nnet.diffusion.GaussianNoise

# Diffusion wrapper around the network, configured with the schedule above.
diffusion: !new:speechbrain.lobes.models.DiffWave.DiffWaveDiffusion
    model: !ref <diffwave>
    beta_start: !ref <beta_start>
    beta_end: !ref <beta_end>
    timesteps: !ref <train_timesteps>
    noise: !ref <noise>

# Objects exposed under `modules`; both entries are references to the
# instances created above, not new copies.
modules:
    diffwave: !ref <diffwave>
    diffusion: !ref <diffusion>

# Pretrainer whose only loadable is the `diffwave` network instance.
pretrainer: !new:speechbrain.utils.parameter_transfer.Pretrainer
    loadables:
        diffwave: !ref <diffwave>