File size: 1,152 Bytes
e2866fd |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 |
# ################################################
# Basic parameters for a DiffWave vocoder
#
# Author:
# * Yingzhi Wang 2022
# ################################################
# Diffusion schedule: passed to the DiffWaveDiffusion constructor below
# (train_timesteps is also passed to DiffWave as total_steps).
train_timesteps: 50
beta_start: 0.0001
beta_end: 0.05
# DiffWave network arguments, referenced by the `diffwave` entry below.
residual_layers: 30
residual_channels: 64
dilation_cycle_length: 10
unconditional: False
# Spectrogram settings; spec_n_mels is passed to DiffWave as input_channels.
spec_n_mels: 80
# NOTE(review): spec_hop_length is not referenced anywhere in this file;
# presumably it is read by the consuming code - confirm.
spec_hop_length: 256
# DiffWave network object. The constructor arguments must be nested under the
# `!new:` tag: left at top level they are not passed to the constructor and
# instead become duplicate keys that shadow the scalar hyperparameters above.
diffwave: !new:speechbrain.lobes.models.DiffWave.DiffWave
    input_channels: !ref <spec_n_mels>
    residual_layers: !ref <residual_layers>
    residual_channels: !ref <residual_channels>
    dilation_cycle_length: !ref <dilation_cycle_length>
    # Same value that the diffusion wrapper receives as `timesteps`.
    total_steps: !ref <train_timesteps>
    unconditional: !ref <unconditional>
# Noise object, instantiated without arguments; referenced as the `noise`
# argument of the `diffusion` entry.
noise: !new:speechbrain.nnet.diffusion.GaussianNoise
# Diffusion wrapper around the `diffwave` network. Its arguments are nested
# under the `!new:` tag so they reach the constructor instead of overwriting
# the top-level `beta_start`, `beta_end` and `noise` keys.
diffusion: !new:speechbrain.lobes.models.DiffWave.DiffWaveDiffusion
    model: !ref <diffwave>
    beta_start: !ref <beta_start>
    beta_end: !ref <beta_end>
    # Must match the `total_steps` given to the DiffWave network.
    timesteps: !ref <train_timesteps>
    noise: !ref <noise>
# Name -> object mapping of the objects defined above. The entries are nested
# so that `modules` is a mapping rather than a null value, and so that they do
# not redefine the top-level `diffwave` / `diffusion` keys.
modules:
    diffwave: !ref <diffwave>
    diffusion: !ref <diffusion>
# Pretrainer object; `loadables` maps a name to the object registered with it
# (here only the DiffWave network). `loadables` must be nested under the
# `!new:` tag and its entry nested under `loadables`, otherwise the Pretrainer
# is constructed without any loadables.
pretrainer: !new:speechbrain.utils.parameter_transfer.Pretrainer
    loadables:
        diffwave: !ref <diffwave>
|