---
# Training configuration for the experiment tagged
# vocoder/AudioDec_v3_symADuniv_vctk_48000_hop300_clean.
# Keys are in alphabetical order at every level, which suggests the file was
# produced by a sorted YAML dump of a resolved config - keep that order so
# diffs against regenerated dumps stay small.

# Checkpoint referenced as the "analyzer" for this run.
analyzer: exp/autoencoder/symADuniv_vctk_48000_hop300/checkpoint-500000steps.pkl
batch_length: 9600
batch_size: 16
config: config/vocoder/AudioDec_v3_symADuniv_vctk_48000_hop300_clean.yaml

data:
  # NOTE(review): absolute, machine-specific path - adjust per environment.
  path: /mnt/home/yichiaowu/datasets/vctk_noisy/48000
  subset:
    test: clean_testset_wav
    train: clean_trainset_84spk_wav
    valid: clean_validset_84spk_wav

# NOTE(review): this is the *string* 'False', not a YAML boolean. Kept as-is;
# presumably the consumer compares against the string - confirm before
# changing the type.
disable_cudnn: 'False'

discriminator_adv_loss_params:
  average_by_discriminators: false
discriminator_grad_norm: -1
discriminator_optimizer_params:
  betas:
    - 0.5
    - 0.9
  lr: 0.0002
  weight_decay: 0.0
discriminator_optimizer_type: Adam
discriminator_params:
  # fft_sizes / hop_sizes / win_lengths are parallel lists with three
  # entries each; they carry the same values as stft_loss_params below.
  fft_sizes:
    - 1024
    - 2048
    - 512
  hop_sizes:
    - 120
    - 240
    - 50
  period_discriminator_params:
    bias: true
    channels: 32
    downsample_scales:
      - 3
      - 3
      - 3
      - 3
      - 1
    in_channels: 1
    kernel_sizes:
      - 5
      - 3
    max_downsample_channels: 1024
    nonlinear_activation: LeakyReLU
    nonlinear_activation_params:
      negative_slope: 0.1
    out_channels: 1
    use_spectral_norm: false
    use_weight_norm: true
  periods:
    - 2
    - 3
    - 5
    - 7
    - 11
  spectral_discriminator_params:
    bias: true
    channels: 32
    # Six two-element entries, matching the six entries in strides below.
    kernel_sizes:
      - [3, 9]
      - [3, 9]
      - [3, 9]
      - [3, 9]
      - [3, 3]
      - [3, 3]
    nonlinear_activation: LeakyReLU
    nonlinear_activation_params:
      negative_slope: 0.2
    strides:
      - [1, 1]
      - [1, 2]
      - [1, 2]
      - [1, 2]
      - [1, 1]
      - [1, 1]
  win_lengths:
    - 600
    - 1200
    - 240
  window: hann_window
discriminator_scheduler_params:
  gamma: 0.5
  # NOTE(review): the last two milestones exceed train_max_steps (500000),
  # so they would not be reached if training stops there - confirm intent.
  milestones:
    - 200000
    - 400000
    - 600000
    - 800000
discriminator_scheduler_type: MultiStepLR
discriminator_train_start_steps: 0

eval_interval_steps: 1000
exp_root: exp

feat_match_loss_params:
  average_by_discriminators: false
  average_by_layers: false
  include_final_outputs: false

generator_adv_loss_params:
  average_by_discriminators: false
generator_grad_norm: -1
generator_optimizer_params:
  betas:
    - 0.5
    - 0.9
  lr: 0.0002
  weight_decay: 0.0
generator_optimizer_type: Adam
generator_params:
  bias: true
  channels: 512
  groups: 3
  in_channels: 64
  kernel_size: 7
  nonlinear_activation: LeakyReLU
  nonlinear_activation_params:
    negative_slope: 0.1
  out_channels: 1
  # A single dilation group paired with the single resblock kernel size.
  resblock_dilations:
    - [1, 3, 5]
  resblock_kernel_sizes:
    - 11
  stats: stats/symADuniv_vctk_48000_hop300_clean.npy
  upsample_kernel_sizes:
    - 10
    - 10
    - 8
    - 6
  # Product of the scales is 5 * 5 * 4 * 3 = 300, the same value as the
  # "hop300" in the experiment name and mel_loss_params.hop_sizes.
  upsample_scales:
    - 5
    - 5
    - 4
    - 3
  use_additional_convs: true
  use_weight_norm: true
generator_scheduler_params:
  gamma: 0.5
  # NOTE(review): same milestones as the discriminator scheduler; the last
  # two exceed train_max_steps (500000) - confirm intent.
  milestones:
    - 200000
    - 400000
    - 600000
    - 800000
generator_scheduler_type: MultiStepLR
generator_train_start_steps: 1

# Loss weights. use_shape_loss and use_stft_loss are false further down, so
# lambda_shape_loss / lambda_stft_loss are presumably unused in this run -
# TODO confirm against the trainer.
lambda_adv: 1.0
lambda_feat_match: 2.0
lambda_mel_loss: 45.0
lambda_shape_loss: 45.0
lambda_stft_loss: 45.0

log_interval_steps: 100

mel_loss_params:
  fft_sizes:
    - 2048
  fmax: 24000
  fmin: 0
  fs: 48000
  hop_sizes:
    - 300
  log_base: null
  num_mels: 80
  win_lengths:
    - 2048
  window: hann_window

model_type: UnivNet
num_workers: 2
outdir: exp/vocoder/AudioDec_v3_symADuniv_vctk_48000_hop300_clean
pin_memory: true
# Empty string, not null.
resume: ''
sampling_rate: 48000
save_interval_steps: 100000
seed: 1337

shape_loss_params:
  winlen:
    - 300

stft_loss_params:
  fft_sizes:
    - 1024
    - 2048
    - 512
  hop_sizes:
    - 120
    - 240
    - 50
  win_lengths:
    - 600
    - 1200
    - 240
  window: hann_window

tag: vocoder/AudioDec_v3_symADuniv_vctk_48000_hop300_clean
train_max_steps: 500000
train_mode: vocoder

use_feat_match_loss: true
use_mel_loss: true
use_shape_loss: false
use_stft_loss: false