# File size: 2,860 bytes
# c885237 (presumably the revision id shown by the file viewer)
---
# Vocoder training configuration. The generator and discriminator classes are
# selected by `generator_type` / `discriminator_type`; the matching `*_params`
# mappings hold their settings. Top-level keys are kept in alphabetical order.
# NOTE(review): the nesting below was restored from a copy whose indentation
# had been stripped; verify the parent of each nested key against the
# consumer's schema before relying on it.

allow_cache: false
# 22528 = 88 * 256 = (11 * 2 * 2 * 2) * hop_size, i.e. the product of
# generator_params.noise_upsample_scales times hop_size.
batch_max_steps: 22528
batch_size: 32
config: conf/style_melgan.v1.yaml
dev_dumpdir: dump/dev_1and2/norm
dev_feats_scp: null
dev_segments: null
dev_wav_scp: null

discriminator_adv_loss_params:
  average_by_discriminators: false
# NOTE(review): -1 presumably disables gradient clipping - confirm.
discriminator_grad_norm: -1
discriminator_optimizer_params:
  betas: [0.5, 0.9]
  lr: 0.0002
  weight_decay: 0.0
discriminator_optimizer_type: Adam
discriminator_params:
  # Settings for the inner discriminator(s); the outer mapping shares the
  # same key name, so keep the two levels distinct when editing.
  discriminator_params:
    bias: true
    channels: 16
    downsample_scales: [4, 4, 4, 1]
    kernel_sizes: [5, 3]
    max_downsample_channels: 512
    nonlinear_activation: LeakyReLU
    nonlinear_activation_params:
      negative_slope: 0.2
    out_channels: 1
  # One row per entry; the first element is 1, 2, 4, 8.
  # 'None' is a YAML *string* (YAML null is spelled `null`); it is quoted here
  # to make that explicit. Presumably a placeholder that is ignored for the
  # first row - confirm with the consumer.
  pqmf_params:
    - [1, 'None', 'None', 'None']
    - [2, 62, 0.267, 9.0]
    - [4, 62, 0.142, 9.0]
    - [8, 62, 0.07949, 9.0]
  repeats: 4
  use_weight_norm: true
  window_sizes: [512, 1024, 2048, 4096]
discriminator_scheduler_params:
  gamma: 0.5
  milestones: [200000, 400000, 600000, 800000]
discriminator_scheduler_type: MultiStepLR
discriminator_train_start_steps: 100000
discriminator_type: StyleMelGANDiscriminator

distributed: false
eval_interval_steps: 1000
fft_size: 1024
fmax: 7600
fmin: 80
format: hdf5

generator_adv_loss_params:
  average_by_discriminators: false
# NOTE(review): -1 presumably disables gradient clipping - confirm.
generator_grad_norm: -1
generator_optimizer_params:
  betas: [0.5, 0.9]
  lr: 0.0001
  weight_decay: 0.0
generator_optimizer_type: Adam
generator_params:
  # aux_channels matches num_mels (80) below.
  aux_channels: 80
  bias: true
  channels: 64
  dilation: 2
  gated_function: softmax
  in_channels: 128
  kernel_size: 9
  noise_upsample_activation: LeakyReLU
  noise_upsample_activation_params:
    negative_slope: 0.2
  noise_upsample_scales: [11, 2, 2, 2]
  out_channels: 1
  upsample_mode: nearest
  # Product of the scales is 2^8 * 1 = 256, which equals hop_size.
  upsample_scales: [2, 2, 2, 2, 2, 2, 2, 2, 1]
  use_weight_norm: true
generator_scheduler_params:
  gamma: 0.5
  milestones: [100000, 300000, 500000, 700000, 900000]
generator_scheduler_type: MultiStepLR
generator_type: StyleMelGANGenerator

global_gain_scale: 1.0
hop_size: 256
lambda_adv: 1.0
lambda_aux: 1.0
log_interval_steps: 100
num_mels: 80
num_save_intermediate_results: 4
num_workers: 2
outdir: exp/train_1and2_style_melgan.v1
pin_memory: true
pretrain: ''
rank: 0
remove_short_samples: false
resume: ''
sampling_rate: 22050
save_interval_steps: 50000

# Three parallel lists: entry i of fft_sizes, hop_sizes and win_lengths
# presumably describes one STFT resolution - confirm with the consumer.
stft_loss_params:
  fft_sizes: [1024, 2048, 512]
  hop_sizes: [120, 240, 50]
  win_lengths: [600, 1200, 240]
  window: hann_window

train_dumpdir: dump/train_1and2/norm
train_feats_scp: null
train_max_steps: 1500000
train_segments: null
train_wav_scp: null
trim_frame_size: 1024
trim_hop_size: 256
trim_silence: false
trim_threshold_in_db: 60
verbose: 1
# Quoted so the version can never be re-typed as a number by tooling.
version: '0.6.0'
win_length: null
window: hann