# Viewer metadata kept from the copied page: file size 2,860 Bytes, id c885237.
# (The line-number gutter 1-168 that followed was extraction residue, not YAML.)
# Run-level switches and validation (dev) inputs.
allow_cache: false
# 22528 = 88 * 256, i.e. a whole multiple of hop_size (256) set further down.
batch_max_steps: 22528
batch_size: 32
# NOTE(review): presumably the recipe config this dump was produced from.
config: 'conf/style_melgan.v1.yaml'
dev_dumpdir: 'dump/dev_1and2/norm'
# The three explicit dev inputs are null; only dev_dumpdir carries a value.
dev_feats_scp: null
dev_segments: null
dev_wav_scp: null
# Discriminator: adversarial-loss options, gradient-norm setting, optimizer.
discriminator_adv_loss_params:
  average_by_discriminators: false
# NOTE(review): -1 presumably means "no gradient clipping" — confirm in trainer.
discriminator_grad_norm: -1
discriminator_optimizer_params:
  betas: [0.5, 0.9]
  # Twice the generator learning rate (0.0001) configured in this file.
  lr: 0.0002
  weight_decay: 0.0
discriminator_optimizer_type: Adam
# Arguments for the discriminator (presumably the class named by
# discriminator_type — confirm against the consumer).
discriminator_params:
  # Nested mapping that reuses its parent's key name.
  discriminator_params:
    bias: true
    channels: 16
    downsample_scales: [4, 4, 4, 1]
    kernel_sizes: [5, 3]
    max_downsample_channels: 512
    nonlinear_activation: LeakyReLU
    nonlinear_activation_params:
      negative_slope: 0.2
    out_channels: 1
  # One four-element row per entry; the first column runs 1, 2, 4, 8.
  # The first row's placeholders were previously the bare word None, which
  # YAML loads as the string "None". `null` is the actual YAML null value.
  # NOTE(review): assumes the consumer ignores or accepts null for the
  # first-column-1 row — confirm before retraining or reloading.
  pqmf_params:
  - [1, null, null, null]
  - [2, 62, 0.267, 9.0]
  - [4, 62, 0.142, 9.0]
  - [8, 62, 0.07949, 9.0]
  repeats: 4
  use_weight_norm: true
  window_sizes: [512, 1024, 2048, 4096]
# Discriminator learning-rate schedule, start step and model type.
discriminator_scheduler_params:
  gamma: 0.5
  # Four milestones, spaced 200000 steps apart.
  milestones: [200000, 400000, 600000, 800000]
discriminator_scheduler_type: MultiStepLR
# NOTE(review): presumably the step at which discriminator training begins.
discriminator_train_start_steps: 100000
discriminator_type: StyleMelGANDiscriminator
distributed: false
eval_interval_steps: 1000
# Analysis settings; fft_size matches trim_frame_size (1024) in this file.
fft_size: 1024
# NOTE(review): fmax/fmin are presumably in Hz — confirm with the extractor.
fmax: 7600
fmin: 80
format: 'hdf5'
# Generator: adversarial-loss options, gradient-norm setting, optimizer.
generator_adv_loss_params:
  average_by_discriminators: false
# NOTE(review): -1 presumably means "no gradient clipping" — confirm in trainer.
generator_grad_norm: -1
generator_optimizer_params:
  betas: [0.5, 0.9]
  # Half the discriminator learning rate (0.0002) configured in this file.
  lr: 0.0001
  weight_decay: 0.0
generator_optimizer_type: Adam
# Arguments for the generator (presumably the class named by generator_type —
# confirm against the consumer).
generator_params:
  # Same value as num_mels (80) elsewhere in this file.
  aux_channels: 80
  bias: true
  channels: 64
  dilation: 2
  gated_function: softmax
  in_channels: 128
  kernel_size: 9
  noise_upsample_activation: LeakyReLU
  noise_upsample_activation_params:
    negative_slope: 0.2
  # Product is 11 * 2 * 2 * 2 = 88; batch_max_steps (22528) = 88 * 256.
  noise_upsample_scales: [11, 2, 2, 2]
  out_channels: 1
  upsample_mode: nearest
  # Eight factors of 2 and a final 1: product 256, equal to hop_size.
  upsample_scales: [2, 2, 2, 2, 2, 2, 2, 2, 1]
  use_weight_norm: true
# Generator learning-rate schedule and model type.
generator_scheduler_params:
  gamma: 0.5
  # Five milestones, offset by 100000 steps from the discriminator's.
  milestones: [100000, 300000, 500000, 700000, 900000]
generator_scheduler_type: MultiStepLR
generator_type: StyleMelGANGenerator
global_gain_scale: 1.0
# Equals the product of generator_params.upsample_scales (256).
hop_size: 256
# Both loss weights are 1.0.
lambda_adv: 1.0
lambda_aux: 1.0
log_interval_steps: 100
num_mels: 80
num_save_intermediate_results: 4
num_workers: 2
outdir: 'exp/train_1and2_style_melgan.v1'
pin_memory: true
# Empty strings: no pretrain / resume path is given in this dump.
pretrain: ''
rank: 0
remove_short_samples: false
resume: ''
sampling_rate: 22050
save_interval_steps: 50000
# STFT loss settings: three parallel lists, read column-wise as
# (fft_size, hop_size, win_length) = (1024, 120, 600), (2048, 240, 1200),
# (512, 50, 240).
stft_loss_params:
  fft_sizes: [1024, 2048, 512]
  hop_sizes: [120, 240, 50]
  win_lengths: [600, 1200, 240]
  window: hann_window
# Training inputs: only train_dumpdir carries a value, the rest are null.
train_dumpdir: 'dump/train_1and2/norm'
train_feats_scp: null
train_max_steps: 1500000
train_segments: null
train_wav_scp: null
# Trimming parameters; trim_silence is false in this dump.
trim_frame_size: 1024
trim_hop_size: 256
trim_silence: false
trim_threshold_in_db: 60
verbose: 1
# Quoted so the version is unmistakably a string (it already parsed as one).
version: '0.6.0'
# NOTE(review): null presumably falls back to fft_size — confirm in extractor.
win_length: null
window: hann