|
additional_config: null |
|
allow_cache: true |
|
batch_size: 2 |
|
collater_type: NARVCCollater |
|
config: conf/aas_vc.melmelmel.v1.yaml |
|
criterions: |
|
ForwardSumLoss: {} |
|
L1Loss: {} |
|
StochasticDurationPredictorLoss: {} |
|
dev_dp_input_dir: dump/male_dev/norm_self |
|
dev_duration_dir: null |
|
distributed: false |
|
dp_train_start_steps: 0 |
|
duration_predictor_feat: mel |
|
eval_interval_steps: 100 |
|
feat_list: |
|
mel: {} |
|
fft_size: 2048 |
|
fmax: null |
|
fmin: 0 |
|
format: hdf5 |
|
global_gain_scale: 1.0 |
|
grad_norm: 1.0 |
|
gradient_accumulate_steps: 8 |
|
hop_size: 512 |
|
init_checkpoint: '' |
|
lambda_align: 2.0 |
|
log_interval_steps: 10 |
|
model_params: |
|
adim: 384 |
|
aheads: 2 |
|
conformer_dec_kernel_size: 15 |
|
conformer_enc_kernel_size: 15 |
|
conformer_pos_enc_layer_type: rel_pos |
|
conformer_self_attn_layer_type: rel_selfattn |
|
decoder_normalize_before: true |
|
decoder_reduction_factor: 1 |
|
decoder_type: conformer |
|
dlayers: 4 |
|
dunits: 1536 |
|
duration_predictor_chans: 256 |
|
duration_predictor_input_dim: 80 |
|
duration_predictor_kernel_size: 3 |
|
duration_predictor_layers: 2 |
|
duration_predictor_type: stochastic |
|
duration_predictor_use_encoder_outputs: false |
|
elayers: 4 |
|
encoder_input_layer: linear |
|
encoder_normalize_before: true |
|
encoder_reduction_factor: 1 |
|
encoder_type: conformer |
|
eunits: 1536 |
|
idim: 80 |
|
init_type: xavier_uniform |
|
odim: 80 |
|
positionwise_conv_kernel_size: 1 |
|
positionwise_layer_type: linear |
|
post_encoder_reduction_factor: 4 |
|
postnet_chans: 256 |
|
postnet_filts: 5 |
|
postnet_layers: 5 |
|
transformer_dec_attn_dropout_rate: 0.2 |
|
transformer_dec_dropout_rate: 0.2 |
|
transformer_dec_positional_dropout_rate: 0.2 |
|
transformer_enc_attn_dropout_rate: 0.2 |
|
transformer_enc_dropout_rate: 0.2 |
|
transformer_enc_positional_dropout_rate: 0.2 |
|
use_cnn_in_conformer: true |
|
use_macaron_style_in_conformer: true |
|
use_masking: true |
|
model_type: AASVC |
|
mp: false |
|
num_mels: 80 |
|
num_save_intermediate_results: 4 |
|
num_workers: 0 |
|
optimizer_params: |
|
lr: 8.0e-05 |
|
optimizer_type: Adam |
|
outdir: exp/male_female_aas_vc.melmelmel.v1 |
|
pin_memory: true |
|
rank: 0 |
|
resume: '' |
|
sampling_rate: 48000 |
|
save_interval_steps: 5000 |
|
scheduler: warmuplr |
|
scheduler_params: |
|
warmup_steps: 4000 |
|
src_dev_dumpdir: dump/male_dev/norm_self |
|
src_feat: mel |
|
src_feat_type: mel |
|
src_train_dumpdir: dump/male_train_parallel/norm_self |
|
train_dp_input_dir: dump/male_train_parallel/norm_self |
|
train_duration_dir: null |
|
train_max_steps: 100000 |
|
trainer_type: AASVCTrainer |
|
trg_dev_dumpdir: dump/female_dev/norm_self |
|
trg_feat: mel |
|
trg_feat_type: mel |
|
trg_stats: exp/male_female_aas_vc.melmelmel.v1/stats.h5 |
|
trg_train_dumpdir: dump/female_train_parallel/norm_self |
|
trim_frame_size: 2048 |
|
trim_hop_size: 512 |
|
trim_silence: false |
|
trim_threshold_in_db: 60 |
|
verbose: 1 |
|
version: 0.1.0 |
|
vocoder: |
|
checkpoint: /data/group1/z44476r/Experiments/ParallelWaveGAN/egs/hificaptain_jp_female/voc1/exp/train_parallel_parallel_wavegan.v1/checkpoint-400000steps.pkl |
|
config: /data/group1/z44476r/Experiments/ParallelWaveGAN/egs/hificaptain_jp_female/voc1/exp/train_parallel_parallel_wavegan.v1/config.yml |
|
stats: /data/group1/z44476r/Experiments/ParallelWaveGAN/egs/hificaptain_jp_female/voc1/exp/train_parallel_parallel_wavegan.v1/stats.h5 |
|
win_length: null |
|
window: hann |
|
|