File size: 1,108 Bytes
699157c
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
# General settings for this configuration: stage, corpus type, input/output
# paths, feature type and the HiFi-GAN path.
# NOTE(review): the meaning of each key is inferred from its name only —
# confirm against the code that loads this file.
general:
  stage: "ssl"
  corpus_type: "single"  # (single, multi-seen, multi-unseen)
  # All configured paths are relative (they start with "./"); presumably they
  # are resolved against the working directory — TODO confirm.
  source_path: "./data/tono"
  # Explicitly null, i.e. no value is configured for this key.
  aux_path: null
  preprocessed_path: "./preprocessed/tono"
  output_path: "./output/vocfeats/tono"
  # Explicitly null, i.e. no value is configured for this key.
  test_wav_path: null
  feature_type: "vocfeats"
  hifigan_path: "./hifigan/hifigan_jvs_40d_600k"
  # Booleans use the canonical lowercase spelling so that YAML 1.1 and
  # YAML 1.2 loaders both resolve them to a boolean.
  power_norm: true
  use_gst: false

# Preprocessing settings: dataset split counts followed by signal-analysis
# values.
# NOTE(review): this file does not state units; every unit or meaning noted
# below is an assumption based on the key name — confirm against the
# preprocessing code.
preprocess:
  # Split sizes: 270 + 34 + 30 = 334 items in total.
  n_train: 270
  n_val: 34
  n_test: 30
  # Presumably in Hz — TODO confirm.
  sampling_rate: 22050
  # frame_length equals fft_length (1024); frame_shift (256) is one quarter
  # of frame_length. Presumably all three are in samples — TODO confirm.
  frame_length: 1024
  frame_shift: 256
  fft_length: 1024
  # Presumably a frequency range in Hz; fmax (8000) is below half of
  # sampling_rate (11025) — TODO confirm units.
  fmin: 0
  fmax: 8000
  n_mels: 80
  cep_order: 40
  comp_factor: 1.0
  min_magnitude: 0.00001
  # Quoted, so the value is loaded as the string "16k" rather than a number.
  bitrate: "16k"
  f0_extractor: "harvest"
  # 32768.0 == 2**15; presumably the 16-bit PCM full-scale constant — verify.
  max_wav_value: 32768.0
  # Unit not stated here (seconds vs. frames) — TODO confirm.
  segment_length: 2

# Training settings: batch/epoch counts, optimizer values, logging,
# pretrained-model options and loss configuration.
# NOTE(review): the meaning of each key is inferred from its name only —
# confirm against the training code.
# Booleans use the canonical lowercase spelling so that YAML 1.1 and YAML 1.2
# loaders both resolve them to a boolean.
train:
  batchsize: 4
  epoch: 50
  # Half of `epoch` (25 of 50); what this count controls is not visible in
  # this file — TODO confirm.
  epoch_channel: 25
  multi_gpu_mode: false
  num_workers: 4
  learning_rate: 0.001
  # alpha and beta are both 0.1; presumably weighting coefficients — verify.
  alpha: 0.1
  beta: 0.1
  grad_clip_thresh: 1.0
  logger_step: 1000
  # load_pretrained is false and pretrained_path is null, so no pretrained
  # path is configured here.
  load_pretrained: false
  pretrained_path: null
  fix_channel: false
  early_stopping: false
  multi_scale_loss:
    use_linear: true
    gamma: 1.0
  feature_loss:
    # "mae" presumably selects mean absolute error — TODO confirm the set of
    # accepted values.
    type: "mae"

# "dual" settings: an enable flag plus the path of a second YAML config file.
# NOTE(review): how the referenced file is combined with this one is not
# visible here — confirm against the loader.
dual:
  # Canonical lowercase boolean, resolved identically by YAML 1.1 and 1.2.
  enable: true
  # Quoted to match the other path values in this file; the loaded string is
  # unchanged.
  config_path: "./configs/train/vocfeats/dual.yaml"