File size: 1,723 Bytes
6efc863
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
# Model section: names the autoencoder class (`target`) and the `params`
# mapping that accompanies it.
# NOTE(review): presumably the training entry point instantiates `target`
# with `params` as keyword arguments — confirm against the loader.
model:
  base_learning_rate: 4.5e-06
  target: ldm.models.autoencoder1d.AutoencoderKL
  params:
    # Same value as ddconfig.z_channels below (20).
    embed_dim: 20
    # Name of the metric to monitor.
    # NOTE(review): presumably drives checkpoint selection — confirm.
    monitor: val/rec_loss
    # Encoder/decoder settings passed to the autoencoder.
    ddconfig:
      double_z: true
      # in_channels and out_ch both equal data.params.mel_num (80).
      in_channels: 80
      out_ch: 80
      z_channels: 20
      kernel_size: 5
      ch: 384
      # Three entries (1, 2, 4).
      # NOTE(review): presumably per-level multipliers applied to `ch` — confirm.
      ch_mult:
      - 1
      - 2
      - 4
      num_res_blocks: 2
      # NOTE(review): presumably level indices for attention (attn_layers) and
      # downsampling (down_layers) — verify the indexing convention in
      # ldm.models.autoencoder1d before changing.
      attn_layers:
      - 3
      down_layers:
      - 0
      dropout: 0.0
    # Loss settings: class in `target`, arguments in `params`.
    lossconfig:
      target: ldm.modules.losses_audio.contperceptual.LPAPSWithDiscriminator
      params:
        # NOTE(review): presumably the global step at which the discriminator
        # term becomes active — confirm.
        disc_start: 80001
        # Set to 0.0 here.
        # NOTE(review): presumably disables the perceptual term — confirm.
        perceptual_weight: 0.0
        kl_weight: 1.0e-06
        disc_weight: 0.5
        disc_in_channels: 1
        disc_loss: mse
        disc_factor: 2
        disc_conditional: false
        # Non-zero R1 regularization weight; lightning.trainer.sync_batchnorm is
        # set to false in this file with a comment citing r1_regularization.
        r1_reg_weight: 3

# Lightning section: logging callbacks and trainer options.
lightning:
  callbacks:
    # The key is `image_logger`, but the configured target is main.AudioLogger.
    image_logger:
      target: main.AudioLogger
      params:
        for_specs: true
        increase_log_steps: false
        # NOTE(review): presumably the logging interval in training batches —
        # confirm.
        batch_frequency: 5000
        max_images: 8
        rescale: false
        # NOTE(review): melvmin/melvmax are presumably the value range used when
        # rendering mel spectrograms — confirm in main.AudioLogger.
        melvmin: -5
        melvmax: 1.5
        # Vocoder configuration handed to the logger: class in `target`,
        # checkpoint location in `params`.
        vocoder_cfg:
          target: vocoder.bigvgan.models.VocoderBigVGAN
          params:
            # Relative path.
            # NOTE(review): presumably resolved from the launch directory —
            # confirm.
            ckpt_vocoder: vocoder/logs/bigvnat16k93.5w
  trainer:
    sync_batchnorm: false # not working with r1_regularization
    strategy: ddp


# Data section: data module class (`target`) and its `params`, including the
# train and validation dataset classes.
data:
  target: main.SpectrogramDataModuleFromConfig
  params:
    # NOTE(review): under `strategy: ddp` this is presumably the per-process
    # batch size — confirm.
    batch_size: 4
    num_workers: 16
    # Relative path.
    # NOTE(review): presumably a directory of TSV manifests, judging by the
    # path name — confirm.
    spec_dir_path: ldm/data/tsv_dirs/full_data/V1_new
    # Equals model.params.ddconfig.in_channels / out_ch (80).
    mel_num: 80
    # spec_len and spec_crop_len are both 624.
    # NOTE(review): equal values presumably mean no effective cropping —
    # confirm in the dataset class.
    spec_len: 624
    spec_crop_len: 624
    # train and validation both come from ldm.data.joinaudiodataset_624 and both
    # receive specs_dataset_cfg: null.
    train:
      target: ldm.data.joinaudiodataset_624.JoinSpecsTrain
      params:
        specs_dataset_cfg: null
    validation:
      target: ldm.data.joinaudiodataset_624.JoinSpecsValidation
      params:
        specs_dataset_cfg: null