File size: 1,892 Bytes
350b90e
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
# Training configuration for a MIDI-extraction task (see task_cls, model_cls
# and binarizer_cls below for the classes this file selects).
# Keys are sorted alphabetically, which suggests this file was dumped by a
# tool rather than hand-written — TODO confirm before reordering or
# reformatting. Related settings are therefore NOT adjacent; cross-references
# are given in the comments.
# NOTE(review): the loader for this file is not visible here. Unless a value
# makes the meaning explicit, the descriptions below are inferred from key
# names and must be verified against the consuming code.
#
# Presumably the number of batches accumulated per optimizer step — verify.
accumulate_grad_batches: 1
# Audio front-end settings; see also fmax, fmin, hop_size, win_size.
# Presumably in Hz — TODO confirm.
audio_sample_rate: 44100
# Options for the preprocessing ("binarization") step run by binarizer_cls.
binarization_args:
  num_workers: 0
  shuffle: true
# Dotted path of the binarizer class; resolved by the consuming code.
binarizer_cls: preprocessing.MIDIExtractionBinarizer
# Relative path; presumably where the binarized dataset is written/read.
binary_data_dir: data/some_ds_fixmel_spk3_aug8/binary
clip_grad_norm: 1
dataloader_prefetch_factor: 2
ddp_backend: nccl
ds_workers: 4
# Fine-tuning is switched off here: no checkpoint path and enabled=false.
finetune_ckpt_path: null
finetune_enabled: false
finetune_ignored_params: []
finetune_strict_shapes: true
# Presumably the frequency range (Hz) of the spectrogram — TODO confirm.
fmax: 8000
fmin: 40
# Parameter freezing is switched off here; the frozen list is empty.
freezing_enabled: false
frozen_params: []
# Presumably in samples (see win_size) — TODO confirm.
hop_size: 512
log_interval: 100
# Learning-rate scheduler selection and its arguments.
lr_scheduler_args:
  # Written with a decimal point and a signed exponent on purpose: if this
  # file is loaded with a YAML 1.1 parser such as PyYAML, a form like `1e-5`
  # would be read as a string instead of a float. Do not "simplify" it.
  min_lr: 1.0e-05
  scheduler_cls: lr_scheduler.scheduler.WarmupLR
  warmup_steps: 5000
# Batch limits: a frame budget and a sample-count cap, for training and
# (max_val_*) validation. How the two limits interact is decided by the
# sampler code — verify there.
max_batch_frames: 80000
max_batch_size: 8
max_updates: 10000000
max_val_batch_frames: 10000
max_val_batch_size: 1
# Hyper-parameters handed to the model named by model_cls.
midi_extractor_args:
  attention_drop: 0.1
  attention_heads: 8
  attention_heads_dim: 64
  conv_drop: 0.1
  dim: 512
  ffn_latent_drop: 0.1
  ffn_out_drop: 0.1
  kernel_size: 31
  # NOTE(review): "lay" presumably abbreviates "layers" — confirm.
  lay: 8
  use_lay_skip: true
# MIDI target settings; exact semantics (inclusive/exclusive bounds, bin
# layout) are defined by the consuming code — verify there.
midi_max: 128
midi_min: 0
midi_num_bins: 256
midi_prob_deviation: 0.5
# NOTE(review): a proportion of 0.0 presumably disables the shift described
# by midi_shift_range below — confirm this is intended.
midi_shift_proportion: 0.0
# Two-element list: lower and upper bound of the shift (units not shown here).
midi_shift_range:
- -6
- 6
# Dotted path of the model class; resolved by the consuming code.
model_cls: modules.model.Gmidi_conform.midi_conforms
num_ckpt_keep: 5
num_sanity_val_steps: 1
num_valid_plots: 300
# Optimizer selection and its arguments.
optimizer_args:
  beta1: 0.9
  beta2: 0.98
  lr: 0.0001
  optimizer_cls: torch.optim.AdamW
  weight_decay: 0
# Presumably the pitch extractor and its checkpoint (relative path) — verify.
pe: rmvpe
pe_ckpt: pretrained/rmvpe/model.pt
permanent_ckpt_interval: 40000
permanent_ckpt_start: 200000
# pl_trainer_* keys are presumably forwarded to a PyTorch Lightning Trainer
# (the prefix and the "32-true" precision string suggest this) — TODO confirm.
pl_trainer_accelerator: auto
pl_trainer_devices: auto
pl_trainer_num_nodes: 1
# Plain scalar that is not a number, so it loads as the string "32-true".
pl_trainer_precision: 32-true
pl_trainer_strategy: auto
# Empty list: no raw data directories are configured in this file.
raw_data_dir: []
rest_threshold: 0.1
sampler_frame_count_grid: 6
seed: 114514
sort_by_len: true
# Dotted path of the training task class; resolved by the consuming code.
task_cls: training.MIDIExtractionTask
test_prefixes: null
train_set_name: train
# Input feature ("units") settings.
# NOTE(review): units_encoder is "mel" while units_encoder_ckpt points at a
# contentvec checkpoint; the checkpoint is possibly unused in this setup —
# confirm against the loader before relying on either value.
units_dim: 80
units_encoder: mel
units_encoder_ckpt: pretrained/contentvec/checkpoint_best_legacy_500.pt
# NOTE(review): "buond" looks like a misspelling of "bound". The key name is
# read by external code, so it is left unchanged here; rename only together
# with the consumer.
use_buond_loss: true
use_midi_loss: true
val_check_interval: 4000
valid_set_name: valid
# Presumably in samples (see hop_size) — TODO confirm.
win_size: 2048