; File size: 1,822 Bytes
; 1037d04

; Training-run settings. Booleans in this section are written in lowercase
; (true/false) so that one spelling is used throughout.
[train]
seed = 43
; Empty value, i.e. the empty string. NOTE(review): presumably the consumer
; then picks a device on its own -- confirm.
device =
; NOTE(review): the architecture section in this file is named [deepfilternet];
; confirm that it is the section read for this model name.
model = deepfilternet2
jit = false
mask_only = false
df_only = false
batch_size = 96
batch_size_eval = 128
num_workers = 16
; The `_s` suffix suggests seconds -- TODO confirm.
max_sample_len_s = 3.0
; The `p_` prefix suggests a probability in [0, 1] -- TODO confirm.
p_atten_lim = 0.0
p_reverb = 0.1
overfit = false
max_epochs = 100
log_freq = 100
log_timings = false
; These two keys presumably belong together (criterion name and whether
; smaller or larger is better) -- confirm.
validation_criteria = loss
validation_criteria_rule = min
early_stopping_patience = 15
global_ds_sampling_f = 1
num_prefetch_batches = 8
; Comma-separated list; presumably signal-to-noise ratios in dB -- confirm.
dataloader_snrs = -5,0,5,10,20,40
detect_anomaly = false
; Comma-separated `a/b` pairs. NOTE(review): presumably
; `<start epoch>/<batch size>` -- confirm. The last pair (40/9999) exceeds
; batch_size = 96 above; check how the consumer combines the two.
batch_size_scheduling = 0/8,1/16,2/24,5/32,10/64,20/128,40/9999
start_eval = true
validation_set_caching = false

; Signal-processing parameters. NOTE(review): units are not stated in this
; file; sr is presumably a sample rate in Hz and fft_size / hop_size sample
; counts -- confirm.
[df]
sr = 48000
fft_size = 960
; Exactly half of fft_size (960 / 2).
hop_size = 480
nb_erb = 32
nb_df = 96
norm_tau = 1
; lsnr_max and lsnr_min bound the range -15 .. 35; presumably a local SNR in
; dB -- confirm.
lsnr_max = 35
lsnr_min = -15
min_nb_erb_freqs = 2
pad_mode = input_specf

; Model-architecture settings. Booleans are written in lowercase (true/false)
; to match the spelling used in [train].
; NOTE(review): [train] sets model = deepfilternet2 while this section is named
; deepfilternet; confirm the consumer reads this section for that model.
[deepfilternet]
conv_lookahead = 2
conv_ch = 64
conv_depthwise = true
emb_hidden_dim = 256
emb_num_layers = 3
gru_groups = 8
linear_groups = 8
conv_dec_mode = transposed
convt_depthwise = true
mask_pf = false
df_order = 5
; Same value as conv_lookahead above.
df_lookahead = 2
df_hidden_dim = 256
df_num_layers = 2
dfop_method = df
group_shuffle = false
; Comma-separated pair of integers; presumably a 2-D kernel size -- confirm
; the axis order with the consumer.
conv_kernel = 1,3
; The literal string `none`, not an empty value.
df_gru_skip = none
df_output_layer = groupedlinear
gru_type = squeeze
df_pathway_kernel_size_t = 5
df_n_iter = 1
enc_concat = true
; Comma-separated pair of integers, same format as conv_kernel.
conv_kernel_inp = 3,3

; Single setting for the section named localsnrloss.
; NOTE(review): `factor` is presumably the weight of this loss term -- confirm.
[localsnrloss]
factor = 1e-3

; Settings for the section named maskloss.
[maskloss]
; NOTE(review): written as the integer 0 while other sections use 0.0;
; presumably a zero factor disables this term -- confirm.
factor = 0
mask = iam
; gamma and gamma_pred carry the same value.
gamma = 0.6
gamma_pred = 0.6
f_under = 1

; Settings for the section named spectralloss.
; NOTE(review): the two factor_* keys are presumably weights for a magnitude
; term and a complex term -- confirm.
[spectralloss]
factor_magnitude = 1000
factor_complex = 1000
; Same gamma value as in [multiresspecloss].
gamma = 0.3

; Single setting for the section named dfalphaloss.
; NOTE(review): a factor of 0.0 presumably disables this term -- confirm.
[dfalphaloss]
factor = 0.0

; Settings for the section named multiresspecloss.
[multiresspecloss]
factor = 500
factor_complex = 500
gamma = 0.3
; Comma-separated list of integers; each value is double the previous one.
fft_sizes = 256,512,1024

; Optimizer and learning-rate schedule settings. Booleans are written in
; lowercase (true/false) to match the spelling used in [train].
[optim]
lr = 0.001
momentum = 0
; NOTE(review): weight_decay_end (0.05) is many orders of magnitude larger
; than weight_decay (1e-12); confirm that this schedule is intended.
weight_decay = 1e-12
weight_decay_end = 0.05
optimizer = adamw
lr_min = 1e-06
; lr_warmup is one tenth of lr; presumably the starting rate used during
; the warmup_epochs below -- confirm.
lr_warmup = 0.0001
warmup_epochs = 3
lr_cycle_mul = 1.0
lr_cycle_decay = 0.5
lr_cycle_limit = 1
lr_update_per_epoch = false
; Negative value; presumably a sentinel (e.g. "derive from max_epochs")
; -- confirm.
lr_cycle_epochs = -1

; Settings for the section named sdrloss.
; NOTE(review): a factor of 0.0 presumably disables this term -- confirm.
[sdrloss]
factor = 0.0
segmental_ws = 0