---
# Configuration for the `audioset` task.
#
# NOTE(review): the indentation of this file had been lost and every line
# carried a stray trailing `|`. Top-level sections are unambiguous (they were
# separated by blank-line runs), but the extent of the two nested sections
# (`data.augmentation` and `train.optimizer`) was reconstructed from the key
# names -- confirm against the code that reads this file.

task_name: audioset

# Dataset indexing, sampling and segment settings.
data:
  indexes_dict: "hdf5s/indexes/full_train.h5"
  sampler_type: balanced_sampler
  anchor_segment_detect_mode: max_area
  sample_rate: 32000
  frames_per_second: 100
  segment_seconds: 2.0
  classes_num: 527
  # NOTE(review): assumed to be nested under `data` -- confirm.
  augmentation:
    match_energy: true
    mix_num: 2

# Sound event detection model selection.
sound_event_detection:
  model_type: Cnn14_DecisionLevelMax
  freeze: true

# Query network selection and freezing options.
query_net:
  model_type: Cnn14_Wrapper
  base_checkpoint_type: "Cnn14"
  freeze_base: true
  freeze_adaptor: false
  bottleneck_type: at_soft
  # Same value as data.classes_num; presumably the two must stay in sync
  # -- TODO confirm.
  outputs_num: 527

# Separation model selection and channel counts.
ss_model:
  model_type: ResUNet30
  input_channels: 1
  output_channels: 1

# Training loop settings.
train:
  num_workers: 16
  loss_type: l1_wav
  # NOTE(review): assumed to contain the five keys below and nothing else
  # -- confirm.
  optimizer:
    optimizer_type: AdamW
    # Written with a decimal point so that YAML 1.1 loaders (e.g. PyYAML)
    # resolve it as a float; a bare `1e-3` is loaded as the string "1e-3".
    learning_rate: 1.0e-3
    lr_lambda_type: constant_warm_up
    warm_up_steps: 10000
    reduce_lr_steps: 1000000
  batch_size_per_device: 16
  precision: 32
  steps_per_epoch: 10000
  evaluate_step_frequency: 20000
  save_step_frequency: 100000
  early_stop_steps: 10000001
  random_seed: 1234
  # Empty string; presumably means "do not resume" -- verify against the
  # consumer.
  resume_checkpoint_path: ""

# Evaluation data locations and per-class cap.
evaluate:
  balanced_train_eval_dir: "evaluation/audioset/2s_segments_balanced_train"
  test_eval_dir: "evaluation/audioset/2s_segments_test"
  max_eval_per_class: 10