Spaces: Running on Zero
Update ldm/modules/encoders/CLAP/config.yaml
Browse files
ldm/modules/encoders/CLAP/config.yaml
CHANGED
@@ -1,26 +1,26 @@
-# TEXT ENCODER CONFIG
-text_model: '
-text_len: 100
-transformer_embed_dim: 768
-freeze_text_encoder_weights: True
-
-# AUDIO ENCODER CONFIG
-audioenc_name: 'Cnn14'
-out_emb: 2048
-sampling_rate: 44100
-duration: 5
-fmin: 50
-fmax: 14000
-n_fft: 1028
-hop_size: 320
-mel_bins: 64
-window_size: 1024
-
-# PROJECTION SPACE CONFIG
-d_proj: 1024
-temperature: 0.003
-
-# TRAINING AND EVALUATION CONFIG
-num_classes: 527
-batch_size: 1024
-demo: False
+# TEXT ENCODER CONFIG
+text_model: 'ldm/modules/encoders/CLAP/bert-base-uncased'
+text_len: 100
+transformer_embed_dim: 768
+freeze_text_encoder_weights: True
+
+# AUDIO ENCODER CONFIG
+audioenc_name: 'Cnn14'
+out_emb: 2048
+sampling_rate: 44100
+duration: 5
+fmin: 50
+fmax: 14000
+n_fft: 1028
+hop_size: 320
+mel_bins: 64
+window_size: 1024
+
+# PROJECTION SPACE CONFIG
+d_proj: 1024
+temperature: 0.003
+
+# TRAINING AND EVALUATION CONFIG
+num_classes: 527
+batch_size: 1024
+demo: False