gorinars committed on
Commit
d53daf9
1 Parent(s): 771a6c2

first commit

Browse files
Files changed (5) hide show
  1. .gitattributes +2 -0
  2. config.json +3 -0
  3. embedding_model.ckpt +3 -0
  4. hyperparams.yaml +59 -0
  5. normalizer.ckpt +3 -0
.gitattributes CHANGED
@@ -32,3 +32,5 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
32
  *.zip filter=lfs diff=lfs merge=lfs -text
33
  *.zst filter=lfs diff=lfs merge=lfs -text
34
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
 
32
  *.zip filter=lfs diff=lfs merge=lfs -text
33
  *.zst filter=lfs diff=lfs merge=lfs -text
34
  *tfevents* filter=lfs diff=lfs merge=lfs -text
35
+ normalizer.ckpt filter=lfs diff=lfs merge=lfs -text
36
+ embedding_model.ckpt filter=lfs diff=lfs merge=lfs -text
config.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ {
2
+ "speechbrain_interface": "SpeakerRecognition"
3
+ }
embedding_model.ckpt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:29d43ac4071329841ac35e090db7883ad44618bfbcde36f3b13219dc0b5e8367
3
+ size 301999678
hyperparams.yaml ADDED
@@ -0,0 +1,59 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # ############################################################################
2
+ # Model: Cnn14 (PANN) embedding model with ECAPA-TDNN classifier for speaker verification
3
+ # ############################################################################
4
+
5
+ # Feature parameters
6
+ n_mels: 80
7
+
8
+ # Pretrain folder (HuggingFace)
9
+ pretrained_path: gorinars/sb-cssl-vgg-sup
10
+
11
+ # Output parameters
12
+ out_n_neurons: 308
13
+
14
+ # Model params
15
+ compute_features: !new:speechbrain.lobes.features.Fbank
16
+ n_mels: 80
17
+ left_frames: 0
18
+ right_frames: 0
19
+ deltas: false
20
+ sample_rate: 16000
21
+ n_fft: 400
22
+ win_length: 25
23
+ hop_length: 10
24
+ f_min: 0
25
+
26
+
27
+ mean_var_norm: !new:speechbrain.processing.features.InputNormalization
28
+ norm_type: sentence
29
+ std_norm: False
30
+
31
+ embedding_model: !new:crytorch.models.components.pann.Cnn14
32
+ mel_bins: 80
33
+ emb_dim: 2048
34
+ norm_type: bn
35
+
36
+
37
+ classifier: !new:speechbrain.lobes.models.ECAPA_TDNN.Classifier
38
+ input_size: 2048
39
+ out_neurons: !ref <out_n_neurons>
40
+
41
+ modules:
42
+ compute_features: !ref <compute_features>
43
+ mean_var_norm: !ref <mean_var_norm>
44
+ embedding_model: !ref <embedding_model>
45
+ classifier: !ref <classifier>
46
+
47
+ label_encoder: !new:speechbrain.dataio.encoder.CategoricalEncoder
48
+
49
+
50
+ pretrainer: !new:speechbrain.utils.parameter_transfer.Pretrainer
51
+ loadables:
52
+ embedding_model: !ref <embedding_model>
53
+ #classifier: !ref <classifier>
54
+ #label_encoder: !ref <label_encoder>
55
+ paths:
56
+ embedding_model: !ref <pretrained_path>/embedding_model.ckpt
57
+ #classifier: !ref <pretrained_path>/classifier.ckpt
58
+ #label_encoder: !ref <pretrained_path>/label_encoder.txt
59
+
normalizer.ckpt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:01dd629a2a24b29ad133b15930494e168114b788c4d7579ac2862e3d406e00fb
3
+ size 1063