Upload folder using huggingface_hub

Files changed (3)

README.md CHANGED Viewed

@@ -14,6 +14,12 @@ tags:
 - voice-activity-detection
 - overlapped-speech-detection
 - resegmentation
-licence: mit
 ---
 This is the model card of a pyannote model that has been pushed on the Hub. This model card has been automatically generated.

 - voice-activity-detection
 - overlapped-speech-detection
 - resegmentation
+- speaker-recognition
+- speaker-verification
+- speaker-identification
+- speaker-embedding
+- PyTorch
+- wespeaker
+license: cc-by-4.0
 ---
 This is the model card of a pyannote model that has been pushed on the Hub. This model card has been automatically generated.

config.yaml CHANGED Viewed

@@ -1,21 +1,10 @@
 model:
-  _target_: pyannote.audio.models.segmentation.PyanNet.PyanNet
-  linear:
-    hidden_size: 128
-    num_layers: 2
-  lstm:
-    batch_first: true
-    bidirectional: true
-    dropout: 0.0
-    hidden_size: 128
-    monolithic: true
-    num_layers: 4
   num_channels: 1
   sample_rate: 16000
-  sincnet:
-    sample_rate: 16000
-    stride: 10
-task:
-  duration: 10.0
-  max_speakers_per_chunk: 3
-  max_speakers_per_frame: 2

 model:
+  _target_: pyannote.audio.models.embedding.wespeaker.WeSpeakerResNet34
+  dither: 0.0
+  frame_length: 25
+  frame_shift: 10
   num_channels: 1
+  num_mel_bins: 80
   sample_rate: 16000
+  use_energy: false
+  window_type: hamming

pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:cf667e302cb3ad72316803868e2cf007d35d506e4ac6daafdd527dfd69f3fa72
-size 5912144

 version https://git-lfs.github.com/spec/v1
+oid sha256:c6ebcd5526d688deb24b12eaae4774a6d8337c22bf7b7f25c1eaa1c345f6cae5
+size 26644594