add models

Files changed (5)

export-onnx.py CHANGED Viewed

@@ -1,5 +1,7 @@
 #!/usr/bin/env python3
 from typing import Any, Dict
 import onnx
@@ -96,6 +98,20 @@ def main():
     receptive_field_size = int(model.receptive_field.duration * 16000)
     receptive_field_shift = int(model.receptive_field.step * 16000)
     meta_data = {
         "num_speakers": len(model.specifications.classes),
         "powerset_max_classes": model.specifications.powerset_max_classes,
@@ -108,9 +124,9 @@ def main():
         "version": "1",
         "model_author": "pyannote",
         "maintainer": "k2-fsa",
-        "url_1": "https://huggingface.co/pyannote/segmentation-3.0",
-        "url_2": "https://huggingface.co/csukuangfj/pyannote-models/tree/main/segmentation-3.0",
-        "license": "https://huggingface.co/pyannote/segmentation-3.0/blob/main/LICENSE",
     }
     add_meta_data(filename=filename, meta_data=meta_data)

 #!/usr/bin/env python3
+# Copyright      2024  Xiaomi Corp.        (authors: Fangjun Kuang)
+import os
 from typing import Any, Dict
 import onnx
     receptive_field_size = int(model.receptive_field.duration * 16000)
     receptive_field_shift = int(model.receptive_field.step * 16000)
+    is_revai = os.getenv("SHERPA_ONNX_IS_REVAI", "")
+    if is_revai == "":
+        url_1 = "https://huggingface.co/pyannote/segmentation-3.0"
+        url_2 = "https://huggingface.co/csukuangfj/pyannote-models/tree/main/segmentation-3.0"
+        license_url = (
+            "https://huggingface.co/pyannote/segmentation-3.0/blob/main/LICENSE"
+        )
+    else:
+        url_1 = "https://huggingface.co/Revai/reverb-diarization-v1"
+        url_2 = "https://huggingface.co/csukuangfj/sherpa-onnx-reverb-diarization-v1"
+        license_url = (
+            "https://huggingface.co/Revai/reverb-diarization-v1/blob/main/LICENSE"
+        )
     meta_data = {
         "num_speakers": len(model.specifications.classes),
         "powerset_max_classes": model.specifications.powerset_max_classes,
         "version": "1",
         "model_author": "pyannote",
         "maintainer": "k2-fsa",
+        "url_1": url_1,
+        "url_2": url_2,
+        "license": license_url,
     }
     add_meta_data(filename=filename, meta_data=meta_data)

model.int8.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:c0e83b2ca69b379eea37b80e2b739b1f6e43f3964c95aaac0bdeb5e2e225ec6e
-size 2415974

 version https://git-lfs.github.com/spec/v1
+oid sha256:eba77d4d983fd37d8cc0864b10b63bcd0c1864633b2917fb0d2aeb4b6055cf23
+size 2415969

model.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:d4d3926911a214a1e56df418f8d967f6dee3e139348a0738b6ef982fb3108fd4
-size 9512165

 version https://git-lfs.github.com/spec/v1
+oid sha256:08a5eb1dff82847656baa7bf022c85bd9c90dd5a6a1f1b06f3ebfca0482beb5a
+size 9512160

run.sh CHANGED Viewed

@@ -1,6 +1,8 @@
 #!/usr/bin/env bash
 # Copyright    2024  Xiaomi Corp.        (authors: Fangjun Kuang)
 set -ex
 function install_pyannote() {
   pip install pyannote.audio onnx onnxruntime

 #!/usr/bin/env bash
 # Copyright    2024  Xiaomi Corp.        (authors: Fangjun Kuang)
+export SHERPA_ONNX_IS_REVAI=1
 set -ex
 function install_pyannote() {
   pip install pyannote.audio onnx onnxruntime

speaker-diarization-torch.py CHANGED Viewed

@@ -1,4 +1,5 @@
 #!/usr/bin/env python3
 """
 Please refer to

 #!/usr/bin/env python3
+# Copyright      2024  Xiaomi Corp.        (authors: Fangjun Kuang)
 """
 Please refer to