nvidia
/

stt_en_citrinet_1024_gamma_0_25

@@ -10,7 +10,6 @@ datasets:
 - WSJ-1
 - National Singapore Corpus Part 1
 - National Singapore Corpus Part 6
-- mozilla-foundation/common_voice_7_0
 thumbnail: null
 tags:
 - automatic-speech-recognition
@@ -45,7 +44,7 @@ model-index:
     metrics:
     - name: Test WER
       type: wer
-      value: 2.2
   - task:
       type: Automatic Speech Recognition
       name: automatic-speech-recognition
@@ -59,49 +58,7 @@ model-index:
     metrics:
     - name: Test WER
       type: wer
-      value: 4.3
-  - task:
-      type: Automatic Speech Recognition
-      name: automatic-speech-recognition
-    dataset:
-      name: Multilingual LibriSpeech
-      type: facebook/multilingual_librispeech
-      config: english
-      split: test
-      args:
-        language: en
-    metrics:
-    - name: Test WER
-      type: wer
-      value: 7.2
-  - task:
-      type: Automatic Speech Recognition
-      name: automatic-speech-recognition
-    dataset:
-      name: Mozilla Common Voice 7.0
-      type: mozilla-foundation/common_voice_7_0
-      config: en
-      split: test
-      args:
-        language: en
-    metrics:
-    - name: Test WER
-      type: wer
-      value: 8.0
-  - task:
-      type: Automatic Speech Recognition
-      name: automatic-speech-recognition
-    dataset:
-      name: Mozilla Common Voice 8.0
-      type: mozilla-foundation/common_voice_8_0
-      config: en
-      split: test
-      args:
-        language: en
-    metrics:
-    - name: Test WER
-      type: wer
-      value: 9.48
   - task:
       type: Automatic Speech Recognition
       name: automatic-speech-recognition
@@ -113,7 +70,7 @@ model-index:
     metrics:
     - name: Test WER
       type: wer
-      value: 2.0
   - task:
       type: Automatic Speech Recognition
       name: automatic-speech-recognition
@@ -125,7 +82,7 @@ model-index:
     metrics:
     - name: Test WER
       type: wer
-      value: 2.9
   - task:
       type: Automatic Speech Recognition
       name: automatic-speech-recognition
@@ -137,7 +94,7 @@ model-index:
     metrics:
     - name: Test WER
       type: wer
-      value: 7.0
 ---
 # NVIDIA Streaming Citrinet 1024 (en-US)
@@ -222,7 +179,6 @@ All the models in this collection are trained on a composite dataset (NeMo ASRSE
 - Switchboard-1 Dataset
 - WSJ-0 and WSJ-1
 - National Speech Corpus (Part 1, Part 6)
-- Mozilla Common Voice (v7.0)
 Note: older versions of the model may have been trained on a smaller set of datasets.

 - WSJ-1
 - National Singapore Corpus Part 1
 - National Singapore Corpus Part 6
 thumbnail: null
 tags:
 - automatic-speech-recognition
     metrics:
     - name: Test WER
       type: wer
+      value: 3.4
   - task:
       type: Automatic Speech Recognition
       name: automatic-speech-recognition
     metrics:
     - name: Test WER
       type: wer
+      value: 7.6
   - task:
       type: Automatic Speech Recognition
       name: automatic-speech-recognition
     metrics:
     - name: Test WER
       type: wer
+      value: 2.5
   - task:
       type: Automatic Speech Recognition
       name: automatic-speech-recognition
     metrics:
     - name: Test WER
       type: wer
+      value: 4.0
   - task:
       type: Automatic Speech Recognition
       name: automatic-speech-recognition
     metrics:
     - name: Test WER
       type: wer
+      value: 6.2
 ---
 # NVIDIA Streaming Citrinet 1024 (en-US)
 - Switchboard-1 Dataset
 - WSJ-0 and WSJ-1
 - National Speech Corpus (Part 1, Part 6)
 Note: older versions of the model may have been trained on a smaller set of datasets.