m3hrdadfi
/

wav2vec2-large-xlsr-estonian

Automatic Speech Recognition

xlsr-fine-tuning-week

Inference Endpoints

Model card · Files and versions · Community

m3hrdadfi committed on Mar 28, 2021

Commit

52e3b9f

·

1 Parent(s): 74340bf

Update README.md

Files changed (1) hide show

README.md +6 -6

README.md CHANGED Viewed

@@ -26,7 +26,7 @@ model-index:
     metrics:
        - name: Test WER
          type: wer
-         value: 33.73
 ---
@@ -68,7 +68,7 @@ chars_to_ignore = [
     "“", "%", "‘", "�", "–", "…", "_", "”", '“', '„'
 ]
 chars_to_mapping = {
-"\\u200c": " ", "\\u200d": " ", "\\u200e": " ", "\\u200f": " ", "\\ufeff": " ",
 }
 def multiple_replace(text, chars_to_mapping):
@@ -83,7 +83,7 @@ def normalizer(batch, chars_to_ignore, chars_to_mapping):
     chars_to_ignore_regex = f"""[{"".join(chars_to_ignore)}]"""
     text = batch["sentence"].lower().strip()
-    text = text.replace("\\u0307", " ").strip()
     text = multiple_replace(text, chars_to_mapping)
     text = remove_special_characters(text, chars_to_ignore_regex)
@@ -194,7 +194,7 @@ chars_to_ignore = [
     "“", "%", "‘", "�", "–", "…", "_", "”", '“', '„'
 ]
 chars_to_mapping = {
-    "\\u200c": " ", "\\u200d": " ", "\\u200e": " ", "\\u200f": " ", "\\ufeff": " ",
 }
 def multiple_replace(text, chars_to_mapping):
@@ -209,7 +209,7 @@ def normalizer(batch, chars_to_ignore, chars_to_mapping):
     chars_to_ignore_regex = f"""[{"".join(chars_to_ignore)}]"""
     text = batch["sentence"].lower().strip()
-    text = text.replace("\\u0307", " ").strip()
     text = multiple_replace(text, chars_to_mapping)
     text = remove_special_characters(text, chars_to_ignore_regex)
@@ -261,7 +261,7 @@ print("WER: {:.2f}".format(100 * wer.compute(predictions=result["predicted"], re
 ```
 **Test Result**:
-- WER: 33.73%
 ## Training & Report

     metrics:
        - name: Test WER
          type: wer
+         value: 33.93
 ---
     "“", "%", "‘", "�", "–", "…", "_", "”", '“', '„'
 ]
 chars_to_mapping = {
+"\\\\u200c": " ", "\\\\u200d": " ", "\\\\u200e": " ", "\\\\u200f": " ", "\\\\ufeff": " ",
 }
 def multiple_replace(text, chars_to_mapping):
     chars_to_ignore_regex = f"""[{"".join(chars_to_ignore)}]"""
     text = batch["sentence"].lower().strip()
+    text = text.replace("\\\\u0307", " ").strip()
     text = multiple_replace(text, chars_to_mapping)
     text = remove_special_characters(text, chars_to_ignore_regex)
     "“", "%", "‘", "�", "–", "…", "_", "”", '“', '„'
 ]
 chars_to_mapping = {
+    "\\\\u200c": " ", "\\\\u200d": " ", "\\\\u200e": " ", "\\\\u200f": " ", "\\\\ufeff": " ",
 }
 def multiple_replace(text, chars_to_mapping):
     chars_to_ignore_regex = f"""[{"".join(chars_to_ignore)}]"""
     text = batch["sentence"].lower().strip()
+    text = text.replace("\\\\u0307", " ").strip()
     text = multiple_replace(text, chars_to_mapping)
     text = remove_special_characters(text, chars_to_ignore_regex)
 ```
 **Test Result**:
+- WER: 33.93%
 ## Training & Report