Update eval.py
Browse files
eval.py
CHANGED
@@ -130,9 +130,9 @@ def normalize_text(original_text: str, dataset: str) -> str:
|
|
130 |
text = re.sub('[úùüû]', 'u', text)
|
131 |
text = re.sub('[«»]', '', text)
|
132 |
text = re.sub('\s+', ' ', text)
|
133 |
-
text = re.sub('<
|
134 |
-
text = re.sub('<
|
135 |
-
text = re.sub('<
|
136 |
text = re.sub('<inaudible>', 'xxx', text)
|
137 |
text = re.sub('[<>]', '', text)
|
138 |
|
|
|
130 |
text = re.sub('[úùüû]', 'u', text)
|
131 |
text = re.sub('[«»]', '', text)
|
132 |
text = re.sub('\s+', ' ', text)
|
133 |
+
text = re.sub('<e+h?>', 'eee', text)
|
134 |
+
text = re.sub('<m+>', 'mmm', text)
|
135 |
+
text = re.sub('<q+>', 'qqq', text)
|
136 |
text = re.sub('<inaudible>', 'xxx', text)
|
137 |
text = re.sub('[<>]', '', text)
|
138 |
|