Updated the eval script and added the evaluation results

Files changed (4) hide show

eval.py CHANGED Viewed

@@ -50,9 +50,12 @@ def log_results(result: Dataset, args: Dict[str, str]):
 def normalize_text(text: str) -> str:
     """DO ADAPT FOR YOUR USE CASE. this function normalizes the target text."""
-    chars_to_ignore_regex = '[,?.!\-\;\:"“%‘”�—’…–]'  # noqa: W605 IMPORTANT: this should correspond to the chars that were ignored during training
     text = re.sub(chars_to_ignore_regex, "", text.lower())
     # In addition, we can normalize the target text, e.g. removing new lines characters etc...
     # note that order is important here!

 def normalize_text(text: str) -> str:
     """DO ADAPT FOR YOUR USE CASE. this function normalizes the target text."""
+    chars_to_ignore_regex = '[,?.!-;:""%\'"�\'‘’_，！łńō–—\\\\\\“”\\[\\]]'
     text = re.sub(chars_to_ignore_regex, "", text.lower())
+    text = re.sub(r'[‘’´`]', r"'", text)
+    text = re.sub(r'è', r"é", text)
+    text = re.sub(r"(-|' | '|  +)", " ", text)
     # In addition, we can normalize the target text, e.g. removing new lines characters etc...
     # note that order is important here!

log_mozilla-foundation_common_voice_7_0_id_test_predictions.txt ADDED Viewed

The diff for this file is too large to render. See raw diff

log_mozilla-foundation_common_voice_7_0_id_test_targets.txt ADDED Viewed

The diff for this file is too large to render. See raw diff

mozilla-foundation_common_voice_7_0_id_test_eval_results.txt ADDED Viewed