Adding new scores

Files changed (4)

NbAiLab_NPSC_16K_mp3_test_eval_results.txt CHANGED Viewed

eval.py CHANGED Viewed

@@ -65,6 +65,7 @@ def normalize_text(text: str) -> str:
     text = re.sub('<ee>', 'eee', text)
     text = re.sub('<qq>', 'qqq', text)
     text = re.sub('<mm>', 'mmm', text)
     text = re.sub('[<>]', '', text)
     # # In addition, we can normalize the target text, e.g. removing newline characters etc...
@@ -80,6 +81,7 @@ def normalize_text(text: str) -> str:
 def main(args):
     # load dataset
     dataset = load_dataset(args.dataset, args.config, split=args.split, use_auth_token=True)
     # for testing: only process the first ten examples as a test
     # dataset = dataset.select(range(10))

     text = re.sub('<ee>', 'eee', text)
     text = re.sub('<qq>', 'qqq', text)
     text = re.sub('<mm>', 'mmm', text)
+    text = re.sub('<inaudible>', 'xxx', text)
     text = re.sub('[<>]', '', text)
     # # In addition, we can normalize the target text, e.g. removing newline characters etc...
 def main(args):
     # load dataset
     dataset = load_dataset(args.dataset, args.config, split=args.split, use_auth_token=True)
+    #dataset = load_dataset(args.dataset, args.config, split=args.split, use_auth_token=True).filter(lambda entry: re.search("nb-nn", entry["sentence_language_code"], flags=re.IGNORECASE))
     # for testing: only process the first ten examples as a test
     # dataset = dataset.select(range(10))

log_NbAiLab_NPSC_16K_mp3_test_predictions.txt CHANGED Viewed

The diff for this file is too large to render. See raw diff

log_NbAiLab_NPSC_16K_mp3_test_targets.txt CHANGED Viewed

The diff for this file is too large to render. See raw diff