AlexN committed
Commit 6c5f6a4
1 Parent(s): 7132467
Files changed (2)
  1. eval.py +1 -1
  2. run_speech_recognition_ctc.py +1 -1
eval.py CHANGED
@@ -102,7 +102,7 @@ def main(args):
     # map function to decode audio
     def map_to_pred(batch):
         prediction = asr(
-            batch["audio"]["array"], chunk_length_s=args.chunk_length_s, stride_length_s=args.stride_length_s,,skip_special_tokens=True
+            batch["audio"]["array"], chunk_length_s=args.chunk_length_s, stride_length_s=args.stride_length_s
         )
 
         batch["prediction"] = prediction["text"]# "".join(prediction["text"].split("<s>"))
run_speech_recognition_ctc.py CHANGED
@@ -643,7 +643,7 @@ def main():
 
         pred.label_ids[pred.label_ids == -100] = tokenizer.pad_token_id
 
-        pred_str = tokenizer.batch_decode(pred_ids, skip_special_tokens=True)
+        pred_str = tokenizer.batch_decode(pred_ids)
         # we do not want to group tokens when computing the metrics
         label_str = tokenizer.batch_decode(pred.label_ids, group_tokens=False)
 
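For context, a hedged sketch of the `compute_metrics` function these lines typically sit in, following the structure of the standard `run_speech_recognition_ctc.py` example; `tokenizer` and `eval_metrics` are assumed to be defined in the surrounding script, and the metric wiring is illustrative rather than taken from this commit.

```python
import numpy as np

def compute_metrics(pred):
    # Greedy CTC decoding: take the argmax token id at every frame.
    pred_ids = np.argmax(pred.predictions, axis=-1)

    # Labels padded with -100 for the loss are mapped back to the pad token id before decoding.
    pred.label_ids[pred.label_ids == -100] = tokenizer.pad_token_id

    pred_str = tokenizer.batch_decode(pred_ids)
    # we do not want to group tokens when computing the metrics
    label_str = tokenizer.batch_decode(pred.label_ids, group_tokens=False)

    # `eval_metrics` is assumed to map names like "wer" to loaded metric objects.
    return {k: v.compute(predictions=pred_str, references=label_str) for k, v in eval_metrics.items()}
```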