PereLluis13 committed on
Commit
ed38cca
1 Parent(s): abcd896

Update README.md

Browse files
Files changed (1) hide show
  1. README.md +3 -2
README.md CHANGED
@@ -80,14 +80,15 @@ from datasets import load_dataset, load_metric
80
  from transformers import Wav2Vec2ForCTC, Wav2Vec2Processor
81
  import re
82
 
83
- test_dataset = load_dataset("common_voice", "el", split="test") #TODO: replace {lang_id} in your language code here. Make sure the code is one of the *ISO codes* of [this](https://huggingface.co/languages) site.
84
  wer = load_metric("wer")
85
 
86
  processor = Wav2Vec2Processor.from_pretrained("PereLluis13/wav2vec2-large-xlsr-53-greek")
87
  model = Wav2Vec2ForCTC.from_pretrained("PereLluis13/wav2vec2-large-xlsr-53-greek")
88
  model.to("cuda")
89
 
90
- chars_to_ignore_regex = '[\\\\\\\\,\\\\\\\\?\\\\\\\\.\\\\\\\\!\\\\\\\\-\\\\\\\\;\\\\\\\\:\\\\\\\\"\\\\\\\\“\\\\\\\\%\\\\\\\\'\\\\\\\\�]'
 
91
 
92
  resampler = torchaudio.transforms.Resample(48_000, 16_000)
93
 
80
  from transformers import Wav2Vec2ForCTC, Wav2Vec2Processor
81
  import re
82
 
83
+ test_dataset = load_dataset("common_voice", "el", split="test")
84
  wer = load_metric("wer")
85
 
86
  processor = Wav2Vec2Processor.from_pretrained("PereLluis13/wav2vec2-large-xlsr-53-greek")
87
  model = Wav2Vec2ForCTC.from_pretrained("PereLluis13/wav2vec2-large-xlsr-53-greek")
88
  model.to("cuda")
89
 
90
+ chars_to_ignore_regex = '[\\\\,\\\\?\\\\.\\\\!\\\\-\\\\;\\\\:\\\\"\\\\“\\\\%\\\\‘\\\\”\\\\�]'
91
+
92
 
93
  resampler = torchaudio.transforms.Resample(48_000, 16_000)
94