Merge branch 'main' of https://huggingface.co/othrif/wav2vec2-large-xlsr-arabic into main
Browse files
README.md
CHANGED
@@ -11,7 +11,7 @@ tags:
|
|
11 |
- xlsr-fine-tuning-week
|
12 |
license: apache-2.0
|
13 |
model-index:
|
14 |
-
- name:
|
15 |
results:
|
16 |
- task:
|
17 |
name: Speech Recognition
|
@@ -87,7 +87,7 @@ processor = Wav2Vec2Processor.from_pretrained("othrif/wav2vec2-large-xlsr-arabic
|
|
87 |
model = Wav2Vec2ForCTC.from_pretrained("othrif/wav2vec2-large-xlsr-arabic")
|
88 |
model.to("cuda")
|
89 |
|
90 |
-
chars_to_ignore_regex = '[
|
91 |
resampler = torchaudio.transforms.Resample(48_000, 16_000)
|
92 |
|
93 |
# Preprocessing the datasets.
|
|
|
11 |
- xlsr-fine-tuning-week
|
12 |
license: apache-2.0
|
13 |
model-index:
|
14 |
+
- name: XLSR Wav2Vec2 Arabic by Othmane Rifki
|
15 |
results:
|
16 |
- task:
|
17 |
name: Speech Recognition
|
|
|
87 |
model = Wav2Vec2ForCTC.from_pretrained("othrif/wav2vec2-large-xlsr-arabic")
|
88 |
model.to("cuda")
|
89 |
|
90 |
+
chars_to_ignore_regex = '[\\\\\\\\؛\\\\\\\\—\\\\\\\\_get\\\\\\\\«\\\\\\\\»\\\\\\\\ـ\\\\\\\\ـ\\\\\\\\,\\\\\\\\?\\\\\\\\.\\\\\\\\!\\\\\\\\-\\\\\\\\;\\\\\\\\:\\\\\\\\"\\\\\\\\“\\\\\\\\%\\\\\\\\‘\\\\\\\\”\\\\\\\\�\\\\\\\\#\\\\\\\\،\\\\\\\\☭,\\\\\\\\؟]'
|
91 |
resampler = torchaudio.transforms.Resample(48_000, 16_000)
|
92 |
|
93 |
# Preprocessing the datasets.
|