bakrianoo committed on
Commit
6742ee9
1 Parent(s): aba15e5

Update Benchmark Table

Browse files
Files changed (1) hide show
  1. README.md +13 -13
README.md CHANGED
@@ -41,15 +41,15 @@ Please install:
41
 
42
  We evaluated the model against different Arabic-STT Wav2Vec models.
43
 
44
- | | model | using_transliation | WER |
45
- |---:|:--------------------------------------|:---------------------|---------:|
46
- | 0 | bakrianoo/sinai-voice-ar-stt | True | 0.238001 |
47
- | 1 | elgeish/wav2vec2-large-xlsr-53-arabic | True | 0.266527 |
48
- | 2 | othrif/wav2vec2-large-xlsr-arabic | True | 0.298122 |
49
- | 3 | bakrianoo/sinai-voice-ar-stt | False | 0.448987 |
50
- | 4 | othrif/wav2vec2-large-xlsr-arabic | False | 0.464004 |
51
- | 5 | anas/wav2vec2-large-xlsr-arabic | True | 0.506191 |
52
- | 6 | anas/wav2vec2-large-xlsr-arabic | False | 0.622288 |
53
 
54
 
55
  <details>
@@ -80,8 +80,8 @@ resamplers = { # all three sampling rates exist in test split
80
  transformation = jiwer.Compose([
81
  # normalize some diacritics, remove punctuation, and replace Persian letters with Arabic ones
82
  jiwer.SubstituteRegexes({
83
- r'[auiFNKo\\~_،؟»\\?;:\\-,\\.؛«!"]': "", "\\u06D6": "",
84
- r"[\\|\\{]": "A", "p": "h", "ک": "k", "ی": "y"}),
85
  # default transformation below
86
  jiwer.RemoveMultipleSpaces(),
87
  jiwer.Strip(),
@@ -274,8 +274,8 @@ test_split = test_split.map(predict, batched=True, batch_size=16, remove_columns
274
  transformation = jiwer.Compose([
275
  # normalize some diacritics, remove punctuation, and replace Persian letters with Arabic ones
276
  jiwer.SubstituteRegexes({
277
- r'[auiFNKo\\\\~_،؟»\\\\?;:\\\\-,\\\\.؛«!"]': "", "\\\\u06D6": "",
278
- r"[\\\\|\\\\{]": "A", "p": "h", "ک": "k", "ی": "y"}),
279
  # default transformation below
280
  jiwer.RemoveMultipleSpaces(),
281
  jiwer.Strip(),
 
41
 
42
  We evaluated the model against different Arabic-STT Wav2Vec models.
43
 
44
+ | | Model | [using transliteration](https://pypi.org/project/lang-trans/) | WER | Train Datasets |
45
+ |---:|:--------------------------------------|:---------------------|---------:|:---------|
46
+ | 1 | bakrianoo/sinai-voice-ar-stt | True | 0.238001 |Common Voice 6|
47
+ | 2 | elgeish/wav2vec2-large-xlsr-53-arabic | True | 0.266527 |Common Voice 6 + Arabic Speech Corpus|
48
+ | 3 | othrif/wav2vec2-large-xlsr-arabic | True | 0.298122 |Common Voice 6|
49
+ | 4 | bakrianoo/sinai-voice-ar-stt | False | 0.448987 |Common Voice 6|
50
+ | 5 | othrif/wav2vec2-large-xlsr-arabic | False | 0.464004 |Common Voice 6|
51
+ | 6 | anas/wav2vec2-large-xlsr-arabic | True | 0.506191 |Common Voice 4|
52
+ | 7 | anas/wav2vec2-large-xlsr-arabic | False | 0.622288 |Common Voice 4|
53
 
54
 
55
  <details>
 
80
  transformation = jiwer.Compose([
81
  # normalize some diacritics, remove punctuation, and replace Persian letters with Arabic ones
82
  jiwer.SubstituteRegexes({
83
+ r'[auiFNKo\\\\~_،؟»\\\\?;:\\\\-,\\\\.؛«!"]': "", "\\\\u06D6": "",
84
+ r"[\\\\|\\\\{]": "A", "p": "h", "ک": "k", "ی": "y"}),
85
  # default transformation below
86
  jiwer.RemoveMultipleSpaces(),
87
  jiwer.Strip(),
 
274
  transformation = jiwer.Compose([
275
  # normalize some diacritics, remove punctuation, and replace Persian letters with Arabic ones
276
  jiwer.SubstituteRegexes({
277
+ r'[auiFNKo\\\\\\\\~_،؟»\\\\\\\\?;:\\\\\\\\-,\\\\\\\\.؛«!"]': "", "\\\\\\\\u06D6": "",
278
+ r"[\\\\\\\\|\\\\\\\\{]": "A", "p": "h", "ک": "k", "ی": "y"}),
279
  # default transformation below
280
  jiwer.RemoveMultipleSpaces(),
281
  jiwer.Strip(),