bakrianoo committed on
Commit
7aa1354
1 Parent(s): 6742ee9

fix a minor instruction

Browse files
Files changed (1) hide show
  1. README.md +6 -6
README.md CHANGED
@@ -80,8 +80,8 @@ resamplers = { # all three sampling rates exist in test split
80
  transformation = jiwer.Compose([
81
  # normalize some diacritics, remove punctuation, and replace Persian letters with Arabic ones
82
  jiwer.SubstituteRegexes({
83
- r'[auiFNKo\\\\~_،؟»\\\\?;:\\\\-,\\\\.؛«!"]': "", "\\\\u06D6": "",
84
- r"[\\\\|\\\\{]": "A", "p": "h", "ک": "k", "ی": "y"}),
85
  # default transformation below
86
  jiwer.RemoveMultipleSpaces(),
87
  jiwer.Strip(),
@@ -108,12 +108,12 @@ def predict(batch):
108
  # prepare the test dataset
109
  test_split = test_split.map(prepare_example)
110
 
111
- stt_models = {
112
  "elgeish/wav2vec2-large-xlsr-53-arabic",
113
  "othrif/wav2vec2-large-xlsr-arabic",
114
  "anas/wav2vec2-large-xlsr-arabic",
115
  "bakrianoo/sinai-voice-ar-stt"
116
- }
117
 
118
  stt_results = []
119
 
@@ -274,8 +274,8 @@ test_split = test_split.map(predict, batched=True, batch_size=16, remove_columns
274
  transformation = jiwer.Compose([
275
  # normalize some diacritics, remove punctuation, and replace Persian letters with Arabic ones
276
  jiwer.SubstituteRegexes({
277
- r'[auiFNKo\\\\\\\\~_،؟»\\\\\\\\?;:\\\\\\\\-,\\\\\\\\.؛«!"]': "", "\\\\\\\\u06D6": "",
278
- r"[\\\\\\\\|\\\\\\\\{]": "A", "p": "h", "ک": "k", "ی": "y"}),
279
  # default transformation below
280
  jiwer.RemoveMultipleSpaces(),
281
  jiwer.Strip(),
 
80
  transformation = jiwer.Compose([
81
  # normalize some diacritics, remove punctuation, and replace Persian letters with Arabic ones
82
  jiwer.SubstituteRegexes({
83
+ r'[auiFNKo\\\\\\\\~_،؟»\\\\\\\\?;:\\\\\\\\-,\\\\\\\\.؛«!"]': "", "\\\\\\\\u06D6": "",
84
+ r"[\\\\\\\\|\\\\\\\\{]": "A", "p": "h", "ک": "k", "ی": "y"}),
85
  # default transformation below
86
  jiwer.RemoveMultipleSpaces(),
87
  jiwer.Strip(),
 
108
  # prepare the test dataset
109
  test_split = test_split.map(prepare_example)
110
 
111
+ stt_models = [
112
  "elgeish/wav2vec2-large-xlsr-53-arabic",
113
  "othrif/wav2vec2-large-xlsr-arabic",
114
  "anas/wav2vec2-large-xlsr-arabic",
115
  "bakrianoo/sinai-voice-ar-stt"
116
+ ]
117
 
118
  stt_results = []
119
 
 
274
  transformation = jiwer.Compose([
275
  # normalize some diacritics, remove punctuation, and replace Persian letters with Arabic ones
276
  jiwer.SubstituteRegexes({
277
+ r'[auiFNKo\\\\\\\\\\\\\\\\~_،؟»\\\\\\\\\\\\\\\\?;:\\\\\\\\\\\\\\\\-,\\\\\\\\\\\\\\\\.؛«!"]': "", "\\\\\\\\\\\\\\\\u06D6": "",
278
+ r"[\\\\\\\\\\\\\\\\|\\\\\\\\\\\\\\\\{]": "A", "p": "h", "ک": "k", "ی": "y"}),
279
  # default transformation below
280
  jiwer.RemoveMultipleSpaces(),
281
  jiwer.Strip(),