Elaine Mary Rose committed on
Commit
2c4f851
1 Parent(s): 076b4d0
preprocessor_config.json CHANGED
@@ -5,5 +5,6 @@
5
  "padding_side": "right",
6
  "padding_value": 0.0,
7
  "return_attention_mask": true,
8
- "sampling_rate": 16000
 
9
  }
 
5
  "padding_side": "right",
6
  "padding_value": 0.0,
7
  "return_attention_mask": true,
8
+ "sampling_rate": 16000,
9
+ "processor_class": "Wav2Vec2Processor"
10
  }
special_tokens_map.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"bos_token": "<s>", "eos_token": "</s>", "unk_token": "<unk>", "pad_token": "<pad>"}
tokenizer_config.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"unk_token": "<unk>", "bos_token": "<s>", "eos_token": "</s>", "pad_token": "<pad>", "do_lower_case": false, "word_delimiter_token": "|", "tokenizer_class": "Wav2Vec2CTCTokenizer"}
vocab.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"\u0d1c": 0, "\u0d1f": 1, "s": 2, "l": 3, "\u0d13": 4, "\u0d22": 5, "\u0d2d": 6, "v": 7, "\u0d27": 8, "\u0d18": 9, "\u0d07": 10, "g": 11, "\u0d41": 12, "k": 13, "\u0d15": 14, "\u0d1e": 15, "\u0d7a": 16, "e": 17, "y": 18, "\u0d08": 19, "\u0d23": 20, "\u0d2f": 21, "\u0d06": 22, "i": 23, "\u0d40": 24, "\u0d36": 25, "\u0d7c": 26, "\u0d35": 27, "\u0d7b": 28, "\u0d4a": 29, "j": 30, "\u0d0f": 31, "\u0d34": 32, "u": 33, "\u0d12": 34, "\u0d7d": 35, "\u0d42": 36, "r": 37, "t": 38, "\u0d43": 39, "\u0d2c": 40, "\u0d3f": 41, "d": 42, "\u0d28": 43, "a": 44, "\u0d46": 45, "\u0d31": 46, "\u0d17": 47, "q": 48, "\u0d7e": 49, "m": 50, "b": 51, "\u0d4b": 52, "x": 53, "\u0d48": 54, "\u0d1b": 55, "\u0d2b": 56, "\u0d1a": 57, "f": 58, "\u0d30": 59, "\u0d37": 60, "\u0d02": 61, "h": 62, "\u0d26": 64, "w": 65, "\u0d2a": 66, "c": 67, "n": 68, "\u0d24": 69, "\u0d39": 70, "\u0d0e": 71, "\u0d05": 72, "\u0d2e": 73, "\u0d33": 74, "o": 75, "\u0d09": 76, "\u0d20": 77, "\u0d25": 78, "\u0d4d": 79, "\u0d57": 80, "\u0d21": 81, "z": 82, "\u0d38": 83, "\u0d47": 84, "\u0d10": 85, "\u0d0a": 86, "p": 87, "\u0d19": 88, "\u0d3e": 89, "\u0d16": 90, "\u0d32": 91, "|": 63, "[UNK]": 92, "[PAD]": 93}