add tokenizer
Browse files- vocab.json +1 -1
vocab.json
CHANGED
@@ -1 +1 @@
|
|
1 |
-
{"
|
|
|
1 |
+
{"ऊ": 0, "g": 1, "ए": 2, "फ": 3, "क": 4, "श": 5, "f": 6, "t": 7, "व": 8, "क़": 9, "c": 10, "ट": 11, "ष": 12, "v": 13, "झ": 14, "ल": 15, "आ": 16, "j": 17, "ह": 18, "ृ": 19, "l": 20, "z": 21, "ू": 22, "a": 23, "अ": 24, "s": 25, "ॅ": 26, "ज़": 27, "o": 28, "ः": 29, "n": 30, "k": 31, "र": 32, "x": 33, "्": 34, "य": 35, "u": 36, "i": 37, "ढ": 38, "ा": 39, "r": 40, "इ": 41, "p": 42, "छ": 43, "ॉ": 44, "थ": 45, "ओ": 46, "े": 47, "च": 48, "ब": 49, "ऑ": 50, "m": 52, "ठ": 53, "ि": 54, "ख": 55, "ं": 56, "ु": 57, "ो": 58, "ौ": 59, "y": 60, "उ": 61, "न": 62, "ज": 63, "ण": 64, "ड़": 65, "w": 66, "ञ": 67, "द": 68, "त": 69, "e": 70, "ध": 71, "'": 72, "़": 73, "ग": 74, "म": 75, "ऋ": 76, "ी": 77, "भ": 78, "प": 79, "d": 80, "ै": 81, "ऐ": 82, "ग़": 83, "घ": 84, "ई": 85, "ँ": 86, "स": 87, "h": 88, "औ": 89, "ढ़": 90, "b": 91, "ड": 92, "|": 51, "[UNK]": 93, "[PAD]": 94}
|