jawaharreddy247 committed on
Commit
ecef9a7
1 Parent(s): 5b3ac10

add tokenizer

Browse files
Files changed (1) hide show
  1. vocab.json +1 -1
vocab.json CHANGED
@@ -1 +1 @@
1
- {"": 0, "": 1, "": 2, "": 3, "": 4, "": 5, "": 6, "": 7, "": 8, "f": 9, "": 10, "": 11, "": 12, "": 13, "": 14, "": 15, "": 16, "p": 17, "": 18, "": 19, "": 20, "": 21, "ि": 22, "": 23, "": 24, "": 25, "": 26, "e": 27, "": 28, "u": 29, "": 30, "w": 31, "": 32, "m": 33, "r": 34, "": 35, "": 36, "": 37, "": 38, "": 39, "": 41, "i": 42, "": 43, "": 44, "": 45, "": 46, "": 47, "": 48, "a": 49, "": 50, "": 51, "": 52, "": 53, "": 54, "": 55, "l": 56, "": 57, "": 58, "'": 59, "": 60, "": 61, "": 62, "": 63, "": 64, "": 65, "": 66, "़": 67, "": 68, "": 69, "": 70, "": 71, "|": 40, "[UNK]": 72, "[PAD]": 73}
1
+ {"": 0, "": 1, "": 2, "p": 3, "": 4, "": 5, "": 6, "r": 7, "a": 8, "e": 9, "": 10, "": 11, "": 12, "": 13, "": 14, "": 15, "": 16, "": 17, "": 18, "": 19, "": 20, "'": 21, "": 22, "": 23, "": 24, "": 25, "": 26, "": 27, "w": 29, "ि": 30, "": 31, "": 32, "": 33, "": 34, "": 35, "": 36, "": 37, "": 38, "": 39, "": 40, "।": 41, "f": 42, "": 43, "": 44, "": 45, "": 46, "": 47, "": 48, "": 49, "": 50, "": 51, "u": 52, "m": 53, "": 54, "": 55, "": 56, "": 57, "": 58, "": 59, "": 60, "i": 61, "": 62, "l": 63, "": 64, "": 65, "": 66, "़": 67, "": 68, "": 69, "": 70, "": 71, "|": 28}