yaswanth committed on
Commit
d68a397
1 Parent(s): 156f0af

add tokenizer

Browse files
Files changed (2) hide show
  1. added_tokens.json +1 -1
  2. vocab.json +1 -1
added_tokens.json CHANGED
@@ -1 +1 @@
1
- {"<s>": 98, "</s>": 99}
 
1
+ {"<s>": 95, "</s>": 96}
vocab.json CHANGED
@@ -1 +1 @@
1
- {"": 0, "e": 1, "": 2, "": 3, "": 4, "": 5, "": 6, "": 7, "": 8, "": 9, "v": 10, "'": 11, "": 12, "": 13, "": 14, "o": 15, "ँ": 16, "": 17, "": 18, "": 20, "": 21, "": 22, "h": 23, "t": 24, "": 25, "": 26, "": 27, "p": 28, "": 29, "": 30, "w": 31, "": 32, "": 33, "r": 34, "n": 35, "": 36, "": 37, "": 38, "g": 39, "": 40, "": 41, "": 42, "": 43, "d": 44, "": 45, "": 46, "q": 47, "": 48, "f": 49, "": 50, "": 51, "": 52, "s": 53, "j": 54, "i": 55, "": 56, "x": 57, "": 58, "": 59, "": 60, "": 61, "": 62, "": 63, "": 64, "": 65, "ि": 66, "k": 67, "m": 68, "": 69, "": 70, "": 71, "l": 72, "b": 73, "": 74, "u": 75, "c": 76, "": 77, "": 78, "": 79, "": 80, "": 81, "": 82, "": 83, "": 84, "y": 85, "z": 86, "": 87, "": 88, "": 89, "": 90, "": 91, "a": 92, "ौ": 93, "व": 94, "ं": 95, "|": 19, "[UNK]": 96, "[PAD]": 97}
 
1
+ {"": 0, "y": 1, "": 2, "": 3, "o": 4, "": 5, "": 6, "v": 7, "": 8, "": 10, "": 11, "": 12, "'": 13, "": 14, "": 15, "ँ": 16, "m": 17, "": 18, "": 19, "स": 20, "": 21, "d": 22, "": 23, "": 24, "": 25, "": 26, "": 27, "z": 28, "h": 29, "": 30, "": 31, "": 32, "e": 33, "": 34, "": 35, "": 36, "b": 37, "": 38, "p": 39, "": 40, "l": 41, "u": 42, "g": 43, "": 44, "n": 45, "s": 46, "": 47, "": 48, "": 49, "": 50, "": 51, "": 52, "": 53, "": 54, "t": 55, "k": 56, "": 57, "": 58, "": 59, "": 60, "": 61, "": 62, "": 63, "": 64, "i": 65, "": 66, "": 67, "f": 68, "": 69, "": 70, "a": 71, "j": 72, "ि": 73, "": 74, "": 75, "": 76, "w": 77, "": 78, "": 79, "": 80, "c": 81, "": 82, "": 83, "": 84, "": 85, "r": 86, "": 87, "x": 88, "": 89, "": 90, "": 91, "": 92, "|": 9, "[UNK]": 93, "[PAD]": 94}