nikhil6041 committed on
Commit
4a848a7
1 Parent(s): 618dc99

add tokenizer

Browse files
Files changed (1) hide show
  1. vocab.json +1 -1
vocab.json CHANGED
@@ -1 +1 @@
1
- {"": 0, "": 1, "": 2, "": 3, "": 4, "W": 5, "": 6, "": 7, "": 8, "": 9, "": 10, "": 11, "": 12, "": 13, "": 14, "l": 15, "": 16, "": 17, "": 18, "F": 19, ":": 20, "": 21, "": 22, "": 23, "": 24, "": 25, "": 26, "": 27, "": 28, "": 29, "-": 30, "i": 31, "": 32, "r": 33, "?": 34, "": 35, "!": 36, "": 37, "": 38, "": 39, "": 40, "a": 41, "": 42, "": 43, "": 44, "m": 45, "p": 46, "": 47, "": 48, ",": 49, "": 50, "": 51, "": 52, "": 53, "\"": 54, "": 55, "'": 56, "": 57, "": 58, "": 59, ".": 60, "": 61, "": 62, "": 63, "ि": 64, "": 65, "": 66, "": 67, "": 68, "e": 69, "": 70, "u": 71, "": 72, "": 73, "": 74, "M": 75, "": 76, "": 77, "": 79, "|": 78, "[UNK]": 80, "[PAD]": 81}
 
1
+ {"": 0, "l": 1, "": 2, "!": 3, "p": 4, "": 5, "": 6, "": 7, "": 8, "": 9, "F": 10, "": 11, "": 12, "": 13, "": 14, "": 15, "": 16, "": 17, "": 18, "": 19, "a": 20, "": 21, "": 22, "": 23, "u": 24, "": 25, "": 26, ",": 27, "": 28, "": 29, "": 30, "": 31, "": 32, "": 33, "": 34, ":": 35, "m": 36, "r": 37, "": 38, ".": 39, "": 40, "": 41, "M": 42, "": 43, "": 44, "": 45, "": 46, "": 47, "": 48, "": 49, "": 50, "": 51, "": 52, "?": 53, "": 54, "i": 55, "": 56, "": 57, "": 58, "e": 59, "": 60, "'": 61, "": 62, "": 63, "-": 64, "ि": 65, "": 66, "": 67, "\"": 68, "W": 69, "": 70, "": 71, "": 72, "": 73, "": 74, "": 75, "": 76, "": 77, "": 78, "|": 79, "[UNK]": 80, "[PAD]": 81}