add tokenizer
Browse files- vocab.json +1 -1
vocab.json
CHANGED
@@ -1 +1 @@
|
|
1 |
-
{"
|
1 |
+
{"u": 0, "c": 1, "i": 2, "n": 3, "v": 4, "m": 5, "r": 6, "b": 7, "p": 8, "k": 9, "q": 10, "e": 11, "h": 12, "y": 13, "a": 15, "t": 16, "d": 17, "x": 18, "l": 19, "f": 20, "z": 21, "o": 22, "g": 23, "'": 24, "w": 25, "s": 26, "j": 27, "|": 14, "[UNK]": 28, "[PAD]": 29}
|