yaswanth committed on
Commit
156f0af
1 Parent(s): 2788e80

add tokenizer

Browse files
Files changed (2) hide show
  1. added_tokens.json +1 -1
  2. vocab.json +1 -1
added_tokens.json CHANGED
@@ -1 +1 @@
1
- {"<s>": 95, "</s>": 96}
 
1
+ {"<s>": 98, "</s>": 99}
vocab.json CHANGED
@@ -1 +1 @@
1
- {"ऐ": 0, "e": 1, "ऊ": 2, "इ": 3, "ल": 4, "उ": 5, "ॉ": 6, "य": 7, "ः": 8, "ू": 9, "v": 10, "'": 11, "म": 12, "ऋ": 13, "ा": 14, "o": 15, "ँ": 16, "ज": 17, "औ": 18, "़": 20, "क़": 21, "ग": 22, "h": 23, "t": 24, "भ": 25, "ग़": 26, "घ": 27, "p": 28, "ध": 29, "र": 30, "w": 31, "ै": 32, "च": 33, "r": 34, "n": 35, "े": 36, "ठ": 37, "ढ": 38, "g": 39, "अ": 40, "ी": 41, "ड़": 42, "ओ": 43, "d": 44, "ण": 45, "क": 46, "": 47, "f": 48, "": 49, "": 50, "": 51, "s": 52, "j": 53, "i": 54, "": 55, "x": 56, "": 57, "": 58, "": 59, "": 60, "": 61, "": 62, "": 63, "ि": 64, "k": 65, "m": 66, "": 67, "": 68, "": 69, "l": 70, "b": 71, "": 72, "u": 73, "c": 74, "": 75, "": 76, "": 77, "": 78, "": 79, "": 80, "": 81, "y": 82, "z": 83, "": 84, "": 85, "": 86, "": 87, "": 88, "a": 89, "": 90, "": 91, "": 92, "|": 19, "[UNK]": 93, "[PAD]": 94}
 
1
+ {"ऐ": 0, "e": 1, "ऊ": 2, "इ": 3, "ल": 4, "उ": 5, "ॉ": 6, "य": 7, "ः": 8, "ू": 9, "v": 10, "'": 11, "म": 12, "ऋ": 13, "ा": 14, "o": 15, "ँ": 16, "ज": 17, "औ": 18, "़": 20, "क़": 21, "ग": 22, "h": 23, "t": 24, "भ": 25, "ग़": 26, "घ": 27, "p": 28, "ध": 29, "र": 30, "w": 31, "ै": 32, "च": 33, "r": 34, "n": 35, "े": 36, "ठ": 37, "ढ": 38, "g": 39, "अ": 40, "ी": 41, "ड़": 42, "ओ": 43, "d": 44, "ण": 45, "क": 46, "q": 47, "": 48, "f": 49, "": 50, "": 51, "": 52, "s": 53, "j": 54, "i": 55, "": 56, "x": 57, "": 58, "": 59, "": 60, "": 61, "": 62, "": 63, "": 64, "": 65, "ि": 66, "k": 67, "m": 68, "": 69, "": 70, "": 71, "l": 72, "b": 73, "": 74, "u": 75, "c": 76, "": 77, "": 78, "": 79, "": 80, "": 81, "": 82, "": 83, "": 84, "y": 85, "z": 86, "": 87, "": 88, "": 89, "": 90, "": 91, "a": 92, "ौ": 93, "व": 94, "ं": 95, "|": 19, "[UNK]": 96, "[PAD]": 97}