Mahalakshmi
committed on
Commit
•
7446891
1
Parent(s):
1533a44
add tokenizer
Browse files- vocab.json +1 -1
vocab.json
CHANGED
@@ -1 +1 @@
|
|
1 |
-
{"
|
|
|
1 |
+
{"ீ": 0, "'": 1, "ு": 2, "த": 3, "ஞ": 4, "ி": 5, "ய": 6, "உ": 7, "ஒ": 8, "ை": 9, "ோ": 10, "ா": 11, "ஜ": 12, "ம": 13, "ஈ": 14, "ழ": 15, "ஏ": 16, "ல": 17, "ங": 18, "ள": 19, "ொ": 20, "ப": 21, "ஃ": 22, "ஆ": 23, "ூ": 24, "்": 25, "ௌ": 26, "ட": 27, "ஐ": 28, "அ": 29, "’": 30, "ெ": 31, "ற": 32, "ண": 33, "ச": 34, "வ": 35, "ஸ": 36, "ஔ": 37, "ன": 38, "ஷ": 39, "ஓ": 40, "ர": 41, "எ": 42, "ே": 44, "ஊ": 45, "ஹ": 46, "ந": 47, "இ": 48, "க": 49, "|": 43, "[UNK]": 50, "[PAD]": 51}
|