Upload tokenizer
b54a4ac
verified
|
{ |
|
"&": 1, |
|
"(": 2, |
|
")": 3, |
|
"[PAD]": 65, |
|
"[UNK]": 64, |
|
"_": 4, |
|
"`": 5, |
|
"|": 0, |
|
"·": 6, |
|
"ஃ": 7, |
|
"அ": 8, |
|
"ஆ": 9, |
|
"இ": 10, |
|
"ஈ": 11, |
|
"உ": 12, |
|
"ஊ": 13, |
|
"எ": 14, |
|
"ஏ": 15, |
|
"ஐ": 16, |
|
"ஒ": 17, |
|
"ஓ": 18, |
|
"ஔ": 19, |
|
"க": 20, |
|
"ங": 21, |
|
"ச": 22, |
|
"ஜ": 23, |
|
"ஞ": 24, |
|
"ட": 25, |
|
"ண": 26, |
|
"த": 27, |
|
"ந": 28, |
|
"ன": 29, |
|
"ப": 30, |
|
"ம": 31, |
|
"ய": 32, |
|
"ர": 33, |
|
"ற": 34, |
|
"ல": 35, |
|
"ள": 36, |
|
"ழ": 37, |
|
"வ": 38, |
|
"ஷ": 39, |
|
"ஸ": 40, |
|
"ஹ": 41, |
|
"ா": 42, |
|
"ி": 43, |
|
"ீ": 44, |
|
"ு": 45, |
|
"ூ": 46, |
|
"ெ": 47, |
|
"ே": 48, |
|
"ை": 49, |
|
"ொ": 50, |
|
"ோ": 51, |
|
"ௌ": 52, |
|
"்": 53, |
|
"ௗ": 54, |
|
"ഥ": 55, |
|
"—": 56, |
|
"’": 57, |
|
"‚": 58, |
|
"•": 59, |
|
"…": 60, |
|
"′": 61, |
|
"″": 62, |
|
"◯": 63 |
|
} |
|
|