Upload tokenizer
32b9d91
verified
|
{ |
|
"\t": 0, |
|
"0": 1, |
|
"1": 2, |
|
"2": 3, |
|
"3": 4, |
|
"4": 5, |
|
"5": 6, |
|
"6": 7, |
|
"7": 8, |
|
"8": 9, |
|
"9": 10, |
|
"[PAD]": 61, |
|
"[UNK]": 60, |
|
"|": 11, |
|
"ஃ": 12, |
|
"அ": 13, |
|
"ஆ": 14, |
|
"இ": 15, |
|
"ஈ": 16, |
|
"உ": 17, |
|
"ஊ": 18, |
|
"எ": 19, |
|
"ஏ": 20, |
|
"ஐ": 21, |
|
"ஒ": 22, |
|
"ஓ": 23, |
|
"க": 24, |
|
"ங": 25, |
|
"ச": 26, |
|
"ஜ": 27, |
|
"ஞ": 28, |
|
"ட": 29, |
|
"ண": 30, |
|
"த": 31, |
|
"ந": 32, |
|
"ன": 33, |
|
"ப": 34, |
|
"ம": 35, |
|
"ய": 36, |
|
"ர": 37, |
|
"ற": 38, |
|
"ல": 39, |
|
"ள": 40, |
|
"ழ": 41, |
|
"வ": 42, |
|
"ஷ": 43, |
|
"ஸ": 44, |
|
"ஹ": 45, |
|
"ா": 46, |
|
"ி": 47, |
|
"ீ": 48, |
|
"ு": 49, |
|
"ூ": 50, |
|
"ெ": 51, |
|
"ே": 52, |
|
"ை": 53, |
|
"ொ": 54, |
|
"ோ": 55, |
|
"ௌ": 56, |
|
"்": 57, |
|
"": 58, |
|
"…": 59 |
|
} |
|
|