Upload tokenizer
1cf75ac
verified
|
{ |
|
"\t": 0, |
|
"[PAD]": 77, |
|
"[UNK]": 76, |
|
"|": 1, |
|
"ං": 2, |
|
"ඃ": 3, |
|
"අ": 4, |
|
"ආ": 5, |
|
"ඇ": 6, |
|
"ඈ": 7, |
|
"ඉ": 8, |
|
"ඊ": 9, |
|
"උ": 10, |
|
"ඌ": 11, |
|
"ඍ": 12, |
|
"එ": 13, |
|
"ඒ": 14, |
|
"ඓ": 15, |
|
"ඔ": 16, |
|
"ඕ": 17, |
|
"ඖ": 18, |
|
"ක": 19, |
|
"ඛ": 20, |
|
"ග": 21, |
|
"ඝ": 22, |
|
"ඞ": 23, |
|
"ඟ": 24, |
|
"ච": 25, |
|
"ඡ": 26, |
|
"ජ": 27, |
|
"ඤ": 28, |
|
"ඥ": 29, |
|
"ට": 30, |
|
"ඨ": 31, |
|
"ඩ": 32, |
|
"ඪ": 33, |
|
"ණ": 34, |
|
"ඬ": 35, |
|
"ත": 36, |
|
"ථ": 37, |
|
"ද": 38, |
|
"ධ": 39, |
|
"න": 40, |
|
"ඳ": 41, |
|
"ප": 42, |
|
"ඵ": 43, |
|
"බ": 44, |
|
"භ": 45, |
|
"ම": 46, |
|
"ඹ": 47, |
|
"ය": 48, |
|
"ර": 49, |
|
"ල": 50, |
|
"ව": 51, |
|
"ශ": 52, |
|
"ෂ": 53, |
|
"ස": 54, |
|
"හ": 55, |
|
"ළ": 56, |
|
"ෆ": 57, |
|
"්": 58, |
|
"ා": 59, |
|
"ැ": 60, |
|
"ෑ": 61, |
|
"ි": 62, |
|
"ී": 63, |
|
"ු": 64, |
|
"ූ": 65, |
|
"ෘ": 66, |
|
"ෙ": 67, |
|
"ේ": 68, |
|
"ෛ": 69, |
|
"ො": 70, |
|
"ෝ": 71, |
|
"ෞ": 72, |
|
"ෲ": 73, |
|
"": 74, |
|
"": 75 |
|
} |
|
|