mms-tts-grc / vocab.json
sanchit-gandhi's picture
Upload tokenizer
4b450eb
{
" ": 31,
"'": 81,
"-": 21,
"_": 118,
"ΐ": 37,
"ά": 12,
"έ": 15,
"ή": 70,
"ί": 90,
"ΰ": 27,
"α": 102,
"β": 46,
"γ": 20,
"δ": 87,
"ε": 96,
"ζ": 73,
"η": 19,
"θ": 9,
"ι": 91,
"κ": 24,
"λ": 39,
"μ": 26,
"ν": 99,
"ξ": 22,
"ο": 77,
"π": 14,
"ρ": 2,
"ς": 23,
"σ": 56,
"τ": 44,
"υ": 40,
"φ": 69,
"χ": 55,
"ψ": 5,
"ω": 106,
"ϊ": 103,
"ϋ": 94,
"ό": 83,
"ύ": 72,
"ώ": 114,
"ἀ": 54,
"ἁ": 41,
"ἂ": 76,
"ἃ": 88,
"ἄ": 7,
"ἅ": 57,
"ἆ": 48,
"ἐ": 53,
"ἑ": 60,
"ἓ": 47,
"ἔ": 32,
"ἕ": 85,
"ἠ": 86,
"ἡ": 92,
"ἢ": 16,
"ἣ": 78,
"ἤ": 0,
"ἥ": 111,
"ἦ": 59,
"ἧ": 45,
"ἰ": 79,
"ἱ": 52,
"ἳ": 84,
"ἴ": 109,
"ἵ": 107,
"ἶ": 6,
"ἷ": 61,
"ὀ": 95,
"ὁ": 67,
"ὃ": 97,
"ὄ": 35,
"ὅ": 43,
"ὐ": 93,
"ὑ": 10,
"ὒ": 25,
"ὓ": 28,
"ὔ": 42,
"ὕ": 110,
"ὖ": 80,
"ὗ": 3,
"ὠ": 29,
"ὡ": 1,
"ὢ": 8,
"ὤ": 75,
"ὥ": 100,
"ὦ": 113,
"ὧ": 74,
"ὰ": 71,
"ὲ": 112,
"ὴ": 105,
"ὶ": 34,
"ὸ": 33,
"ὺ": 117,
"ὼ": 30,
"ᾄ": 58,
"ᾅ": 18,
"ᾐ": 108,
"ᾑ": 50,
"ᾔ": 104,
"ᾖ": 98,
"ᾗ": 49,
"ᾠ": 17,
"ᾧ": 4,
"ᾳ": 38,
"ᾶ": 36,
"ᾷ": 115,
"ῃ": 116,
"ῄ": 63,
"ῆ": 51,
"ῇ": 13,
"ῒ": 62,
"ῖ": 65,
"ῥ": 68,
"ῦ": 101,
"ῳ": 64,
"ῴ": 89,
"ῶ": 82,
"ῷ": 66,
"–": 11
}