Jubliano's picture
Upload tokenizer
910bea4 verified
{
"added_tokens_decoder": {
"0": {
"content": "iɛ2",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"1": {
"content": "æiː",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"3": {
"content": "oe",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"4": {
"content": "əɪ",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"5": {
"content": "s.",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"6": {
"content": "iɑɜ",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"7": {
"content": "mʲ",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"9": {
"content": "y:",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"10": {
"content": "ɑ4",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"11": {
"content": "ẽ",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"12": {
"content": "oɜ",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"13": {
"content": "ɔɪ",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"15": {
"content": "th",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"17": {
"content": "onɡ5",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"18": {
"content": "i̪1",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"19": {
"content": "eɑ",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"20": {
"content": "ua1",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"21": {
"content": "ai̯",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"22": {
"content": "tɕ",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"23": {
"content": "ts.h",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"24": {
"content": "yː",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"26": {
"content": "dʰː",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"27": {
"content": "i̪ɜ",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"29": {
"content": "cʰ",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"30": {
"content": "o̞",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"31": {
"content": "dʒʲ",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"32": {
"content": "sʲ",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"34": {
"content": "aiɜ",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"35": {
"content": "ɕʲ",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"36": {
"content": "i.4",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"37": {
"content": "o4",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"38": {
"content": "ai2",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"41": {
"content": "ɖʰ",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"42": {
"content": "s̪",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"44": {
"content": "o1",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"45": {
"content": "ei2",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"46": {
"content": "ɑː",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"47": {
"content": "ph",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"48": {
"content": "tʃ",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"50": {
"content": "dʑ",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"51": {
"content": "ɪː",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"52": {
"content": "i̪5",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"53": {
"content": "aɨ",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"55": {
"content": "i̪2",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"57": {
"content": "i.5",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"58": {
"content": "a.ː",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"59": {
"content": "ɛ̃",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"60": {
"content": "ɡʰ",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"61": {
"content": "u4",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"62": {
"content": "oɪ",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"63": {
"content": "iou2",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"64": {
"content": "dZ",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"65": {
"content": "kː",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"66": {
"content": "ʒʲ",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"67": {
"content": "ɛɹ",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"69": {
"content": "kh",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"70": {
"content": "tɕh",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"71": {
"content": "iɛ1",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"73": {
"content": "bː",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"74": {
"content": "iɑ1",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"75": {
"content": "ɡː",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"79": {
"content": "ɹ̩",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"82": {
"content": "ər4",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"84": {
"content": "yɛ5",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"86": {
"content": "yi",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"87": {
"content": "eə",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"89": {
"content": "tʲ",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"90": {
"content": "t̪",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"93": {
"content": "o5",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"94": {
"content": "uo",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"95": {
"content": "uo5",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"96": {
"content": "yæ2",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"99": {
"content": "ai5",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"101": {
"content": "rʲ",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"102": {
"content": "iː1",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"103": {
"content": "ɯᵝɯᵝ",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"104": {
"content": "tʃʰ",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"107": {
"content": "au̯",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"108": {
"content": "a4",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"109": {
"content": "ã",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"110": {
"content": "tsʲ",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"111": {
"content": "uɪ",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"113": {
"content": "tʃː",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"115": {
"content": "õ",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"116": {
"content": "eʊ",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"118": {
"content": "dˤ",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"119": {
"content": "yɜ",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"120": {
"content": "ɪu",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"123": {
"content": "øi",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"124": {
"content": "iɛ4",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"126": {
"content": "ɑu5",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"127": {
"content": "aɪə",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"128": {
"content": "iouɜ",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"129": {
"content": "œ̃",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"130": {
"content": "a.",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"131": {
"content": "ɭʲ",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"134": {
"content": "oːɹ",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"135": {
"content": "u2",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"137": {
"content": "pʰ",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"138": {
"content": "aʊ",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"139": {
"content": "bʲ",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"141": {
"content": "iʊ",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"142": {
"content": "ɑ2",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"145": {
"content": "ei̯",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"146": {
"content": "ɯᵝ",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"147": {
"content": "ueiɜ",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"149": {
"content": "ə1",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"151": {
"content": "iɑ2",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"153": {
"content": "eː",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"155": {
"content": "yə2",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"156": {
"content": "ɟʰ",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"157": {
"content": "ei5",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"158": {
"content": "s^",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"159": {
"content": "xʲ",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"160": {
"content": "au",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"161": {
"content": "eɪ",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"162": {
"content": "ua2",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"163": {
"content": "iɛ5",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"164": {
"content": "aɪɚ",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"167": {
"content": "i.ɜ",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"168": {
"content": "ua4",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"169": {
"content": "ɔː",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"170": {
"content": "o̞o̞",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"171": {
"content": "ɐ̃",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"174": {
"content": "iou4",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"175": {
"content": "ou5",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"177": {
"content": "pː",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"179": {
"content": "ɵː",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"180": {
"content": "pf",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"181": {
"content": "əː1",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"183": {
"content": "yəɜ",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"184": {
"content": "ɟː",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"186": {
"content": "t̪ː",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"187": {
"content": "yɛ5ʲ",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"188": {
"content": "u:",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"189": {
"content": "uaɜ",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"190": {
"content": "tɕʰ",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"191": {
"content": "cː",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"192": {
"content": "iɛɜ",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"193": {
"content": "aɪ",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"195": {
"content": "e:",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"196": {
"content": "kʲ",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"197": {
"content": "əl",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"198": {
"content": "dʰ",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"199": {
"content": "ʊɹ",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"200": {
"content": "i1",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"201": {
"content": "ou1",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"202": {
"content": "uəɜ",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"203": {
"content": "i.ː",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"207": {
"content": "uei2",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"208": {
"content": "onɡ2",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"209": {
"content": "s̪ː",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"210": {
"content": "ɪ^",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"211": {
"content": "tː",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"212": {
"content": "t[",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"214": {
"content": "æi",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"215": {
"content": "??",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"217": {
"content": "i.",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"218": {
"content": "tɕʲ",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"220": {
"content": "ɛʊ",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"226": {
"content": "uɜ",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"228": {
"content": "tʃʲ",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"229": {
"content": "iə",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"230": {
"content": "r̝",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"231": {
"content": "dʒ",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"232": {
"content": "cʰcʰ",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"233": {
"content": "iːː",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"235": {
"content": "œː",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"236": {
"content": "ʊː",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"238": {
"content": "y2",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"240": {
"content": "ɐɐ",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"241": {
"content": "əɜ",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"242": {
"content": "ɑuɜ",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"243": {
"content": "sx",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"244": {
"content": "ɑu2",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"245": {
"content": "ɛː",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"247": {
"content": "iou1",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"249": {
"content": "ɻ̩",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"250": {
"content": "r̝̊",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"251": {
"content": "ɑ1",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"252": {
"content": "tsh",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"253": {
"content": "ɔ̃",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"254": {
"content": "ɑːɹ",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"255": {
"content": "ẽː",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"256": {
"content": "ɑ:",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"257": {
"content": "u.",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"260": {
"content": "tsʰ",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"261": {
"content": "t^",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"262": {
"content": "ərɜ",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"263": {
"content": "aɜ",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"264": {
"content": "æː",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"265": {
"content": "ɔø",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"267": {
"content": "ts",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"268": {
"content": "tʰ",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"269": {
"content": "oe:",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"271": {
"content": "ɑɜ",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"272": {
"content": "yuɜ",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"273": {
"content": "əʊ",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"274": {
"content": "oː",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"275": {
"content": "ɪɹ",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"276": {
"content": "a2",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"277": {
"content": "ʂʲ",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"279": {
"content": "dzː",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"281": {
"content": "fʲ",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"282": {
"content": "ɡʲ",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"283": {
"content": "ja",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"285": {
"content": "vʲ",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"286": {
"content": "r.",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"287": {
"content": "ũ",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"288": {
"content": "nʲʲ",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"289": {
"content": "ɑ̃",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"290": {
"content": "a5",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"291": {
"content": "aː",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"293": {
"content": "i.1",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"294": {
"content": "yɛ2",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"296": {
"content": "ĩ",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"298": {
"content": "əɨ",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"299": {
"content": "ər5",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"301": {
"content": "oʊ",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"302": {
"content": "n̩",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"303": {
"content": "u1",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"304": {
"content": "uoɜ",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"305": {
"content": "i4",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"306": {
"content": "t^ː",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"308": {
"content": "dʑʲ",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"309": {
"content": "ə4",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"310": {
"content": "e̞",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"314": {
"content": "o2",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"315": {
"content": "uə5",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"317": {
"content": "øː",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"318": {
"content": "dʲʲ",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"320": {
"content": "ɑɨ",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"321": {
"content": "u5",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"322": {
"content": "ər1",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"324": {
"content": "lː",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"327": {
"content": "ɔɨ",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"328": {
"content": "yɛɜ",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"329": {
"content": "eiɜ",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"330": {
"content": "uː",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"331": {
"content": "i5",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"335": {
"content": "ui",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"336": {
"content": "yæ5",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"338": {
"content": "ʊə",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"339": {
"content": "tS",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"341": {
"content": "uɨ",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"342": {
"content": "i:",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"343": {
"content": "ɨu",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"344": {
"content": "uo1",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"345": {
"content": "dː",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"347": {
"content": "ʈʰ",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"349": {
"content": "pʲ",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"350": {
"content": "ju",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"351": {
"content": "dʒː",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"352": {
"content": "iɜ",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"353": {
"content": "dˤdˤ",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"354": {
"content": "ɐ̃ʊ̃",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"355": {
"content": "y1",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"356": {
"content": "i̪4",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"357": {
"content": "yæɜ",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"358": {
"content": "ɨː",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"368": {
"content": "i.2",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"369": {
"content": "uə2",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"370": {
"content": "ɪuː",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"371": {
"content": "ää",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"372": {
"content": "iː",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"373": {
"content": "uo2",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"374": {
"content": "o:",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"379": {
"content": "ua5",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"380": {
"content": "ie",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"381": {
"content": "ɯɯ",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"382": {
"content": "ʈʂʰ",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"383": {
"content": "ɛɪ",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"384": {
"content": "uai5",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"385": {
"content": "yu2",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"386": {
"content": "kʰː",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"387": {
"content": "bʰ",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"388": {
"content": "i2",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"389": {
"content": "ou2",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"391": {
"content": "ouɜ",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"396": {
"content": "uaiɜ",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"397": {
"content": "dʲ",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"399": {
"content": "ər2",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"400": {
"content": "yiɜ",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"401": {
"content": "d[",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"404": {
"content": "qː",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"405": {
"content": "ɜː",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"406": {
"content": "yə5",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"408": {
"content": "y5",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"409": {
"content": "ɔːɹ",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"410": {
"content": "a1",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"411": {
"content": "tsː",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"413": {
"content": "onɡɜ",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"414": {
"content": "ou̯",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"416": {
"content": "ee",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"417": {
"content": "r̩",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"419": {
"content": "d^",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"420": {
"content": "yu5",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"422": {
"content": "nʲ",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"424": {
"content": "ai",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"425": {
"content": "ə5",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"426": {
"content": "ʈʂ",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"430": {
"content": "e̞e̞",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"431": {
"content": "kʰ",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"432": {
"content": "ɑ5",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"434": {
"content": "uei5",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"435": {
"content": "u.ː",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"436": {
"content": "ə2",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"438": {
"content": "iɑ5",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"439": {
"content": "l̩",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"442": {
"content": "ts.",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"443": {
"content": "u\"",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"444": {
"content": "iou5",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"446": {
"content": "[PAD]",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"447": {
"content": "[UNK]",
"lstrip": true,
"normalized": false,
"rstrip": true,
"single_word": false,
"special": false
},
"448": {
"content": "<s>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
},
"449": {
"content": "</s>",
"lstrip": false,
"normalized": false,
"rstrip": false,
"single_word": false,
"special": true
}
},
"bos_token": "<s>",
"clean_up_tokenization_spaces": true,
"do_lower_case": false,
"eos_token": "</s>",
"model_max_length": 1000000000000000019884624838656,
"pad_token": "[PAD]",
"replace_word_delimiter_char": " ",
"target_lang": null,
"tokenizer_class": "Wav2Vec2CTCTokenizer",
"unk_token": "[UNK]",
"word_delimiter_token": "|"
}