|
{ |
|
"added_tokens_decoder": { |
|
"0": { |
|
"content": "<pad>", |
|
"lstrip": true, |
|
"normalized": false, |
|
"rstrip": true, |
|
"single_word": false, |
|
"special": false |
|
}, |
|
"1": { |
|
"content": "<s>", |
|
"lstrip": true, |
|
"normalized": false, |
|
"rstrip": true, |
|
"single_word": false, |
|
"special": false |
|
}, |
|
"2": { |
|
"content": "</s>", |
|
"lstrip": true, |
|
"normalized": false, |
|
"rstrip": true, |
|
"single_word": false, |
|
"special": false |
|
}, |
|
"3": { |
|
"content": "<unk>", |
|
"lstrip": true, |
|
"normalized": false, |
|
"rstrip": true, |
|
"single_word": false, |
|
"special": false |
|
}, |
|
"7": { |
|
"content": "ph", |
|
"lstrip": true, |
|
"normalized": false, |
|
"rstrip": true, |
|
"single_word": false, |
|
"special": false |
|
}, |
|
"8": { |
|
"content": "jh", |
|
"lstrip": true, |
|
"normalized": false, |
|
"rstrip": true, |
|
"single_word": false, |
|
"special": false |
|
}, |
|
"9": { |
|
"content": "ch", |
|
"lstrip": true, |
|
"normalized": false, |
|
"rstrip": true, |
|
"single_word": false, |
|
"special": false |
|
}, |
|
"12": { |
|
"content": "rq", |
|
"lstrip": true, |
|
"normalized": false, |
|
"rstrip": true, |
|
"single_word": false, |
|
"special": false |
|
}, |
|
"13": { |
|
"content": "sx", |
|
"lstrip": true, |
|
"normalized": false, |
|
"rstrip": true, |
|
"single_word": false, |
|
"special": false |
|
}, |
|
"14": { |
|
"content": "lx", |
|
"lstrip": true, |
|
"normalized": false, |
|
"rstrip": true, |
|
"single_word": false, |
|
"special": false |
|
}, |
|
"16": { |
|
"content": "dxq", |
|
"lstrip": true, |
|
"normalized": false, |
|
"rstrip": true, |
|
"single_word": false, |
|
"special": false |
|
}, |
|
"17": { |
|
"content": "nj", |
|
"lstrip": true, |
|
"normalized": false, |
|
"rstrip": true, |
|
"single_word": false, |
|
"special": false |
|
}, |
|
"18": { |
|
"content": "ei", |
|
"lstrip": true, |
|
"normalized": false, |
|
"rstrip": true, |
|
"single_word": false, |
|
"special": false |
|
}, |
|
"20": { |
|
"content": "tx", |
|
"lstrip": true, |
|
"normalized": false, |
|
"rstrip": true, |
|
"single_word": false, |
|
"special": false |
|
}, |
|
"21": { |
|
"content": "gh", |
|
"lstrip": true, |
|
"normalized": false, |
|
"rstrip": true, |
|
"single_word": false, |
|
"special": false |
|
}, |
|
"22": { |
|
"content": "txh", |
|
"lstrip": true, |
|
"normalized": false, |
|
"rstrip": true, |
|
"single_word": false, |
|
"special": false |
|
}, |
|
"24": { |
|
"content": "th", |
|
"lstrip": true, |
|
"normalized": false, |
|
"rstrip": true, |
|
"single_word": false, |
|
"special": false |
|
}, |
|
"26": { |
|
"content": "mq", |
|
"lstrip": true, |
|
"normalized": false, |
|
"rstrip": true, |
|
"single_word": false, |
|
"special": false |
|
}, |
|
"27": { |
|
"content": "uu", |
|
"lstrip": true, |
|
"normalized": false, |
|
"rstrip": true, |
|
"single_word": false, |
|
"special": false |
|
}, |
|
"28": { |
|
"content": "kh", |
|
"lstrip": true, |
|
"normalized": false, |
|
"rstrip": true, |
|
"single_word": false, |
|
"special": false |
|
}, |
|
"33": { |
|
"content": "dh", |
|
"lstrip": true, |
|
"normalized": false, |
|
"rstrip": true, |
|
"single_word": false, |
|
"special": false |
|
}, |
|
"34": { |
|
"content": "sh", |
|
"lstrip": true, |
|
"normalized": false, |
|
"rstrip": true, |
|
"single_word": false, |
|
"special": false |
|
}, |
|
"35": { |
|
"content": "ee", |
|
"lstrip": true, |
|
"normalized": false, |
|
"rstrip": true, |
|
"single_word": false, |
|
"special": false |
|
}, |
|
"36": { |
|
"content": "ii", |
|
"lstrip": true, |
|
"normalized": false, |
|
"rstrip": true, |
|
"single_word": false, |
|
"special": false |
|
}, |
|
"37": { |
|
"content": "dxhq", |
|
"lstrip": true, |
|
"normalized": false, |
|
"rstrip": true, |
|
"single_word": false, |
|
"special": false |
|
}, |
|
"38": { |
|
"content": "ax", |
|
"lstrip": true, |
|
"normalized": false, |
|
"rstrip": true, |
|
"single_word": false, |
|
"special": false |
|
}, |
|
"39": { |
|
"content": "aa", |
|
"lstrip": true, |
|
"normalized": false, |
|
"rstrip": true, |
|
"single_word": false, |
|
"special": false |
|
}, |
|
"40": { |
|
"content": "bh", |
|
"lstrip": true, |
|
"normalized": false, |
|
"rstrip": true, |
|
"single_word": false, |
|
"special": false |
|
}, |
|
"44": { |
|
"content": "dx", |
|
"lstrip": true, |
|
"normalized": false, |
|
"rstrip": true, |
|
"single_word": false, |
|
"special": false |
|
}, |
|
"45": { |
|
"content": "ou", |
|
"lstrip": true, |
|
"normalized": false, |
|
"rstrip": true, |
|
"single_word": false, |
|
"special": false |
|
}, |
|
"47": { |
|
"content": "gq", |
|
"lstrip": true, |
|
"normalized": false, |
|
"rstrip": true, |
|
"single_word": false, |
|
"special": false |
|
}, |
|
"49": { |
|
"content": "khq", |
|
"lstrip": true, |
|
"normalized": false, |
|
"rstrip": true, |
|
"single_word": false, |
|
"special": false |
|
}, |
|
"50": { |
|
"content": "dxh", |
|
"lstrip": true, |
|
"normalized": false, |
|
"rstrip": true, |
|
"single_word": false, |
|
"special": false |
|
}, |
|
"51": { |
|
"content": "ae", |
|
"lstrip": true, |
|
"normalized": false, |
|
"rstrip": true, |
|
"single_word": false, |
|
"special": false |
|
}, |
|
"52": { |
|
"content": "kq", |
|
"lstrip": true, |
|
"normalized": false, |
|
"rstrip": true, |
|
"single_word": false, |
|
"special": false |
|
}, |
|
"53": { |
|
"content": "nx", |
|
"lstrip": true, |
|
"normalized": false, |
|
"rstrip": true, |
|
"single_word": false, |
|
"special": false |
|
}, |
|
"54": { |
|
"content": "ng", |
|
"lstrip": true, |
|
"normalized": false, |
|
"rstrip": true, |
|
"single_word": false, |
|
"special": false |
|
}, |
|
"60": { |
|
"content": "hq", |
|
"lstrip": true, |
|
"normalized": false, |
|
"rstrip": true, |
|
"single_word": false, |
|
"special": false |
|
} |
|
}, |
|
"bos_token": "<s>", |
|
"clean_up_tokenization_spaces": true, |
|
"do_lower_case": false, |
|
"eos_token": "</s>", |
|
"model_max_length": 1000000000000000019884624838656, |
|
"pad_token": "<pad>", |
|
"processor_class": "Wav2Vec2Processor", |
|
"replace_word_delimiter_char": " ", |
|
"target_lang": null, |
|
"tokenizer_class": "Wav2Vec2CTCTokenizer", |
|
"unk_token": "<unk>", |
|
"word_delimiter_token": "|" |
|
} |
|
|