{
  "additional_special_tokens": [
    "Cj",
    "V",
    "Num",
    "Pron",
    "N",
    "A",
    "Adv",
    "Other",
    "Interj",
    "Pp",
    ""
  ],
  "clean_up_tokenization_spaces": true,
  "cls_token": "",
  "do_lower_case": true,
  "mask_token": "[MASK]",
  "model_input_names": [
    "input_ids",
    "attention_mask",
    "decoder_input_ids"
  ],
  "model_max_length": 1024,
  "pad_token": "",
  "sep_token": "",
  "strip_accents": null,
  "tokenize_chinese_chars": true,
  "tokenizer_class": "BertTokenizer",
  "unk_token": ""
}