File size: 805 Bytes
a7345ac |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 |
{
  "do_lower_case": true,
  "remove_space": true,
  "keep_accents": true,
  "bos_token": "[CLS]",
  "eos_token": "[SEP]",
  "unk_token": "<unk>",
  "sep_token": "[SEP]",
  "pad_token": "<pad>",
  "cls_token": "[CLS]",
  "mask_token": {
    "content": "[MASK]",
    "single_word": false,
    "lstrip": true,
    "rstrip": false,
    "normalized": false,
    "__type": "AddedToken"
  },
  "tokenize_chinese_chars": false,
  "tokenizer_class": "BertJapaneseTokenizer",
  "word_tokenizer_type": "mecab",
  "subword_tokenizer_type": "sentencepiece",
  "mecab_kwargs": {
    "mecab_dic": "unidic_lite"
  },
  "auto_map": {
    "AutoTokenizer": [
      "distilbert_japanese_tokenizer.DistilBertJapaneseTokenizer",
      null
    ]
  }
}