File size: 805 Bytes
a7345ac
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
{
    "do_lower_case":true,
    "remove_space":true,
    "keep_accents":true,
    "bos_token": "[CLS]",
    "eos_token": "[SEP]",
    "unk_token": "<unk>",
    "sep_token": "[SEP]",
    "pad_token": "<pad>",
    "cls_token": "[CLS]",
    "mask_token": {
        "content": "[MASK]",
        "single_word": false,
        "lstrip": true,
        "rstrip": false,
        "normalized": false,
        "__type": "AddedToken"
    },
    "tokenize_chinese_chars":false,
    "tokenizer_class": "BertJapaneseTokenizer",
    "word_tokenizer_type": "mecab",
    "subword_tokenizer_type": "sentencepiece",
    "mecab_kwargs": {
        "mecab_dic": "unidic_lite"
    },
    "auto_map": {
        "AutoTokenizer": [
            "distilbert_japanese_tokenizer.DistilBertJapaneseTokenizer",
            null
        ]
    }
}