dummy-tokenizer-fast-with-model-config / special_tokens_map.json
SaulLu's picture
add tokenizer example with model config
8a27784
{
"bos_token": {
"content": "[CLS]",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": true
},
"eos_token": {
"content": "[SEP]",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": true
},
"unk_token": {
"content": "[UNK]",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": true
},
"sep_token": {
"content": "[SEP]",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": true
},
"pad_token": {
"content": "[PAD]",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": true
},
"cls_token": {
"content": "[CLS]",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": true
},
"mask_token": {
"content": "[MASK]",
"single_word": false,
"lstrip": true,
"rstrip": false,
"normalized": true
}
}