File size: 467 Bytes
f472ef8
 
 
 
 
 
 
 
 
 
9ff1d40
f472ef8
9ff1d40
f472ef8
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
{
    "bos_token": "[CLS]",
    "eos_token": "[SEP]",
    "unk_token": "<unk>",
    "sep_token": "[SEP]",
    "cls_token": "[CLS]",
    "pad_token": "<pad>",
    "mask_token": {
        "content": "[MASK]",
        "single_word": false,
        "lstrip": true,
        "rstrip": false,
        "normalized": true,
        "__type": "AddedToken"
    },
    "model_max_length": 512,
    "special_tokens_map_file": null,
    "name_or_path": "SaulLu/bengali-tokenizer"
}