File size: 471 Bytes
df95ac1
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
{
    "bos_token": "[CLS]",
    "eos_token": "[SEP]",
    "unk_token": "<unk>",
    "sep_token": "[SEP]",
    "cls_token": "[CLS]",
    "pad_token": "<pad>",
    "mask_token": {
        "content": "[MASK]",
        "single_word": false,
        "lstrip": true,
        "rstrip": false,
        "normalized": false,
        "__type": "AddedToken"
    },
    "model_max_length": 512,
    "special_tokens_map_file": null,
    "name_or_path": "SaulLu/bengali-tokenizer-v2"
}