File size: 528 Bytes
e25f6c6
 
 
 
 
 
 
 
 
 
 
 
 
 
f1c406b
e25f6c6
 
 
 
a590c04
e25f6c6
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
{
  "add_prefix_space": false,
  "bos_token": "<s>",
  "cls_token": "<s>",
  "eos_token": "</s>",
  "errors": "replace",
  "mask_token": {
    "__type": "AddedToken",
    "content": "<mask>",
    "lstrip": true,
    "normalized": false,
    "rstrip": false,
    "single_word": false
  },
  "model_max_length": 1024,
  "name_or_path": "Tristan/olm-tokenizer",
  "pad_token": "<pad>",
  "sep_token": "</s>",
  "special_tokens_map_file": null,
  "tokenizer_class": "GPT2Tokenizer",
  "trim_offsets": true,
  "unk_token": "<unk>"
}