{
  "add_prefix_space": true,
  "added_tokens_decoder": {
    "0": {
      "content": "<s>",
      "lstrip": false,
      "normalized": true,
      "rstrip": false,
      "single_word": false,
      "special": true
    },
    "1": {
      "content": "<pad>",
      "lstrip": false,
      "normalized": true,
      "rstrip": false,
      "single_word": false,
      "special": true
    },
    "2": {
      "content": "</s>",
      "lstrip": false,
      "normalized": true,
      "rstrip": false,
      "single_word": false,
      "special": true
    },
    "3": {
      "content": "<unk>",
      "lstrip": false,
      "normalized": true,
      "rstrip": false,
      "single_word": false,
      "special": true
    },
    "4": {
      "content": "<mask>",
      "lstrip": true,
      "normalized": true,
      "rstrip": false,
      "single_word": false,
      "special": true
    }
  },
  "bos_token": "<s>",
  "clean_up_tokenization_spaces": true,
  "cls_token": "<s>",
  "eos_token": "</s>",
  "errors": "replace",
  "mask_token": "<mask>",
  "max_len": 512,
  "model_max_length": 512,
  "pad_token": "<pad>",
  "sep_token": "</s>",
  "tokenizer_class": "RobertaTokenizer",
  "trim_offsets": true,
  "unk_token": "<unk>"
}
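
The JSON above is a tokenizer_config.json for a RobertaTokenizer: it declares the special tokens (<s>, </s>, <pad>, <unk>, <mask>), enables add_prefix_space, and caps sequences at model_max_length 512. A minimal usage sketch follows, assuming the file sits in a local directory together with the matching vocab.json and merges.txt that a RoBERTa BPE tokenizer needs; the "./tokenizer_dir" path is a placeholder, not something taken from this repository.

    # Minimal sketch, assuming ./tokenizer_dir holds this tokenizer_config.json
    # plus vocab.json and merges.txt (placeholder path, not from this file).
    from transformers import AutoTokenizer

    tokenizer = AutoTokenizer.from_pretrained("./tokenizer_dir")

    # model_max_length=512 from the config caps sequences when truncation is on.
    enc = tokenizer(
        "Hello world",
        truncation=True,
        max_length=tokenizer.model_max_length,
    )

    # bos/cls is <s> and eos/sep is </s>, so the encoded ids are wrapped
    # in those special tokens; <pad> (id 1) is used for batch padding.
    print(tokenizer.convert_ids_to_tokens(enc["input_ids"]))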