maltehb committed on
Commit
3d6951e
1 Parent(s): 4459c08
Files changed (5) hide show
  1. config.json +1 -1
  2. special_tokens_map.json +1 -15
  3. tokenizer.json +0 -0
  4. tokenizer_config.json +1 -14
  5. vocab.json +0 -0
config.json CHANGED
@@ -24,4 +24,4 @@
24
  "type_vocab_size": 1,
25
  "use_cache": true,
26
  "vocab_size": 50265
27
- }
 
24
  "type_vocab_size": 1,
25
  "use_cache": true,
26
  "vocab_size": 50265
27
+ }
special_tokens_map.json CHANGED
@@ -1,15 +1 @@
1
- {
2
- "bos_token": "<s>",
3
- "eos_token": "</s>",
4
- "unk_token": "<unk>",
5
- "sep_token": "</s>",
6
- "pad_token": "<pad>",
7
- "cls_token": "<s>",
8
- "mask_token": {
9
- "content": "<mask>",
10
- "single_word": false,
11
- "lstrip": true,
12
- "rstrip": false,
13
- "normalized": false
14
- }
15
- }
 
1
+ {"bos_token": "<s>", "eos_token": "</s>", "unk_token": "<unk>", "sep_token": "</s>", "pad_token": "<pad>", "cls_token": "<s>", "mask_token": {"content": "<mask>", "single_word": false, "lstrip": true, "rstrip": false, "normalized": false}}
 
 
 
 
 
 
 
 
 
 
 
 
 
 
tokenizer.json CHANGED
The diff for this file is too large to render. See raw diff
 
tokenizer_config.json CHANGED
@@ -1,14 +1 @@
1
- {
2
- "unk_token": "<unk>",
3
- "bos_token": "<s>",
4
- "eos_token": "</s>",
5
- "add_prefix_space": false,
6
- "errors": "replace",
7
- "sep_token": "</s>",
8
- "cls_token": "<s>",
9
- "pad_token": "<pad>",
10
- "mask_token": "<mask>",
11
- "special_tokens_map_file": null,
12
- "name_or_path": "./",
13
- "tokenizer_class": "RobertaTokenizer"
14
- }
 
1
+ {"unk_token": "<unk>", "bos_token": "<s>", "eos_token": "</s>", "add_prefix_space": false, "errors": "replace", "sep_token": "</s>", "cls_token": "<s>", "pad_token": "<pad>", "mask_token": "<mask>", "special_tokens_map_file": null, "name_or_path": "./", "tokenizer_class": "RobertaTokenizer"}
 
 
 
 
 
 
 
 
 
 
 
 
 
vocab.json CHANGED
The diff for this file is too large to render. See raw diff