ZhiyuanChen committed on
Commit
bb040c5
·
verified ·
1 Parent(s): 241bdef

Upload tokenizer

Browse files
Files changed (2) hide show
  1. special_tokens_map.json +3 -0
  2. tokenizer_config.json +11 -0
special_tokens_map.json CHANGED
@@ -1,4 +1,7 @@
1
  {
 
 
 
2
  "bos_token": "<cls>",
3
  "cls_token": "<cls>",
4
  "eos_token": "<eos>",
 
1
  {
2
+ "additional_special_tokens": [
3
+ "<null>"
4
+ ],
5
  "bos_token": "<cls>",
6
  "cls_token": "<cls>",
7
  "eos_token": "<eos>",
tokenizer_config.json CHANGED
@@ -39,8 +39,19 @@
39
  "rstrip": false,
40
  "single_word": false,
41
  "special": true
 
 
 
 
 
 
 
 
42
  }
43
  },
 
 
 
44
  "bos_token": "<cls>",
45
  "clean_up_tokenization_spaces": true,
46
  "cls_token": "<cls>",
 
39
  "rstrip": false,
40
  "single_word": false,
41
  "special": true
42
+ },
43
+ "5": {
44
+ "content": "<null>",
45
+ "lstrip": false,
46
+ "normalized": false,
47
+ "rstrip": false,
48
+ "single_word": false,
49
+ "special": true
50
  }
51
  },
52
+ "additional_special_tokens": [
53
+ "<null>"
54
+ ],
55
  "bos_token": "<cls>",
56
  "clean_up_tokenization_spaces": true,
57
  "cls_token": "<cls>",