typeof committed on
Commit
62fd940
1 Parent(s): ae303c9
Files changed (1) hide show
  1. tokenizer.json +1 -76
tokenizer.json CHANGED
@@ -59,81 +59,6 @@
59
  "pre_tokenizer": {
60
  "type": "BertPreTokenizer"
61
  },
62
- "post_processor": {
63
- "type": "TemplateProcessing",
64
- "single": [
65
- {
66
- "SpecialToken": {
67
- "id": "[CLS]",
68
- "type_id": 0
69
- }
70
- },
71
- {
72
- "Sequence": {
73
- "id": "A",
74
- "type_id": 0
75
- }
76
- },
77
- {
78
- "SpecialToken": {
79
- "id": "[SEP]",
80
- "type_id": 0
81
- }
82
- }
83
- ],
84
- "pair": [
85
- {
86
- "SpecialToken": {
87
- "id": "[CLS]",
88
- "type_id": 0
89
- }
90
- },
91
- {
92
- "Sequence": {
93
- "id": "A",
94
- "type_id": 0
95
- }
96
- },
97
- {
98
- "SpecialToken": {
99
- "id": "[SEP]",
100
- "type_id": 0
101
- }
102
- },
103
- {
104
- "Sequence": {
105
- "id": "B",
106
- "type_id": 1
107
- }
108
- },
109
- {
110
- "SpecialToken": {
111
- "id": "[SEP]",
112
- "type_id": 1
113
- }
114
- }
115
- ],
116
- "special_tokens": {
117
- "[CLS]": {
118
- "id": "[CLS]",
119
- "ids": [
120
- 101
121
- ],
122
- "tokens": [
123
- "[CLS]"
124
- ]
125
- },
126
- "[SEP]": {
127
- "id": "[SEP]",
128
- "ids": [
129
- 102
130
- ],
131
- "tokens": [
132
- "[SEP]"
133
- ]
134
- }
135
- }
136
- },
137
  "decoder": {
138
  "type": "WordPiece",
139
  "prefix": "##",
@@ -146,7 +71,7 @@
146
  "max_input_chars_per_word": 100,
147
  "vocab": {
148
  "[PAD]": 0,
149
- "[unused0]": 1,
150
  "[unused1]": 2,
151
  "[unused2]": 3,
152
  "[unused3]": 4,
 
59
  "pre_tokenizer": {
60
  "type": "BertPreTokenizer"
61
  },
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
62
  "decoder": {
63
  "type": "WordPiece",
64
  "prefix": "##",
 
71
  "max_input_chars_per_word": 100,
72
  "vocab": {
73
  "[PAD]": 0,
74
+ "[EOS]": 1,
75
  "[unused1]": 2,
76
  "[unused2]": 3,
77
  "[unused3]": 4,