mahnerak committed on
Commit
55bfe5b
·
verified ·
1 Parent(s): 697f758

Upload tokenizer.json

Browse files
Files changed (1) hide show
  1. tokenizer.json +8 -4
tokenizer.json CHANGED
@@ -214,10 +214,14 @@
214
  ]
215
  },
216
  "post_processor": {
217
- "type": "ByteLevel",
218
- "add_prefix_space": true,
219
- "trim_offsets": false,
220
- "use_regex": true
 
 
 
 
221
  },
222
  "decoder": {
223
  "type": "ByteLevel",
 
214
  ]
215
  },
216
  "post_processor": {
217
+ "type": "TemplateProcessing",
218
+ "single": [
219
+ { "SpecialToken": { "id": "<|begin_of_text|>", "type_id": 0 } },
220
+ { "Sequence": { "id": "A", "type_id": 0 } }
221
+ ],
222
+ "special_tokens": {
223
+ "<|begin_of_text|>": { "id": "<|begin_of_text|>", "ids": [100256], "tokens": ["<|begin_of_text|>"] }
224
+ }
225
  },
226
  "decoder": {
227
  "type": "ByteLevel",