PEFT
Safetensors
mistral
trl
sft
Generated from Trainer
HachiML committed on
Commit
71908cb
1 Parent(s): 0054e50

Upload tokenizer

Browse files
Files changed (2) hide show
  1. tokenizer.json +6 -16
  2. tokenizer_config.json +1 -0
tokenizer.json CHANGED
@@ -6943,23 +6943,13 @@
6943
  "special": true
6944
  }
6945
  ],
6946
- "normalizer": {
6947
- "type": "Sequence",
6948
- "normalizers": [
6949
- {
6950
- "type": "Prepend",
6951
- "prepend": "▁"
6952
- },
6953
- {
6954
- "type": "Replace",
6955
- "pattern": {
6956
- "String": " "
6957
- },
6958
- "content": "▁"
6959
- }
6960
- ]
6961
  },
6962
- "pre_tokenizer": null,
6963
  "post_processor": {
6964
  "type": "TemplateProcessing",
6965
  "single": [
 
6943
  "special": true
6944
  }
6945
  ],
6946
+ "normalizer": null,
6947
+ "pre_tokenizer": {
6948
+ "type": "Metaspace",
6949
+ "replacement": "▁",
6950
+ "prepend_scheme": "first",
6951
+ "split": false
 
 
 
 
 
 
 
 
 
6952
  },
 
6953
  "post_processor": {
6954
  "type": "TemplateProcessing",
6955
  "single": [
tokenizer_config.json CHANGED
@@ -6173,6 +6173,7 @@
6173
  }
6174
  },
6175
  "bos_token": "<s>",
 
6176
  "clean_up_tokenization_spaces": false,
6177
  "eos_token": "</s>",
6178
  "legacy": false,
 
6173
  }
6174
  },
6175
  "bos_token": "<s>",
6176
+ "chat_template": "{{ bos_token }}{% for message in messages %}{% if (message['role'] == 'user') != (loop.index0 % 2 == 0) %}{{ raise_exception('Conversation roles must alternate user/assistant/user/assistant/...') }}{% endif %}{% if message['role'] == 'user' %}{{ '[INST] ' + message['content'] + ' [/INST]' }}{% elif message['role'] == 'assistant' %}{{ message['content'] + eos_token}}{% else %}{{ raise_exception('Only user and assistant roles are supported!') }}{% endif %}{% endfor %}",
6177
  "clean_up_tokenization_spaces": false,
6178
  "eos_token": "</s>",
6179
  "legacy": false,