Update tokenizer_config.json (#7)
Browse files- Update tokenizer_config.json (4493e8fbb85953bd4e6d8b62a5c47cad99ebc2d9)
- tokenizer_config.json +12 -1
tokenizer_config.json
CHANGED
@@ -4753,11 +4753,22 @@
|
|
4753 |
"rstrip": false,
|
4754 |
"single_word": false,
|
4755 |
"special": true
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
4756 |
}
|
4757 |
},
|
4758 |
"bos_token": "<|begin▁of▁sentence|>",
|
4759 |
"clean_up_tokenization_spaces": false,
|
4760 |
-
"chat_template":
|
|
|
|
|
|
|
4761 |
"eos_token": "<|end▁of▁sentence|>",
|
4762 |
"model_max_length": 16384,
|
4763 |
"pad_token": "<|▁pad▁|>",
|
|
|
4753 |
"rstrip": false,
|
4754 |
"single_word": false,
|
4755 |
"special": true
|
4756 |
+
},
|
4757 |
+
"102400": {
|
4758 |
+
"content": "<image_placeholder>",
|
4759 |
+
"lstrip": false,
|
4760 |
+
"normalized": false,
|
4761 |
+
"rstrip": false,
|
4762 |
+
"single_word": false,
|
4763 |
+
"special": true
|
4764 |
}
|
4765 |
},
|
4766 |
"bos_token": "<|begin▁of▁sentence|>",
|
4767 |
"clean_up_tokenization_spaces": false,
|
4768 |
+
"chat_template": {
|
4769 |
+
"default": "{% if messages[0]['role'] | lower == 'system' %}{% set loop_messages = messages[1:] %}{% set system_message = messages[0]['content'] %}{% else %}{% set loop_messages = messages %}{% set system_message = 'You are a helpful language and vision assistant. You are able to understand the visual content that the user provides, and assist the user with a variety of tasks using natural language.' %}{% endif %}{{ bos_token + system_message }}{% for message in loop_messages %}{{ '\\n\\n' + message['role'] + ': ' + message['content'] | trim }}{% endfor %}{% if add_generation_prompt %}{{ '\\n\\n' + 'Assistant:' }}{% endif %}",
|
4770 |
+
"text_to_image": "{{ '<|begin▁of▁sentence|>' }}{% for message in messages %}{{ message['role'] + ': ' + message['content'] | trim + '\\n\\n' }}{% endfor %}{% if add_generation_prompt %}{{ 'Assistant:<begin_of_image>' }}{% endif %}"
|
4771 |
+
},
|
4772 |
"eos_token": "<|end▁of▁sentence|>",
|
4773 |
"model_max_length": 16384,
|
4774 |
"pad_token": "<|▁pad▁|>",
|