|
{ |
|
"add_bos_token": false, |
|
"add_eos_token": false, |
|
"add_prefix_space": false, |
|
"added_tokens_decoder": { |
|
"151643": { |
|
"content": "<|endoftext|>", |
|
"lstrip": false, |
|
"normalized": false, |
|
"rstrip": false, |
|
"single_word": false, |
|
"special": true |
|
}, |
|
"151644": { |
|
"content": "<|im_start|>", |
|
"lstrip": false, |
|
"normalized": false, |
|
"rstrip": false, |
|
"single_word": false, |
|
"special": true |
|
}, |
|
"151645": { |
|
"content": "<|im_end|>", |
|
"lstrip": false, |
|
"normalized": false, |
|
"rstrip": false, |
|
"single_word": false, |
|
"special": true |
|
}, |
|
"151646": { |
|
"content": "<|object_ref_start|>", |
|
"lstrip": false, |
|
"normalized": false, |
|
"rstrip": false, |
|
"single_word": false, |
|
"special": true |
|
}, |
|
"151647": { |
|
"content": "<|object_ref_end|>", |
|
"lstrip": false, |
|
"normalized": false, |
|
"rstrip": false, |
|
"single_word": false, |
|
"special": true |
|
}, |
|
"151648": { |
|
"content": "<|box_start|>", |
|
"lstrip": false, |
|
"normalized": false, |
|
"rstrip": false, |
|
"single_word": false, |
|
"special": true |
|
}, |
|
"151649": { |
|
"content": "<|box_end|>", |
|
"lstrip": false, |
|
"normalized": false, |
|
"rstrip": false, |
|
"single_word": false, |
|
"special": true |
|
}, |
|
"151650": { |
|
"content": "<|quad_start|>", |
|
"lstrip": false, |
|
"normalized": false, |
|
"rstrip": false, |
|
"single_word": false, |
|
"special": true |
|
}, |
|
"151651": { |
|
"content": "<|quad_end|>", |
|
"lstrip": false, |
|
"normalized": false, |
|
"rstrip": false, |
|
"single_word": false, |
|
"special": true |
|
}, |
|
"151652": { |
|
"content": "<|vision_start|>", |
|
"lstrip": false, |
|
"normalized": false, |
|
"rstrip": false, |
|
"single_word": false, |
|
"special": true |
|
}, |
|
"151653": { |
|
"content": "<|vision_end|>", |
|
"lstrip": false, |
|
"normalized": false, |
|
"rstrip": false, |
|
"single_word": false, |
|
"special": true |
|
}, |
|
"151654": { |
|
"content": "<|vision_pad|>", |
|
"lstrip": false, |
|
"normalized": false, |
|
"rstrip": false, |
|
"single_word": false, |
|
"special": true |
|
}, |
|
"151655": { |
|
"content": "<|image_pad|>", |
|
"lstrip": false, |
|
"normalized": false, |
|
"rstrip": false, |
|
"single_word": false, |
|
"special": true |
|
}, |
|
"151656": { |
|
"content": "<|video_pad|>", |
|
"lstrip": false, |
|
"normalized": false, |
|
"rstrip": false, |
|
"single_word": false, |
|
"special": true |
|
}, |
|
"151657": { |
|
"content": "<tool_call>", |
|
"lstrip": false, |
|
"normalized": false, |
|
"rstrip": false, |
|
"single_word": false, |
|
"special": false |
|
}, |
|
"151658": { |
|
"content": "</tool_call>", |
|
"lstrip": false, |
|
"normalized": false, |
|
"rstrip": false, |
|
"single_word": false, |
|
"special": false |
|
}, |
|
"151659": { |
|
"content": "<|fim_prefix|>", |
|
"lstrip": false, |
|
"normalized": false, |
|
"rstrip": false, |
|
"single_word": false, |
|
"special": false |
|
}, |
|
"151660": { |
|
"content": "<|fim_middle|>", |
|
"lstrip": false, |
|
"normalized": false, |
|
"rstrip": false, |
|
"single_word": false, |
|
"special": false |
|
}, |
|
"151661": { |
|
"content": "<|fim_suffix|>", |
|
"lstrip": false, |
|
"normalized": false, |
|
"rstrip": false, |
|
"single_word": false, |
|
"special": false |
|
}, |
|
"151662": { |
|
"content": "<|fim_pad|>", |
|
"lstrip": false, |
|
"normalized": false, |
|
"rstrip": false, |
|
"single_word": false, |
|
"special": false |
|
}, |
|
"151663": { |
|
"content": "<|repo_name|>", |
|
"lstrip": false, |
|
"normalized": false, |
|
"rstrip": false, |
|
"single_word": false, |
|
"special": false |
|
}, |
|
"151664": { |
|
"content": "<|file_sep|>", |
|
"lstrip": false, |
|
"normalized": false, |
|
"rstrip": false, |
|
"single_word": false, |
|
"special": false |
|
}, |
|
"151665": { |
|
"content": "<img>", |
|
"lstrip": false, |
|
"normalized": false, |
|
"rstrip": false, |
|
"single_word": false, |
|
"special": true |
|
}, |
|
"151666": { |
|
"content": "</img>", |
|
"lstrip": false, |
|
"normalized": false, |
|
"rstrip": false, |
|
"single_word": false, |
|
"special": true |
|
}, |
|
"151667": { |
|
"content": "<IMG_CONTEXT>", |
|
"lstrip": false, |
|
"normalized": false, |
|
"rstrip": false, |
|
"single_word": false, |
|
"special": true |
|
}, |
|
"151668": { |
|
"content": "<quad>", |
|
"lstrip": false, |
|
"normalized": false, |
|
"rstrip": false, |
|
"single_word": false, |
|
"special": true |
|
}, |
|
"151669": { |
|
"content": "</quad>", |
|
"lstrip": false, |
|
"normalized": false, |
|
"rstrip": false, |
|
"single_word": false, |
|
"special": true |
|
}, |
|
"151670": { |
|
"content": "<ref>", |
|
"lstrip": false, |
|
"normalized": false, |
|
"rstrip": false, |
|
"single_word": false, |
|
"special": true |
|
}, |
|
"151671": { |
|
"content": "</ref>", |
|
"lstrip": false, |
|
"normalized": false, |
|
"rstrip": false, |
|
"single_word": false, |
|
"special": true |
|
}, |
|
"151672": { |
|
"content": "<box>", |
|
"lstrip": false, |
|
"normalized": false, |
|
"rstrip": false, |
|
"single_word": false, |
|
"special": true |
|
}, |
|
"151673": { |
|
"content": "</box>", |
|
"lstrip": false, |
|
"normalized": false, |
|
"rstrip": false, |
|
"single_word": false, |
|
"special": true |
|
} |
|
}, |
|
"additional_special_tokens": [ |
|
"<|im_start|>", |
|
"<|im_end|>", |
|
"<|object_ref_start|>", |
|
"<|object_ref_end|>", |
|
"<|box_start|>", |
|
"<|box_end|>", |
|
"<|quad_start|>", |
|
"<|quad_end|>", |
|
"<|vision_start|>", |
|
"<|vision_end|>", |
|
"<|vision_pad|>", |
|
"<|image_pad|>", |
|
"<|video_pad|>", |
|
"<img>", |
|
"</img>", |
|
"<IMG_CONTEXT>", |
|
"<quad>", |
|
"</quad>", |
|
"<ref>", |
|
"</ref>", |
|
"<box>", |
|
"</box>" |
|
], |
|
"bos_token": null, |
|
"chat_template": "{% set system_message = 'You are a helpful assistant.' %}{% if messages[0]['role'] == 'system' %}{% set loop_messages = messages[1:] %}{% set system_message = messages[0]['content'] %}{% else %}{% set loop_messages = messages %}{% endif %}{{ '<|im_start|>system\\n' + system_message + '<|im_end|>\\n' }}{% for message in loop_messages %}{% set content = message['content'] %}{% if message['role'] == 'user' %}{% if content is iterable and content is sequence and content[0]['type'] == 'image' %}{{ '<|im_start|>user\\n<image>\\n' + content[1]['text'] + '<|im_end|>\\n<|im_start|>assistant\\n' }}{% else %}{{ '<|im_start|>user\\n' + content + '<|im_end|>\\n<|im_start|>assistant\\n' }}{% endif %}{% elif message['role'] == 'assistant' %}{% if content is iterable and content is sequence %}{% for part in content %}{% if part['type'] == 'text' %}{{ part['text'] }}{% endif %}{% endfor %}{{ '<|im_end|>\\n' }}{% else %}{{ content + '<|im_end|>\\n' }}{% endif %}{% endif %}{% endfor %}", |
|
"clean_up_tokenization_spaces": false, |
|
"eos_token": "<|im_end|>", |
|
"errors": "replace", |
|
"extra_special_tokens": {}, |
|
"model_max_length": 16384, |
|
"pad_token": "<|endoftext|>", |
|
"processor_class": "InternVL2_5Processor", |
|
"split_special_tokens": false, |
|
"tokenizer_class": "Qwen2Tokenizer", |
|
"unk_token": null |
|
} |
|
|