{
  "added_tokens_decoder": {
    "59246": {
      "content": "<|endoftext|>",
      "lstrip": false,
      "normalized": false,
      "rstrip": false,
      "single_word": false,
      "special": true
    },
    "59247": {
      "content": "[MASK]",
      "lstrip": false,
      "normalized": false,
      "rstrip": false,
      "single_word": false,
      "special": true
    },
    "59248": {
      "content": "[gMASK]",
      "lstrip": false,
      "normalized": false,
      "rstrip": false,
      "single_word": false,
      "special": true
    },
    "59249": {
      "content": "[sMASK]",
      "lstrip": false,
      "normalized": false,
      "rstrip": false,
      "single_word": false,
      "special": true
    },
    "59250": {
      "content": "<sop>",
      "lstrip": false,
      "normalized": false,
      "rstrip": false,
      "single_word": false,
      "special": true
    },
    "59251": {
      "content": "<eop>",
      "lstrip": false,
      "normalized": false,
      "rstrip": false,
      "single_word": false,
      "special": true
    },
    "59252": {
      "content": "<|system|>",
      "lstrip": false,
      "normalized": false,
      "rstrip": false,
      "single_word": false,
      "special": true
    },
    "59253": {
      "content": "<|user|>",
      "lstrip": false,
      "normalized": false,
      "rstrip": false,
      "single_word": false,
      "special": true
    },
    "59254": {
      "content": "<|assistant|>",
      "lstrip": false,
      "normalized": false,
      "rstrip": false,
      "single_word": false,
      "special": true
    },
    "59255": {
      "content": "<|observation|>",
      "lstrip": false,
      "normalized": false,
      "rstrip": false,
      "single_word": false,
      "special": true
    },
    "59256": {
      "content": "<|begin_of_image|>",
      "lstrip": false,
      "normalized": false,
      "rstrip": false,
      "single_word": false,
      "special": true
    },
    "59257": {
      "content": "<|end_of_image|>",
      "lstrip": false,
      "normalized": false,
      "rstrip": false,
      "single_word": false,
      "special": true
    },
    "59258": {
      "content": "<|begin_of_video|>",
      "lstrip": false,
      "normalized": false,
      "rstrip": false,
      "single_word": false,
      "special": true
    },
    "59259": {
      "content": "<|end_of_video|>",
      "lstrip": false,
      "normalized": false,
      "rstrip": false,
      "single_word": false,
      "special": true
    }
  },
  "additional_special_tokens": [
    "<|endoftext|>",
    "[MASK]",
    "[gMASK]",
    "[sMASK]",
    "<sop>",
    "<eop>",
    "<|system|>",
    "<|user|>",
    "<|assistant|>",
    "<|observation|>",
    "<|begin_of_image|>",
    "<|end_of_image|>",
    "<|begin_of_video|>",
    "<|end_of_video|>"
  ],
  "chat_template": "{% for item in messages %}{% if item['role'] == 'system' %}<|system|>\n{{ item['content'] }}{% elif item['role'] == 'user' %}<|user|>\n{{ item['content'] }}{% elif item['role'] == 'assistant' %}<|assistant|>\n{{ item['content'] }}{% endif %}{% endfor %}{% if add_generation_prompt %}<|assistant|>\n{% endif %}",
  "clean_up_tokenization_spaces": false,
  "do_lower_case": false,
  "eos_token": "<|endoftext|>",
  "extra_special_tokens": {},
  "image_size": 448,
  "model_input_names": [
    "input_ids",
    "attention_mask"
  ],
  "model_max_length": 8192,
  "pad_token": "<|endoftext|>",
  "padding_side": "left",
  "remove_space": false,
  "tokenizer_class": "PreTrainedTokenizerFast"
}