Jujeong
/

1k_dataset_ft_adaper

Model card Files Files and versions Metrics Training metrics Community

1k_dataset_ft_adaper / tokenizer_config.json

Jujeong's picture

Initial commit

cff336f verified 11 days ago

raw history blame contribute delete

No virus

1.95 kB

	{
	"add_bos_token": false,
	"add_eos_token": false,
	"add_prefix_space": true,
	"added_tokens_decoder": {
	"0": {
	"content": "<\|pad\|>",
	"lstrip": false,
	"normalized": false,
	"rstrip": false,
	"single_word": false,
	"special": true
	},
	"1": {
	"content": "<\|begin_of_text\|>",
	"lstrip": false,
	"normalized": false,
	"rstrip": false,
	"single_word": false,
	"special": true
	},
	"2": {
	"content": "<\|end_of_text\|>",
	"lstrip": false,
	"normalized": false,
	"rstrip": false,
	"single_word": false,
	"special": true
	},
	"5": {
	"content": "<\|eot_id\|>",
	"lstrip": false,
	"normalized": false,
	"rstrip": false,
	"single_word": false,
	"special": true
	},
	"6": {
	"content": "<\|start_header_id\|>",
	"lstrip": false,
	"normalized": false,
	"rstrip": false,
	"single_word": false,
	"special": true
	},
	"7": {
	"content": "<\|end_header_id\|>",
	"lstrip": false,
	"normalized": false,
	"rstrip": false,
	"single_word": false,
	"special": true
	}
	},
	"bos_token": "<\|begin_of_text\|>",
	"chat_template": "{% set loop_messages = messages %}{% for message in loop_messages %}{% set content = '<\|start_header_id\|>' + message['role'] + '<\|end_header_id\|>\n\n'+ message['content'] \| trim + '<\|eot_id\|>' %}{% if loop.index0 == 0 %}{% set content = bos_token + content %}{% endif %}{{ content }}{% endfor %}{% if add_generation_prompt %}{{ '<\|start_header_id\|>assistant<\|end_header_id\|>\n\n' }}{% endif %}",
	"clean_up_tokenization_spaces": false,
	"eos_token": "<\|end_of_text\|>",
	"legacy": true,
	"model_max_length": 4096,
	"pad_token": "<\|pad\|>",
	"padding_side": "right",
	"sp_model_kwargs": {},
	"spaces_between_special_tokens": false,
	"tokenizer_class": "PreTrainedTokenizerFast",
	"use_default_system_prompt": false
	}