{ "add_bos_token": false, "add_prefix_space": false, "added_tokens_decoder": { "50256": { "content": "<|endoftext|>", "lstrip": false, "normalized": true, "rstrip": false, "single_word": false, "special": true }, "50257": { "content": "<||bos||>", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "50258": { "content": "<||pad||>", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "50259": { "content": "<||unk||>", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "50260": { "content": "", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "50261": { "content": "", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true }, "50262": { "content": "", "lstrip": false, "normalized": false, "rstrip": false, "single_word": false, "special": true } }, "additional_special_tokens": [ "<|endoftext|>", "<||bos||>", "<||pad||>", "<||unk||>", "", "", "" ], "bos_token": "", "clean_up_tokenization_spaces": true, "eos_token": "", "errors": "replace", "model_max_length": 8192, "pad_token": "<||pad||>", "tokenizer_class": "GPT2Tokenizer", "unk_token": "" }