elplaguister committed on
Commit
e55ebbd
1 Parent(s): 14264ab

add tokenizer

Browse files
special_tokens_map.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"bos_token": "<s>", "eos_token": "</s>", "unk_token": "<unk>", "pad_token": "<pad>"}
tokenizer.json ADDED
The diff for this file is too large to render. See raw diff
 
tokenizer_config.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"do_lower_case": false, "unk_token": "<unk>", "pad_token": "<pad>", "bos_token": "<s>", "eos_token": "</s>", "special_tokens_map_file": "/Users/elplaguister/.cache/huggingface/transformers/81bb172c5a6c70898d8a2e22cf133bb951e80e92f6f12d3bd4c6270bcfd8413f.9d6cd81ef646692fb1c169a880161ea1cb95f49694f220aced9b704b457e51dd", "name_or_path": "taeminlee/kogpt2", "tokenizer_class": "PreTrainedTokenizerFast"}