voidful committed on
Commit
cf614a4
1 Parent(s): ab8ffc0

Upload tokenizer

Browse files
Files changed (3) hide show
  1. README.md +1 -1
  2. tokenizer.json +1 -0
  3. tokenizer_config.json +3 -1
README.md CHANGED
@@ -1,7 +1,7 @@
1
  ---
2
- license: mit
3
  language:
4
  - en
 
5
  ---
6
 
7
  ## Model Summary
 
1
  ---
 
2
  language:
3
  - en
4
+ license: mit
5
  ---
6
 
7
  ## Model Summary
tokenizer.json CHANGED
@@ -276556,6 +276556,7 @@
276556
  "end_of_word_suffix": "",
276557
  "fuse_unk": false,
276558
  "byte_fallback": false,
 
276559
  "vocab": {
276560
  "!": 0,
276561
  "\"": 1,
 
276556
  "end_of_word_suffix": "",
276557
  "fuse_unk": false,
276558
  "byte_fallback": false,
276559
+ "ignore_merges": false,
276560
  "vocab": {
276561
  "!": 0,
276562
  "\"": 1,
tokenizer_config.json CHANGED
@@ -245803,11 +245803,13 @@
245803
  }
245804
  },
245805
  "bos_token": "<|endoftext|>",
245806
- "chat_template": "{% for message in messages %}\n {% if message['role'] == 'assistant' %}\n {% if messages|length > 1 %}\n {{- '<|im_start|>assistant\\n' -}}\n {% endif %}\n {{- message['content'] + '<|im_end|>\\n' -}}\n {% else %}\n {{- '<|im_start|>' + message['role'] + '\\n' + message['content'] + '<|im_end|>\\n' -}}\n {% endif %}\n{% endfor %}\n{% if add_generation_prompt %}\n {{- '<|im_start|>assistant\\n' -}}\n{% endif %}\n",
245807
  "clean_up_tokenization_spaces": true,
 
245808
  "eos_token": "<|endoftext|>",
245809
  "model_max_length": 2048,
245810
  "pad_token": "<pad>",
 
245811
  "tokenizer_class": "CodeGenTokenizer",
245812
  "unk_token": "<|endoftext|>"
245813
  }
 
245803
  }
245804
  },
245805
  "bos_token": "<|endoftext|>",
245806
+ "chat_template": "{% for message in messages %}{% if message['role'] == 'user' %}{{'<|im_start|>user\\n' + message['content'].strip() + ' <|im_end|>' }}{% elif message['role'] == 'system' %}{{ '<|im_start|>system\\n' + message['content'].strip() + '<|im_end|>\\n' }}{% elif message['role'] == 'assistant' %}{{ '<|im_start|>assistant \\n' + message['content'] + ' <|im_end|>'}}{% endif %}{% endfor %}",
245807
  "clean_up_tokenization_spaces": true,
245808
+ "device_map": "auto",
245809
  "eos_token": "<|endoftext|>",
245810
  "model_max_length": 2048,
245811
  "pad_token": "<pad>",
245812
+ "return_token_type_ids": false,
245813
  "tokenizer_class": "CodeGenTokenizer",
245814
  "unk_token": "<|endoftext|>"
245815
  }