Upload tokenizer
Browse files
- README.md +1 -1
- tokenizer.json +1 -0
- tokenizer_config.json +3 -1
README.md
CHANGED
@@ -1,7 +1,7 @@
|
|
1 |
---
|
2 |
-
license: mit
|
3 |
language:
|
4 |
- en
|
|
|
5 |
---
|
6 |
|
7 |
## Model Summary
|
|
|
1 |
---
|
|
|
2 |
language:
|
3 |
- en
|
4 |
+
license: mit
|
5 |
---
|
6 |
|
7 |
## Model Summary
|
tokenizer.json
CHANGED
@@ -276556,6 +276556,7 @@
|
|
276556 |
"end_of_word_suffix": "",
|
276557 |
"fuse_unk": false,
|
276558 |
"byte_fallback": false,
|
|
|
276559 |
"vocab": {
|
276560 |
"!": 0,
|
276561 |
"\"": 1,
|
|
|
276556 |
"end_of_word_suffix": "",
|
276557 |
"fuse_unk": false,
|
276558 |
"byte_fallback": false,
|
276559 |
+
"ignore_merges": false,
|
276560 |
"vocab": {
|
276561 |
"!": 0,
|
276562 |
"\"": 1,
|
tokenizer_config.json
CHANGED
@@ -245803,11 +245803,13 @@
|
|
245803 |
}
|
245804 |
},
|
245805 |
"bos_token": "<|endoftext|>",
|
245806 |
-
"chat_template": "{% for message in messages %}
|
245807 |
"clean_up_tokenization_spaces": true,
|
|
|
245808 |
"eos_token": "<|endoftext|>",
|
245809 |
"model_max_length": 2048,
|
245810 |
"pad_token": "<pad>",
|
|
|
245811 |
"tokenizer_class": "CodeGenTokenizer",
|
245812 |
"unk_token": "<|endoftext|>"
|
245813 |
}
|
|
|
245803 |
}
|
245804 |
},
|
245805 |
"bos_token": "<|endoftext|>",
|
245806 |
+
"chat_template": "{% for message in messages %}{% if message['role'] == 'user' %}{{'<|im_start|>user\\n' + message['content'].strip() + ' <|im_end|>' }}{% elif message['role'] == 'system' %}{{ '<|im_start|>system\\n' + message['content'].strip() + '<|im_end|>\\n' }}{% elif message['role'] == 'assistant' %}{{ '<|im_start|>assistant \\n' + message['content'] + ' <|im_end|>'}}{% endif %}{% endfor %}",
|
245807 |
"clean_up_tokenization_spaces": true,
|
245808 |
+
"device_map": "auto",
|
245809 |
"eos_token": "<|endoftext|>",
|
245810 |
"model_max_length": 2048,
|
245811 |
"pad_token": "<pad>",
|
245812 |
+
"return_token_type_ids": false,
|
245813 |
"tokenizer_class": "CodeGenTokenizer",
|
245814 |
"unk_token": "<|endoftext|>"
|
245815 |
}
|