danielhanchen committed on
Commit
819c677
1 Parent(s): 05ff320

Upload tokenizer

Browse files
Files changed (2) hide show
  1. README.md +0 -1
  2. tokenizer_config.json +1 -2
README.md CHANGED
@@ -8,7 +8,6 @@ tags:
8
  - transformers
9
  - gemma
10
  - bnb
11
-
12
  ---
13
 
14
  # Finetune Mistral, Gemma, Llama 2-5x faster with 70% less memory via Unsloth!
 
8
  - transformers
9
  - gemma
10
  - bnb
 
11
  ---
12
 
13
  # Finetune Mistral, Gemma, Llama 2-5x faster with 70% less memory via Unsloth!
tokenizer_config.json CHANGED
@@ -1743,9 +1743,8 @@
1743
  "chat_template": "{{ bos_token }}{% if messages[0]['role'] == 'system' %}{{ raise_exception('System role not supported') }}{% endif %}{% for message in messages %}{% if (message['role'] == 'user') != (loop.index0 % 2 == 0) %}{{ raise_exception('Conversation roles must alternate user/assistant/user/assistant/...') }}{% endif %}{% if (message['role'] == 'assistant') %}{% set role = 'model' %}{% else %}{% set role = message['role'] %}{% endif %}{{ '<start_of_turn>' + role + '\n' + message['content'] | trim + '<end_of_turn>\n' }}{% endfor %}{% if add_generation_prompt %}{{'<start_of_turn>model\n'}}{% endif %}",
1744
  "clean_up_tokenization_spaces": false,
1745
  "eos_token": "<eos>",
1746
- "model_max_length": 8192,
1747
  "pad_token": "<pad>",
1748
- "padding_side": "right",
1749
  "sp_model_kwargs": {},
1750
  "spaces_between_special_tokens": false,
1751
  "tokenizer_class": "GemmaTokenizer",
 
1743
  "chat_template": "{{ bos_token }}{% if messages[0]['role'] == 'system' %}{{ raise_exception('System role not supported') }}{% endif %}{% for message in messages %}{% if (message['role'] == 'user') != (loop.index0 % 2 == 0) %}{{ raise_exception('Conversation roles must alternate user/assistant/user/assistant/...') }}{% endif %}{% if (message['role'] == 'assistant') %}{% set role = 'model' %}{% else %}{% set role = message['role'] %}{% endif %}{{ '<start_of_turn>' + role + '\n' + message['content'] | trim + '<end_of_turn>\n' }}{% endfor %}{% if add_generation_prompt %}{{'<start_of_turn>model\n'}}{% endif %}",
1744
  "clean_up_tokenization_spaces": false,
1745
  "eos_token": "<eos>",
1746
+ "model_max_length": 1000000000000000019884624838656,
1747
  "pad_token": "<pad>",
 
1748
  "sp_model_kwargs": {},
1749
  "spaces_between_special_tokens": false,
1750
  "tokenizer_class": "GemmaTokenizer",