Hastagaras committed on
Commit
4c1f395
1 Parent(s): 9c0b6db

Upload tokenizer

Browse files
Files changed (3) hide show
  1. README.md +4 -5
  2. tokenizer.json +2 -2
  3. tokenizer_config.json +2 -5
README.md CHANGED
@@ -1,14 +1,13 @@
1
  ---
 
 
 
 
2
  base_model:
3
  - crestf411/gemma2-9B-sunfall-v0.5.2
4
  - Hastagaras/Gemma-Model1
5
  - IlyaGusev/gemma-2-9b-it-abliterated
6
  - Hastagaras/Gemmoy-9B-G2-MK.3
7
- library_name: transformers
8
- tags:
9
- - mergekit
10
- - merge
11
-
12
  ---
13
  i just realized it became 10b and I don't know why
14
 
 
1
  ---
2
+ library_name: transformers
3
+ tags:
4
+ - mergekit
5
+ - merge
6
  base_model:
7
  - crestf411/gemma2-9B-sunfall-v0.5.2
8
  - Hastagaras/Gemma-Model1
9
  - IlyaGusev/gemma-2-9b-it-abliterated
10
  - Hastagaras/Gemmoy-9B-G2-MK.3
 
 
 
 
 
11
  ---
12
  i just realized it became 10b and I don't know why
13
 
tokenizer.json CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6baaffa9d0e48eb225a65139caaa8f6dbeea24f43defeb29b7ee35d4d011716d
3
- size 17518679
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c15eb04bc5ad609fb26533e8525302c5640a945e5f67f65b7c849900acda7d99
3
+ size 17518497
tokenizer_config.json CHANGED
@@ -1744,14 +1744,11 @@
1744
  "<end_of_turn>"
1745
  ],
1746
  "bos_token": "<bos>",
1747
- "chat_template": "{% for message in messages -%}{%- if message['role'] == 'system' -%}<start_of_turn>user{{ '\n' }}{{ message['content'] | trim }}{%- if loop.nextitem is defined and loop.nextitem['role'] == 'user' %}{{ '\n\n' }}{{ loop.nextitem['content'] | trim }}<end_of_turn>{%- else -%}<end_of_turn>{%- endif -%}{%- elif message['role'] == 'user' and loop.previtem is defined and loop.previtem['role'] == 'system' -%}{# Skip this message as it was already included #}{%- else -%}<start_of_turn>{% if message['role'] == 'assistant' %}model{% else %}{{ message['role'] }}{% endif %}{{ '\n' }}{{ message['content'] | trim }}<end_of_turn>{%- endif -%}{%- if not loop.last and not (message['role'] == 'system' and loop.nextitem['role'] == 'user') -%}{{ '\n' }}{%- endif -%}{%- endfor -%}{%- if add_generation_prompt -%}{{ '\n' }}<start_of_turn>model{%- endif -%}", "clean_up_tokenization_spaces": false,
 
1748
  "eos_token": "<eos>",
1749
- "max_length": null,
1750
  "model_max_length": 1000000000000000019884624838656,
1751
- "pad_to_multiple_of": null,
1752
  "pad_token": "<pad>",
1753
- "pad_token_type_id": 0,
1754
- "padding_side": "left",
1755
  "sp_model_kwargs": {},
1756
  "spaces_between_special_tokens": false,
1757
  "tokenizer_class": "GemmaTokenizer",
 
1744
  "<end_of_turn>"
1745
  ],
1746
  "bos_token": "<bos>",
1747
+ "chat_template": "{{ bos_token }}{% if messages[0]['role'] == 'system' %}{{ raise_exception('System role not supported') }}{% endif %}{% for message in messages %}{% if (message['role'] == 'user') != (loop.index0 % 2 == 0) %}{{ raise_exception('Conversation roles must alternate user/assistant/user/assistant/...') }}{% endif %}{% if (message['role'] == 'assistant') %}{% set role = 'model' %}{% else %}{% set role = message['role'] %}{% endif %}{{ '<start_of_turn>' + role + '\n' + message['content'] | trim + '<end_of_turn>\n' }}{% endfor %}{% if add_generation_prompt %}{{'<start_of_turn>model\n'}}{% endif %}",
1748
+ "clean_up_tokenization_spaces": false,
1749
  "eos_token": "<eos>",
 
1750
  "model_max_length": 1000000000000000019884624838656,
 
1751
  "pad_token": "<pad>",
 
 
1752
  "sp_model_kwargs": {},
1753
  "spaces_between_special_tokens": false,
1754
  "tokenizer_class": "GemmaTokenizer",