webbigdata-jp committed on
Commit
86b66f0
1 Parent(s): 07ab101

version3 upload

Browse files
README.md CHANGED
@@ -1,13 +1,13 @@
1
  ---
2
  library_name: peft
3
- base_model: unsloth/gemma-7b-bnb-4bit
4
  language:
5
  - ja
6
  - en
7
  tags:
8
  - translation
9
  - qlora
10
- - gemma
11
  - text-generation-inference
12
  - nlp
13
  ---
@@ -16,6 +16,17 @@ tags:
16
 
17
  # News
18
 
 
 
 
 
 
 
 
 
 
 
 
19
  ## 2024.05.17
20
  C3TR-AdapterのVersion2を公開しました。
21
  Version 2 of C3TR-Adapter has been released.
@@ -546,12 +557,12 @@ Any feedback would be appreciated!
546
  ### 謝辞 Acknowledgment
547
 
548
  Original Base Model
549
- google/gemma-7b
550
- https://huggingface.co/google/gemma-7b
551
 
552
  Base Model
553
  unsloth/gemma-7b-bnb-4bit
554
- https://huggingface.co/unsloth/gemma-7b-bnb-4bit
555
 
556
  QLoRA Adapter
557
  webbigdata/C3TR-Adapter
 
1
  ---
2
  library_name: peft
3
+ base_model: unsloth/gemma-2-9b-it-bnb-4bit
4
  language:
5
  - ja
6
  - en
7
  tags:
8
  - translation
9
  - qlora
10
+ - gemma2
11
  - text-generation-inference
12
  - nlp
13
  ---
 
16
 
17
  # News
18
 
19
+ ## 2024.07.19
20
+ C3TR-AdapterのVersion3を公開しました。
21
+ Version 3 of C3TR-Adapter has been released.
22
+
23
+ このドキュメント等は現在、差し替え作業中で一部古いです。
24
+ This documentation is currently being updated, and some parts are out of date.
25
+
26
+
27
+
28
+
29
+
30
  ## 2024.05.17
31
  C3TR-AdapterのVersion2を公開しました。
32
  Version 2 of C3TR-Adapter has been released.
 
557
  ### 謝辞 Acknowledgment
558
 
559
  Original Base Model
560
+ google/gemma-2-9b-it
561
+ https://huggingface.co/google/gemma-2-9b-it
562
 
563
  Base Model
564
  unsloth/gemma-2-9b-it-bnb-4bit
565
+ https://huggingface.co/unsloth/gemma-2-9b-it-bnb-4bit
566
 
567
  QLoRA Adapter
568
  webbigdata/C3TR-Adapter
adapter_config.json CHANGED
@@ -1,7 +1,7 @@
1
  {
2
  "alpha_pattern": {},
3
  "auto_mapping": null,
4
- "base_model_name_or_path": "unsloth/gemma-7b-bnb-4bit",
5
  "bias": "none",
6
  "fan_in_fan_out": false,
7
  "inference_mode": true,
@@ -10,23 +10,23 @@
10
  "layers_pattern": null,
11
  "layers_to_transform": null,
12
  "loftq_config": {},
13
- "lora_alpha": 32,
14
- "lora_dropout": 0.05,
15
  "megatron_config": null,
16
  "megatron_core": "megatron.core",
17
  "modules_to_save": null,
18
  "peft_type": "LORA",
19
- "r": 64,
20
  "rank_pattern": {},
21
  "revision": "unsloth",
22
  "target_modules": [
23
- "o_proj",
 
24
  "k_proj",
25
- "q_proj",
26
- "down_proj",
27
  "up_proj",
28
- "gate_proj",
29
- "v_proj"
30
  ],
31
  "task_type": "CAUSAL_LM",
32
  "use_dora": false,
 
1
  {
2
  "alpha_pattern": {},
3
  "auto_mapping": null,
4
+ "base_model_name_or_path": "unsloth/gemma-2-9b-it-bnb-4bit",
5
  "bias": "none",
6
  "fan_in_fan_out": false,
7
  "inference_mode": true,
 
10
  "layers_pattern": null,
11
  "layers_to_transform": null,
12
  "loftq_config": {},
13
+ "lora_alpha": 64,
14
+ "lora_dropout": 0,
15
  "megatron_config": null,
16
  "megatron_core": "megatron.core",
17
  "modules_to_save": null,
18
  "peft_type": "LORA",
19
+ "r": 128,
20
  "rank_pattern": {},
21
  "revision": "unsloth",
22
  "target_modules": [
23
+ "gate_proj",
24
+ "v_proj",
25
  "k_proj",
26
+ "o_proj",
 
27
  "up_proj",
28
+ "q_proj",
29
+ "down_proj"
30
  ],
31
  "task_type": "CAUSAL_LM",
32
  "use_dora": false,
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:63574dfbad9845da5aaa22aa3344b88855f6e9ab3c33b90b2782bf8cd56bc1a7
3
- size 800116456
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:42eba5d7c8060d980d85c8e100ec5a6d6cbf1a6b044ab784660e0405feca5323
3
+ size 1728658208
tokenizer.json CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f30f819ff5b0f4cef2c8a6aafbeb20a13e7dd14409ece0f1e11e1d84bcfd281b
3
- size 17518937
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cd1df914b205b134e52f15364524a919423b48c9056d725b45c5b89187541de0
3
+ size 17518965
tokenizer_config.json CHANGED
@@ -1744,6 +1744,7 @@
1744
  "<end_of_turn>"
1745
  ],
1746
  "bos_token": "<bos>",
 
1747
  "clean_up_tokenization_spaces": false,
1748
  "eos_token": "<eos>",
1749
  "model_max_length": 8192,
 
1744
  "<end_of_turn>"
1745
  ],
1746
  "bos_token": "<bos>",
1747
+ "chat_template": "{{ bos_token }}{% if messages[0]['role'] == 'system' %}{{ raise_exception('System role not supported') }}{% endif %}{% for message in messages %}{% if (message['role'] == 'user') != (loop.index0 % 2 == 0) %}{{ raise_exception('Conversation roles must alternate user/assistant/user/assistant/...') }}{% endif %}{% if (message['role'] == 'assistant') %}{% set role = 'model' %}{% else %}{% set role = message['role'] %}{% endif %}{{ '<start_of_turn>' + role + '\n' + message['content'] | trim + '<end_of_turn>\n' }}{% endfor %}{% if add_generation_prompt %}{{'<start_of_turn>model\n'}}{% endif %}",
1748
  "clean_up_tokenization_spaces": false,
1749
  "eos_token": "<eos>",
1750
  "model_max_length": 8192,