Qwen2.5-14B-Instruct_16
Browse files- README.md +2 -2
- adapter_config.json +5 -5
- adapter_model.safetensors +1 -1
- added_tokens.json +0 -1
- special_tokens_map.json +1 -1
- tokenizer.json +2 -2
- tokenizer_config.json +1 -9
- training_args.bin +1 -1
README.md
CHANGED
@@ -28,7 +28,7 @@ print(output["generated_text"])
|
|
28 |
|
29 |
## Training procedure
|
30 |
|
31 |
-
[<img src="https://raw.githubusercontent.com/wandb/assets/main/wandb-github-badge-28.svg" alt="Visualize in Weights & Biases" width="150" height="24"/>](https://wandb.ai/radchenko-pn-ukrainian-catholic-university/NER_SFT/runs/
|
32 |
|
33 |
|
34 |
This model was trained with SFT.
|
@@ -36,7 +36,7 @@ This model was trained with SFT.
|
|
36 |
### Framework versions
|
37 |
|
38 |
- TRL: 0.14.0
|
39 |
-
- Transformers: 4.
|
40 |
- Pytorch: 2.5.1+cu124
|
41 |
- Datasets: 3.2.0
|
42 |
- Tokenizers: 0.21.0
|
|
|
28 |
|
29 |
## Training procedure
|
30 |
|
31 |
+
[<img src="https://raw.githubusercontent.com/wandb/assets/main/wandb-github-badge-28.svg" alt="Visualize in Weights & Biases" width="150" height="24"/>](https://wandb.ai/radchenko-pn-ukrainian-catholic-university/NER_SFT/runs/ax4zjmnd)
|
32 |
|
33 |
|
34 |
This model was trained with SFT.
|
|
|
36 |
### Framework versions
|
37 |
|
38 |
- TRL: 0.14.0
|
39 |
+
- Transformers: 4.47.1
|
40 |
- Pytorch: 2.5.1+cu124
|
41 |
- Datasets: 3.2.0
|
42 |
- Tokenizers: 0.21.0
|
adapter_config.json
CHANGED
@@ -23,13 +23,13 @@
|
|
23 |
"rank_pattern": {},
|
24 |
"revision": null,
|
25 |
"target_modules": [
|
26 |
-
"
|
27 |
-
"o_proj",
|
28 |
-
"down_proj",
|
29 |
-
"up_proj",
|
30 |
"q_proj",
|
|
|
31 |
"v_proj",
|
32 |
-
"
|
|
|
|
|
33 |
],
|
34 |
"task_type": "CAUSAL_LM",
|
35 |
"use_dora": false,
|
|
|
23 |
"rank_pattern": {},
|
24 |
"revision": null,
|
25 |
"target_modules": [
|
26 |
+
"gate_proj",
|
|
|
|
|
|
|
27 |
"q_proj",
|
28 |
+
"k_proj",
|
29 |
"v_proj",
|
30 |
+
"up_proj",
|
31 |
+
"o_proj",
|
32 |
+
"down_proj"
|
33 |
],
|
34 |
"task_type": "CAUSAL_LM",
|
35 |
"use_dora": false,
|
adapter_model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 275341720
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:422af23f4ae5b3b82d760f3506a9238e6846e74ca787b33b93de4e57a389c9f3
|
3 |
size 275341720
|
added_tokens.json
CHANGED
@@ -1,7 +1,6 @@
|
|
1 |
{
|
2 |
"</tool_call>": 151658,
|
3 |
"<tool_call>": 151657,
|
4 |
-
"<|PAD_TOKEN|>": 151665,
|
5 |
"<|box_end|>": 151649,
|
6 |
"<|box_start|>": 151648,
|
7 |
"<|endoftext|>": 151643,
|
|
|
1 |
{
|
2 |
"</tool_call>": 151658,
|
3 |
"<tool_call>": 151657,
|
|
|
4 |
"<|box_end|>": 151649,
|
5 |
"<|box_start|>": 151648,
|
6 |
"<|endoftext|>": 151643,
|
special_tokens_map.json
CHANGED
@@ -22,7 +22,7 @@
|
|
22 |
"single_word": false
|
23 |
},
|
24 |
"pad_token": {
|
25 |
-
"content": "<|
|
26 |
"lstrip": false,
|
27 |
"normalized": false,
|
28 |
"rstrip": false,
|
|
|
22 |
"single_word": false
|
23 |
},
|
24 |
"pad_token": {
|
25 |
+
"content": "<|vision_pad|>",
|
26 |
"lstrip": false,
|
27 |
"normalized": false,
|
28 |
"rstrip": false,
|
tokenizer.json
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9c5ae00e602b8860cbd784ba82a8aa14e8feecec692e7076590d014d7b7fdafa
|
3 |
+
size 11421896
|
tokenizer_config.json
CHANGED
@@ -177,14 +177,6 @@
|
|
177 |
"rstrip": false,
|
178 |
"single_word": false,
|
179 |
"special": false
|
180 |
-
},
|
181 |
-
"151665": {
|
182 |
-
"content": "<|PAD_TOKEN|>",
|
183 |
-
"lstrip": false,
|
184 |
-
"normalized": false,
|
185 |
-
"rstrip": false,
|
186 |
-
"single_word": false,
|
187 |
-
"special": true
|
188 |
}
|
189 |
},
|
190 |
"additional_special_tokens": [
|
@@ -209,7 +201,7 @@
|
|
209 |
"errors": "replace",
|
210 |
"extra_special_tokens": {},
|
211 |
"model_max_length": 32768,
|
212 |
-
"pad_token": "<|
|
213 |
"padding_side": "right",
|
214 |
"split_special_tokens": false,
|
215 |
"tokenizer_class": "Qwen2Tokenizer",
|
|
|
177 |
"rstrip": false,
|
178 |
"single_word": false,
|
179 |
"special": false
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
180 |
}
|
181 |
},
|
182 |
"additional_special_tokens": [
|
|
|
201 |
"errors": "replace",
|
202 |
"extra_special_tokens": {},
|
203 |
"model_max_length": 32768,
|
204 |
+
"pad_token": "<|vision_pad|>",
|
205 |
"padding_side": "right",
|
206 |
"split_special_tokens": false,
|
207 |
"tokenizer_class": "Qwen2Tokenizer",
|
training_args.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 5624
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d9045f2a71bf96bc6d055f6e755138fc6861427ada644b759baf0b7465a54575
|
3 |
size 5624
|