Model save
Browse files
.ipynb_checkpoints/adapter_config-checkpoint.json
ADDED
@@ -0,0 +1,34 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"alpha_pattern": {},
|
3 |
+
"auto_mapping": null,
|
4 |
+
"base_model_name_or_path": "NousResearch/Hermes-2-Pro-Mistral-7B",
|
5 |
+
"bias": "none",
|
6 |
+
"fan_in_fan_out": false,
|
7 |
+
"inference_mode": true,
|
8 |
+
"init_lora_weights": true,
|
9 |
+
"layers_pattern": null,
|
10 |
+
"layers_to_transform": null,
|
11 |
+
"loftq_config": {},
|
12 |
+
"lora_alpha": 128,
|
13 |
+
"lora_dropout": 0.05,
|
14 |
+
"megatron_config": null,
|
15 |
+
"megatron_core": "megatron.core",
|
16 |
+
"modules_to_save": [
|
17 |
+
"lm_head"
|
18 |
+
],
|
19 |
+
"peft_type": "LORA",
|
20 |
+
"r": 256,
|
21 |
+
"rank_pattern": {},
|
22 |
+
"revision": null,
|
23 |
+
"target_modules": [
|
24 |
+
"o_proj",
|
25 |
+
"up_proj",
|
26 |
+
"q_proj",
|
27 |
+
"down_proj",
|
28 |
+
"gate_proj",
|
29 |
+
"v_proj",
|
30 |
+
"k_proj"
|
31 |
+
],
|
32 |
+
"task_type": "CAUSAL_LM",
|
33 |
+
"use_rslora": false
|
34 |
+
}
|
.ipynb_checkpoints/added_tokens-checkpoint.json
ADDED
@@ -0,0 +1,34 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"<pad10>": 32010,
|
3 |
+
"<pad11>": 32011,
|
4 |
+
"<pad12>": 32012,
|
5 |
+
"<pad13>": 32013,
|
6 |
+
"<pad14>": 32014,
|
7 |
+
"<pad15>": 32015,
|
8 |
+
"<pad16>": 32016,
|
9 |
+
"<pad17>": 32017,
|
10 |
+
"<pad18>": 32018,
|
11 |
+
"<pad19>": 32019,
|
12 |
+
"<pad20>": 32020,
|
13 |
+
"<pad21>": 32021,
|
14 |
+
"<pad22>": 32022,
|
15 |
+
"<pad23>": 32023,
|
16 |
+
"<pad24>": 32024,
|
17 |
+
"<pad25>": 32025,
|
18 |
+
"<pad26>": 32026,
|
19 |
+
"<pad27>": 32027,
|
20 |
+
"<pad28>": 32028,
|
21 |
+
"<pad29>": 32029,
|
22 |
+
"<pad2>": 32002,
|
23 |
+
"<pad30>": 32030,
|
24 |
+
"<pad31>": 32031,
|
25 |
+
"<pad3>": 32003,
|
26 |
+
"<pad4>": 32004,
|
27 |
+
"<pad5>": 32005,
|
28 |
+
"<pad6>": 32006,
|
29 |
+
"<pad7>": 32007,
|
30 |
+
"<pad8>": 32008,
|
31 |
+
"<pad9>": 32009,
|
32 |
+
"<|im_end|>": 32000,
|
33 |
+
"<|im_start|>": 32001
|
34 |
+
}
|
adapter_model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1604645504
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bcfde312f99adf0e68f08d150a9d2464cb54cf8d4685eac79df7785e4b0ea9e1
|
3 |
size 1604645504
|
runs/Apr17_01-49-10_ubuntu2204/events.out.tfevents.1713332953.ubuntu2204.15251.0
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4571f3c1f4d921cd965d1fdad609c9ea19a49f962f0e42830869789852f79595
|
3 |
+
size 6671
|