Model save
Browse files- README.md +1 -1
- adapter_config.json +17 -17
- adapter_model.safetensors +1 -1
- training_args.bin +1 -1
README.md
CHANGED
@@ -40,7 +40,7 @@ The following hyperparameters were used during training:
|
|
40 |
- optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
|
41 |
- lr_scheduler_type: cosine
|
42 |
- lr_scheduler_warmup_steps: 5
|
43 |
-
- training_steps:
|
44 |
|
45 |
### Training results
|
46 |
|
|
|
40 |
- optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
|
41 |
- lr_scheduler_type: cosine
|
42 |
- lr_scheduler_warmup_steps: 5
|
43 |
+
- training_steps: 30
|
44 |
|
45 |
### Training results
|
46 |
|
adapter_config.json
CHANGED
@@ -20,30 +20,30 @@
|
|
20 |
"rank_pattern": {},
|
21 |
"revision": null,
|
22 |
"target_modules": [
|
23 |
-
"transformer.h.5.mlp.c_fc",
|
24 |
-
"transformer.h.5.mlp.c_proj",
|
25 |
-
"transformer.h.2.mlp.c_proj",
|
26 |
-
"transformer.h.0.mlp.c_fc",
|
27 |
-
"transformer.h.0.attn.c_attn",
|
28 |
"transformer.h.2.attn.c_proj",
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
29 |
"transformer.h.1.mlp.c_proj",
|
30 |
-
"transformer.h.
|
31 |
-
"transformer.h.3.mlp.c_fc",
|
32 |
-
"transformer.h.4.attn.c_attn",
|
33 |
"transformer.h.3.attn.c_proj",
|
|
|
34 |
"transformer.h.5.attn.c_proj",
|
35 |
-
"transformer.h.
|
36 |
"transformer.h.1.attn.c_proj",
|
|
|
|
|
37 |
"transformer.h.5.attn.c_attn",
|
38 |
-
"transformer.h.
|
39 |
-
"transformer.h.2.attn.c_attn",
|
40 |
-
"transformer.h.3.attn.c_attn",
|
41 |
-
"transformer.h.0.attn.c_proj",
|
42 |
-
"transformer.h.4.mlp.c_fc",
|
43 |
-
"transformer.h.2.mlp.c_fc",
|
44 |
"transformer.h.3.mlp.c_proj",
|
45 |
-
"transformer.h.4.attn.
|
46 |
-
"transformer.h.
|
|
|
|
|
47 |
],
|
48 |
"task_type": "CAUSAL_LM",
|
49 |
"use_dora": false,
|
|
|
20 |
"rank_pattern": {},
|
21 |
"revision": null,
|
22 |
"target_modules": [
|
|
|
|
|
|
|
|
|
|
|
23 |
"transformer.h.2.attn.c_proj",
|
24 |
+
"transformer.h.0.attn.c_proj",
|
25 |
+
"transformer.h.0.mlp.c_proj",
|
26 |
+
"transformer.h.1.attn.c_attn",
|
27 |
+
"transformer.h.4.mlp.c_fc",
|
28 |
+
"transformer.h.5.mlp.c_fc",
|
29 |
+
"transformer.h.3.attn.c_attn",
|
30 |
+
"transformer.h.2.attn.c_attn",
|
31 |
"transformer.h.1.mlp.c_proj",
|
32 |
+
"transformer.h.2.mlp.c_fc",
|
|
|
|
|
33 |
"transformer.h.3.attn.c_proj",
|
34 |
+
"transformer.h.4.attn.c_proj",
|
35 |
"transformer.h.5.attn.c_proj",
|
36 |
+
"transformer.h.0.mlp.c_fc",
|
37 |
"transformer.h.1.attn.c_proj",
|
38 |
+
"transformer.h.1.mlp.c_fc",
|
39 |
+
"transformer.h.0.attn.c_attn",
|
40 |
"transformer.h.5.attn.c_attn",
|
41 |
+
"transformer.h.3.mlp.c_fc",
|
|
|
|
|
|
|
|
|
|
|
42 |
"transformer.h.3.mlp.c_proj",
|
43 |
+
"transformer.h.4.attn.c_attn",
|
44 |
+
"transformer.h.2.mlp.c_proj",
|
45 |
+
"transformer.h.5.mlp.c_proj",
|
46 |
+
"transformer.h.4.mlp.c_proj"
|
47 |
],
|
48 |
"task_type": "CAUSAL_LM",
|
49 |
"use_dora": false,
|
adapter_model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 2365304
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:313174a13db3decbfdb8cc89ca7bf90b3b0a449053671b790cd0670f6c2fa00b
|
3 |
size 2365304
|
training_args.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 5112
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:58c2d8043c93feda75c4844001deaf3b934b34158ab14a6bcf4e66560335330a
|
3 |
size 5112
|