Training in progress, step 10000
Browse files
adapter_config.json
CHANGED
@@ -22,13 +22,13 @@
|
|
22 |
"rank_pattern": {},
|
23 |
"revision": null,
|
24 |
"target_modules": [
|
25 |
-
"q_proj",
|
26 |
-
"o_proj",
|
27 |
-
"gate_proj",
|
28 |
-
"k_proj",
|
29 |
"v_proj",
|
|
|
|
|
|
|
30 |
"down_proj",
|
31 |
-
"up_proj"
|
|
|
32 |
],
|
33 |
"task_type": "CAUSAL_LM",
|
34 |
"use_dora": false,
|
|
|
22 |
"rank_pattern": {},
|
23 |
"revision": null,
|
24 |
"target_modules": [
|
|
|
|
|
|
|
|
|
25 |
"v_proj",
|
26 |
+
"k_proj",
|
27 |
+
"q_proj",
|
28 |
+
"up_proj",
|
29 |
"down_proj",
|
30 |
+
"o_proj",
|
31 |
+
"gate_proj"
|
32 |
],
|
33 |
"task_type": "CAUSAL_LM",
|
34 |
"use_dora": false,
|
adapter_model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 2460946960
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:86c419900cb0220667f19da28f719e5c572cb4a4203f167e798ddd4de63a350d
|
3 |
size 2460946960
|
runs/May11_14-07-26_94b28b3b7833/events.out.tfevents.1715436487.94b28b3b7833.176.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:953f924a8b64d10065bb8b390615f3b8649abc8dabb24cbd8f21faa3c8c01fe5
|
3 |
+
size 5885
|
tokenizer.json
CHANGED
@@ -460,10 +460,30 @@
|
|
460 |
"use_regex": true
|
461 |
},
|
462 |
"post_processor": {
|
463 |
-
"type": "
|
464 |
-
"
|
465 |
-
|
466 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
467 |
},
|
468 |
"decoder": {
|
469 |
"type": "ByteLevel",
|
@@ -479,6 +499,7 @@
|
|
479 |
"end_of_word_suffix": null,
|
480 |
"fuse_unk": false,
|
481 |
"byte_fallback": false,
|
|
|
482 |
"vocab": {
|
483 |
"<|endoftext|>": 0,
|
484 |
"<|padding|>": 1,
|
|
|
460 |
"use_regex": true
|
461 |
},
|
462 |
"post_processor": {
|
463 |
+
"type": "TemplateProcessing",
|
464 |
+
"single": [
|
465 |
+
{
|
466 |
+
"Sequence": {
|
467 |
+
"id": "A",
|
468 |
+
"type_id": 0
|
469 |
+
}
|
470 |
+
}
|
471 |
+
],
|
472 |
+
"pair": [
|
473 |
+
{
|
474 |
+
"Sequence": {
|
475 |
+
"id": "A",
|
476 |
+
"type_id": 0
|
477 |
+
}
|
478 |
+
},
|
479 |
+
{
|
480 |
+
"Sequence": {
|
481 |
+
"id": "B",
|
482 |
+
"type_id": 1
|
483 |
+
}
|
484 |
+
}
|
485 |
+
],
|
486 |
+
"special_tokens": {}
|
487 |
},
|
488 |
"decoder": {
|
489 |
"type": "ByteLevel",
|
|
|
499 |
"end_of_word_suffix": null,
|
500 |
"fuse_unk": false,
|
501 |
"byte_fallback": false,
|
502 |
+
"ignore_merges": false,
|
503 |
"vocab": {
|
504 |
"<|endoftext|>": 0,
|
505 |
"<|padding|>": 1,
|
tokenizer_config.json
CHANGED
@@ -1,4 +1,6 @@
|
|
1 |
{
|
|
|
|
|
2 |
"add_prefix_space": false,
|
3 |
"added_tokens_decoder": {
|
4 |
"0": {
|
|
|
1 |
{
|
2 |
+
"add_bos_token": false,
|
3 |
+
"add_eos_token": false,
|
4 |
"add_prefix_space": false,
|
5 |
"added_tokens_decoder": {
|
6 |
"0": {
|
training_args.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8db781c44455fe7bb96fd2029b04467c270de7d9e62308b5ab26aef36cf86797
|
3 |
+
size 5048
|