Commit message
Browse files- README.md +2 -6
- adapter_config.json +2 -2
- adapter_model.safetensors +1 -1
- runs/Nov09_09-17-24_ip-10-192-12-219/events.out.tfevents.1731143845.ip-10-192-12-219.117549.0 +3 -0
- runs/Nov09_09-26-40_ip-10-192-12-219/events.out.tfevents.1731144401.ip-10-192-12-219.117549.1 +3 -0
- runs/Nov09_09-29-40_ip-10-192-12-219/events.out.tfevents.1731144580.ip-10-192-12-219.117549.2 +3 -0
- runs/Nov09_09-56-07_ip-10-192-12-219/events.out.tfevents.1731146169.ip-10-192-12-219.181121.0 +3 -0
- runs/Nov09_09-59-21_ip-10-192-12-219/events.out.tfevents.1731146362.ip-10-192-12-219.181121.1 +3 -0
- runs/Nov09_10-01-40_ip-10-192-12-219/events.out.tfevents.1731146501.ip-10-192-12-219.181121.2 +3 -0
- runs/Nov09_10-04-49_ip-10-192-12-219/events.out.tfevents.1731146690.ip-10-192-12-219.181121.3 +3 -0
- runs/Nov09_12-49-26_ip-10-192-11-134/events.out.tfevents.1731156569.ip-10-192-11-134.1666.0 +3 -0
- runs/Nov09_13-00-15_ip-10-192-11-134/events.out.tfevents.1731157217.ip-10-192-11-134.15162.0 +3 -0
- runs/Nov09_13-16-26_ip-10-192-11-134/events.out.tfevents.1731158189.ip-10-192-11-134.36325.0 +3 -0
- runs/Nov09_13-27-17_ip-10-192-11-134/events.out.tfevents.1731158839.ip-10-192-11-134.50779.0 +3 -0
- runs/Nov09_13-32-54_ip-10-192-11-134/events.out.tfevents.1731159177.ip-10-192-11-134.58325.0 +3 -0
- runs/Nov09_13-34-32_ip-10-192-11-134/events.out.tfevents.1731159274.ip-10-192-11-134.60568.0 +3 -0
- runs/Nov09_13-36-14_ip-10-192-11-134/events.out.tfevents.1731159377.ip-10-192-11-134.62817.0 +3 -0
- tokenizer.json +2 -2
- training_args.bin +2 -2
README.md
CHANGED
@@ -41,19 +41,15 @@ The following hyperparameters were used during training:
|
|
41 |
- seed: 42
|
42 |
- gradient_accumulation_steps: 8
|
43 |
- total_train_batch_size: 32
|
44 |
-
- optimizer:
|
45 |
- lr_scheduler_type: constant
|
46 |
- lr_scheduler_warmup_ratio: 0.03
|
47 |
- num_epochs: 3
|
48 |
|
49 |
-
### Training results
|
50 |
-
|
51 |
-
|
52 |
-
|
53 |
### Framework versions
|
54 |
|
55 |
- PEFT 0.13.0
|
56 |
-
- Transformers 4.
|
57 |
- Pytorch 2.4.0+cu121
|
58 |
- Datasets 3.0.1
|
59 |
- Tokenizers 0.20.1
|
|
|
41 |
- seed: 42
|
42 |
- gradient_accumulation_steps: 8
|
43 |
- total_train_batch_size: 32
|
44 |
+
- optimizer: Use adamw_torch_fused with betas=(0.9,0.999) and epsilon=1e-08 and optimizer_args=No additional optimizer arguments
|
45 |
- lr_scheduler_type: constant
|
46 |
- lr_scheduler_warmup_ratio: 0.03
|
47 |
- num_epochs: 3
|
48 |
|
|
|
|
|
|
|
|
|
49 |
### Framework versions
|
50 |
|
51 |
- PEFT 0.13.0
|
52 |
+
- Transformers 4.46.2
|
53 |
- Pytorch 2.4.0+cu121
|
54 |
- Datasets 3.0.1
|
55 |
- Tokenizers 0.20.1
|
adapter_config.json
CHANGED
@@ -20,8 +20,8 @@
|
|
20 |
"rank_pattern": {},
|
21 |
"revision": null,
|
22 |
"target_modules": [
|
23 |
-
"
|
24 |
-
"
|
25 |
],
|
26 |
"task_type": "CAUSAL_LM",
|
27 |
"use_dora": false,
|
|
|
20 |
"rank_pattern": {},
|
21 |
"revision": null,
|
22 |
"target_modules": [
|
23 |
+
"v_proj",
|
24 |
+
"q_proj"
|
25 |
],
|
26 |
"task_type": "CAUSAL_LM",
|
27 |
"use_dora": false,
|
adapter_model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 23641256
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2d5c3fc263a5012355bc2a1c8e2701cbb93dbf7083de71e55f1cbd7f29349b46
|
3 |
size 23641256
|
runs/Nov09_09-17-24_ip-10-192-12-219/events.out.tfevents.1731143845.ip-10-192-12-219.117549.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:623ae07bc0481d0d566fad78bdb85f89bc42948fcb7460fd1b8c907c21dd70d1
|
3 |
+
size 10346
|
runs/Nov09_09-26-40_ip-10-192-12-219/events.out.tfevents.1731144401.ip-10-192-12-219.117549.1
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:57e50aa9bd50678162a4e3efa86de578ff330fdb18b4f9dd9846d13ca9fde254
|
3 |
+
size 6046
|
runs/Nov09_09-29-40_ip-10-192-12-219/events.out.tfevents.1731144580.ip-10-192-12-219.117549.2
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4bec367eeb00b1a84f7139acc9a73bd0324483a88bc34848cce74955b8a2c820
|
3 |
+
size 6046
|
runs/Nov09_09-56-07_ip-10-192-12-219/events.out.tfevents.1731146169.ip-10-192-12-219.181121.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fbc7ab9ccdd50f53b3053c32ba272e3baa94e961db378bc19bd41099f22eec53
|
3 |
+
size 6047
|
runs/Nov09_09-59-21_ip-10-192-12-219/events.out.tfevents.1731146362.ip-10-192-12-219.181121.1
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9ae452ac0c6c21dd29a2183b64a2cd9cf334079ba921a68518530053962a012b
|
3 |
+
size 6047
|
runs/Nov09_10-01-40_ip-10-192-12-219/events.out.tfevents.1731146501.ip-10-192-12-219.181121.2
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:deba96ae93b77219b83597011f3ab8b0ee6d44e80985d59e8d0f2e41e120f8d9
|
3 |
+
size 6047
|
runs/Nov09_10-04-49_ip-10-192-12-219/events.out.tfevents.1731146690.ip-10-192-12-219.181121.3
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6018e412e2b46bfaaaf1017051231af23e88c08f011979f969ffa9d184839900
|
3 |
+
size 6047
|
runs/Nov09_12-49-26_ip-10-192-11-134/events.out.tfevents.1731156569.ip-10-192-11-134.1666.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cd64045a4e9b750c2ffc4e49632d0700f13c8d6f909c1e48665945b52b50c381
|
3 |
+
size 6047
|
runs/Nov09_13-00-15_ip-10-192-11-134/events.out.tfevents.1731157217.ip-10-192-11-134.15162.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:df5db4cfc1f979f5463c818909ad141658bf0fde38503dae5191a7af8d593f24
|
3 |
+
size 10346
|
runs/Nov09_13-16-26_ip-10-192-11-134/events.out.tfevents.1731158189.ip-10-192-11-134.36325.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:efd8e9d1ad9a023ba2dc44044c39f6b014ff939b9329bfdac94eb4a776b1496b
|
3 |
+
size 10543
|
runs/Nov09_13-27-17_ip-10-192-11-134/events.out.tfevents.1731158839.ip-10-192-11-134.50779.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:605bcf0f0466eb447092069065157b48f6e140ea12fff242547ba8f83cf6739e
|
3 |
+
size 10062
|
runs/Nov09_13-32-54_ip-10-192-11-134/events.out.tfevents.1731159177.ip-10-192-11-134.58325.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6374e83a43530f7bfb579e56b4ee8473a128d3e488765cab5a259c4063da414a
|
3 |
+
size 10062
|
runs/Nov09_13-34-32_ip-10-192-11-134/events.out.tfevents.1731159274.ip-10-192-11-134.60568.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bdd2a5029f533d57e1fc3e32ba86ccfb5df60a1217c7a146ac6cdd1563169b93
|
3 |
+
size 10062
|
runs/Nov09_13-36-14_ip-10-192-11-134/events.out.tfevents.1731159377.ip-10-192-11-134.62817.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5781f84c5643d81e5d765b51dd151a9bc257922d754df75bf26d035cceb15748
|
3 |
+
size 10062
|
tokenizer.json
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9816d43bd5347d64bccc66b7710947fb18e9818cc660215b1462061d4a44e449
|
3 |
+
size 17210088
|
training_args.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:540974c06f0e6342b8a99442a23bb28a0c06f97ca9b94c689f0aa0dc07fcda2f
|
3 |
+
size 5624
|