End of training
Browse files- README.md +3 -2
- adapter_config.json +5 -5
- adapter_model.safetensors +1 -1
- model-00001-of-00004.safetensors +1 -1
- model-00002-of-00004.safetensors +1 -1
- model-00003-of-00004.safetensors +1 -1
- model-00004-of-00004.safetensors +1 -1
- runs/Jan17_12-57-58_b5637b3f66b9/events.out.tfevents.1705496304.b5637b3f66b9.192182.0 +3 -0
- training_args.bin +1 -1
README.md
CHANGED
@@ -41,7 +41,7 @@ dataset_prepared_path: last_run_prepared
|
|
41 |
val_set_size: 0.0
|
42 |
output_dir: ./zephyr-deita-kto-3ep-v3-r512-bsz16-cosine
|
43 |
save_total_limit: 3
|
44 |
-
hub_model_id: openaccess-ai-collective/kto-zephyr-deita-nectar
|
45 |
|
46 |
adapter: lora
|
47 |
lora_model_dir:
|
@@ -71,6 +71,7 @@ wandb_watch:
|
|
71 |
wandb_run_id:
|
72 |
wandb_name: kto-3ep-v3-r512-bsz16-lr2e-5-cosine
|
73 |
wandb_log_model:
|
|
|
74 |
|
75 |
gradient_accumulation_steps: 1
|
76 |
micro_batch_size: 4
|
@@ -101,7 +102,7 @@ warmup_steps: 10
|
|
101 |
eval_steps:
|
102 |
eval_table_size:
|
103 |
eval_table_max_new_tokens: 128
|
104 |
-
save_steps:
|
105 |
debug:
|
106 |
deepspeed:
|
107 |
weight_decay: 0.1
|
|
|
41 |
val_set_size: 0.0
|
42 |
output_dir: ./zephyr-deita-kto-3ep-v3-r512-bsz16-cosine
|
43 |
save_total_limit: 3
|
44 |
+
hub_model_id: openaccess-ai-collective/kto-zephyr-deita-nectar-final
|
45 |
|
46 |
adapter: lora
|
47 |
lora_model_dir:
|
|
|
71 |
wandb_run_id:
|
72 |
wandb_name: kto-3ep-v3-r512-bsz16-lr2e-5-cosine
|
73 |
wandb_log_model:
|
74 |
+
wandb_disabled: true
|
75 |
|
76 |
gradient_accumulation_steps: 1
|
77 |
micro_batch_size: 4
|
|
|
102 |
eval_steps:
|
103 |
eval_table_size:
|
104 |
eval_table_max_new_tokens: 128
|
105 |
+
save_steps: 538
|
106 |
debug:
|
107 |
deepspeed:
|
108 |
weight_decay: 0.1
|
adapter_config.json
CHANGED
@@ -19,13 +19,13 @@
|
|
19 |
"rank_pattern": {},
|
20 |
"revision": null,
|
21 |
"target_modules": [
|
22 |
-
"
|
|
|
23 |
"v_proj",
|
24 |
-
"
|
25 |
-
"o_proj",
|
26 |
"down_proj",
|
27 |
-
"
|
28 |
-
"
|
29 |
],
|
30 |
"task_type": "CAUSAL_LM"
|
31 |
}
|
|
|
19 |
"rank_pattern": {},
|
20 |
"revision": null,
|
21 |
"target_modules": [
|
22 |
+
"q_proj",
|
23 |
+
"up_proj",
|
24 |
"v_proj",
|
25 |
+
"k_proj",
|
|
|
26 |
"down_proj",
|
27 |
+
"gate_proj",
|
28 |
+
"o_proj"
|
29 |
],
|
30 |
"task_type": "CAUSAL_LM"
|
31 |
}
|
adapter_model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 2684416656
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:732d21eeae0ee42bd4ad4a9aa804e58a6945cbed403308429d5d94817ce607b2
|
3 |
size 2684416656
|
model-00001-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4998883808
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e1674b9b4f0413adf06d88c4ac4aa2bf0751667544b51f7c8d4e08129ccace44
|
3 |
size 4998883808
|
model-00002-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4994690208
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5a6e388946c4bf74de56ad6b73d0c492f8820391403dcb26ce403fff6454a91f
|
3 |
size 4994690208
|
model-00003-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4943343656
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5ea97897f66d227a4795bc8845b4024d3dcfd4fb4351a826f2bc85f83cc9d8a0
|
3 |
size 4943343656
|
model-00004-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 2231527536
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f9f363cb120dacb47a00a295f5725d3266eec6e1edf05450ee1700d55ec388df
|
3 |
size 2231527536
|
runs/Jan17_12-57-58_b5637b3f66b9/events.out.tfevents.1705496304.b5637b3f66b9.192182.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a78a772f08288884adb7eb906bb1f7470953b766a4f1eace4560e97ba9883f7d
|
3 |
+
size 1027366
|
training_args.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4347
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:be67dbef5b3c10094536a0c6180766dc826b73e957941b276260a52f10b47b1b
|
3 |
size 4347
|