winglian committed on
Commit
5a7d172
1 Parent(s): 970a1e0

End of training

Browse files
README.md CHANGED
@@ -41,7 +41,7 @@ dataset_prepared_path: last_run_prepared
41
  val_set_size: 0.0
42
  output_dir: ./zephyr-deita-kto-3ep-v3-r512-bsz16-cosine
43
  save_total_limit: 3
44
- hub_model_id: openaccess-ai-collective/kto-zephyr-deita-nectar
45
 
46
  adapter: lora
47
  lora_model_dir:
@@ -71,6 +71,7 @@ wandb_watch:
71
  wandb_run_id:
72
  wandb_name: kto-3ep-v3-r512-bsz16-lr2e-5-cosine
73
  wandb_log_model:
 
74
 
75
  gradient_accumulation_steps: 1
76
  micro_batch_size: 4
@@ -101,7 +102,7 @@ warmup_steps: 10
101
  eval_steps:
102
  eval_table_size:
103
  eval_table_max_new_tokens: 128
104
- save_steps: 45
105
  debug:
106
  deepspeed:
107
  weight_decay: 0.1
 
41
  val_set_size: 0.0
42
  output_dir: ./zephyr-deita-kto-3ep-v3-r512-bsz16-cosine
43
  save_total_limit: 3
44
+ hub_model_id: openaccess-ai-collective/kto-zephyr-deita-nectar-final
45
 
46
  adapter: lora
47
  lora_model_dir:
 
71
  wandb_run_id:
72
  wandb_name: kto-3ep-v3-r512-bsz16-lr2e-5-cosine
73
  wandb_log_model:
74
+ wandb_disabled: true
75
 
76
  gradient_accumulation_steps: 1
77
  micro_batch_size: 4
 
102
  eval_steps:
103
  eval_table_size:
104
  eval_table_max_new_tokens: 128
105
+ save_steps: 538
106
  debug:
107
  deepspeed:
108
  weight_decay: 0.1
adapter_config.json CHANGED
@@ -19,13 +19,13 @@
19
  "rank_pattern": {},
20
  "revision": null,
21
  "target_modules": [
22
- "k_proj",
 
23
  "v_proj",
24
- "gate_proj",
25
- "o_proj",
26
  "down_proj",
27
- "up_proj",
28
- "q_proj"
29
  ],
30
  "task_type": "CAUSAL_LM"
31
  }
 
19
  "rank_pattern": {},
20
  "revision": null,
21
  "target_modules": [
22
+ "q_proj",
23
+ "up_proj",
24
  "v_proj",
25
+ "k_proj",
 
26
  "down_proj",
27
+ "gate_proj",
28
+ "o_proj"
29
  ],
30
  "task_type": "CAUSAL_LM"
31
  }
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ec4f8cf2b6a4204853a331e473f23e8d26041b30fa0d2f9c11cfdc59e9d21f3e
3
  size 2684416656
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:732d21eeae0ee42bd4ad4a9aa804e58a6945cbed403308429d5d94817ce607b2
3
  size 2684416656
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:147669fa0462cd395aa92ff8b9f22509f2b014efcdcda45d18659d4664983b06
3
  size 4998883808
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e1674b9b4f0413adf06d88c4ac4aa2bf0751667544b51f7c8d4e08129ccace44
3
  size 4998883808
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:343046f9a27124fe51eacf8f8be4d29959555983d1641b623eab92e0ba71f1d4
3
  size 4994690208
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5a6e388946c4bf74de56ad6b73d0c492f8820391403dcb26ce403fff6454a91f
3
  size 4994690208
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7b2520dd1820a88d7ae2691983034daeda484a2ec3dfbe2cae9cd893f404067e
3
  size 4943343656
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5ea97897f66d227a4795bc8845b4024d3dcfd4fb4351a826f2bc85f83cc9d8a0
3
  size 4943343656
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b5b59355c8f33b3e51d4d95a4dfa7b0bc831740b3b7256d6354b631d00959a6c
3
  size 2231527536
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f9f363cb120dacb47a00a295f5725d3266eec6e1edf05450ee1700d55ec388df
3
  size 2231527536
runs/Jan17_12-57-58_b5637b3f66b9/events.out.tfevents.1705496304.b5637b3f66b9.192182.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a78a772f08288884adb7eb906bb1f7470953b766a4f1eace4560e97ba9883f7d
3
+ size 1027366
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0ec29747464712a616140f12ef0e55613e49edeb538160f5067ba009a2034e2d
3
  size 4347
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:be67dbef5b3c10094536a0c6180766dc826b73e957941b276260a52f10b47b1b
3
  size 4347