BobaZooba committed on
Commit
0abb464
1 Parent(s): a82b5b5

Training in progress, step 50

Browse files
adapter_config.json CHANGED
@@ -16,11 +16,11 @@
16
  "rank_pattern": {},
17
  "revision": null,
18
  "target_modules": [
19
- "v_proj",
20
- "up_proj",
21
  "o_proj",
22
- "q_proj",
23
  "k_proj",
 
 
 
24
  "down_proj",
25
  "gate_proj"
26
  ],
 
16
  "rank_pattern": {},
17
  "revision": null,
18
  "target_modules": [
 
 
19
  "o_proj",
 
20
  "k_proj",
21
+ "up_proj",
22
+ "v_proj",
23
+ "q_proj",
24
  "down_proj",
25
  "gate_proj"
26
  ],
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8e96bea56ea6f3915bfe03b9e3656bd65c93a3ea97b18a5775dc5f0e84d2faa4
3
  size 42002136
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c1d26ae4d91ee5406ecdb04754fcb794c49fdbf6bbb41861d8558309f1105dad
3
  size 42002136
runs/Dec06_11-57-16_18bca800423a/events.out.tfevents.1701864004.18bca800423a.4241.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:00992b7756e3cc228180c6072d14a88bb7a02bd5c6454c89dd3c9d65eab8504a
3
+ size 13546
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0aca71db67798b119d2c3693b55cd6a103898a7e935aaf7759e9079b3f6bc999
3
- size 6264
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e3b4ec3761ef4757a95a527eb558426cc30befdddfb2e65ccd9b15755214e1aa
3
+ size 6328
training_config.json CHANGED
@@ -9,7 +9,9 @@
9
  "force_fp16": false,
10
  "from_gptq": false,
11
  "huggingface_hub_token": null,
12
- "deepspeed_stage": 2,
 
 
13
  "deepspeed_config_path": null,
14
  "fsdp_strategy": "",
15
  "fsdp_offload": true,
@@ -76,13 +78,14 @@
76
  "weight_decay": 0.001,
77
  "label_smoothing_factor": 0.0,
78
  "logging_steps": 1,
79
- "save_steps": 25,
80
  "save_total_limit": 1,
81
  "optim": "paged_adamw_8bit",
82
  "push_to_hub": true,
83
  "hub_model_id": "BobaZooba/AntModel-7B-XLLM-Demo-LoRA",
84
  "hub_private_repo": false,
85
  "neftune_noise_alpha": null,
 
86
  "report_to_wandb": false,
87
  "wandb_api_key": null,
88
  "wandb_project": null,
 
9
  "force_fp16": false,
10
  "from_gptq": false,
11
  "huggingface_hub_token": null,
12
+ "single_gpu": true,
13
+ "master_port": 9994,
14
+ "deepspeed_stage": "stage_2",
15
  "deepspeed_config_path": null,
16
  "fsdp_strategy": "",
17
  "fsdp_offload": true,
 
78
  "weight_decay": 0.001,
79
  "label_smoothing_factor": 0.0,
80
  "logging_steps": 1,
81
+ "save_steps": 50,
82
  "save_total_limit": 1,
83
  "optim": "paged_adamw_8bit",
84
  "push_to_hub": true,
85
  "hub_model_id": "BobaZooba/AntModel-7B-XLLM-Demo-LoRA",
86
  "hub_private_repo": false,
87
  "neftune_noise_alpha": null,
88
+ "project_name": null,
89
  "report_to_wandb": false,
90
  "wandb_api_key": null,
91
  "wandb_project": null,