fkjsdahfjkasf committed on
Commit
570866e
1 Parent(s): c430af6

fkjsdahfjkasf/sft-Llama-3-8B

Browse files
adapter_config.json CHANGED
@@ -15,21 +15,21 @@
15
  "megatron_config": null,
16
  "megatron_core": "megatron.core",
17
  "modules_to_save": [
18
- "embed_tokens",
19
- "lm_head"
20
  ],
21
  "peft_type": "LORA",
22
  "r": 16,
23
  "rank_pattern": {},
24
  "revision": "unsloth",
25
  "target_modules": [
 
26
  "k_proj",
 
27
  "gate_proj",
28
  "up_proj",
29
- "q_proj",
30
- "o_proj",
31
- "down_proj",
32
- "v_proj"
33
  ],
34
  "task_type": "CAUSAL_LM",
35
  "use_dora": false,
 
15
  "megatron_config": null,
16
  "megatron_core": "megatron.core",
17
  "modules_to_save": [
18
+ "lm_head",
19
+ "embed_tokens"
20
  ],
21
  "peft_type": "LORA",
22
  "r": 16,
23
  "rank_pattern": {},
24
  "revision": "unsloth",
25
  "target_modules": [
26
+ "q_proj",
27
  "k_proj",
28
+ "down_proj",
29
  "gate_proj",
30
  "up_proj",
31
+ "v_proj",
32
+ "o_proj"
 
 
33
  ],
34
  "task_type": "CAUSAL_LM",
35
  "use_dora": false,
runs/Jun10_00-44-06_150-136-147-171/events.out.tfevents.1717980250.150-136-147-171.16227.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c520a46f378e743a2533c57929b7b8088bfdfd3bb069f6c5606827622e6ab1a8
3
+ size 5723
trainer_state.json CHANGED
@@ -14,8 +14,8 @@
14
  "step": 1,
15
  "total_flos": 6348239762620416.0,
16
  "train_loss": 2.5150043964385986,
17
- "train_runtime": 45.5008,
18
- "train_samples_per_second": 0.352,
19
  "train_steps_per_second": 0.022
20
  }
21
  ],
 
14
  "step": 1,
15
  "total_flos": 6348239762620416.0,
16
  "train_loss": 2.5150043964385986,
17
+ "train_runtime": 45.5311,
18
+ "train_samples_per_second": 0.351,
19
  "train_steps_per_second": 0.022
20
  }
21
  ],
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0e3ad79e0fa9bae84cea9f2ff76b21e0fd174a4b7ab94d8ed5bbcaff2563d4ee
3
  size 5112
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:68234b6943b94c1487c8251f3f9a6e3ede15155d223d03798197eaf89641b76c
3
  size 5112