chansung committed on
Commit
33e1318
1 Parent(s): 4671ebd

Training in progress, step 100

Browse files
adapter_config.json CHANGED
@@ -15,17 +15,17 @@
15
  "megatron_core": "megatron.core",
16
  "modules_to_save": null,
17
  "peft_type": "LORA",
18
- "r": 16,
19
  "rank_pattern": {},
20
  "revision": null,
21
  "target_modules": [
22
- "down_proj",
23
- "k_proj",
24
  "o_proj",
25
- "v_proj",
26
- "up_proj",
27
  "q_proj",
28
- "gate_proj"
 
29
  ],
30
  "task_type": "CAUSAL_LM"
31
  }
 
15
  "megatron_core": "megatron.core",
16
  "modules_to_save": null,
17
  "peft_type": "LORA",
18
+ "r": 32,
19
  "rank_pattern": {},
20
  "revision": null,
21
  "target_modules": [
22
+ "gate_proj",
 
23
  "o_proj",
24
+ "k_proj",
25
+ "down_proj",
26
  "q_proj",
27
+ "up_proj",
28
+ "v_proj"
29
  ],
30
  "task_type": "CAUSAL_LM"
31
  }
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5df096199927ddbdde200b1c71b8c291651dc6e208429f57711ce6ceef6530b2
3
- size 100060536
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d3f3e71a4da3a39a6cf7fdcb8dd60e4b87c3164ba403028d7d427b1b50a08331
3
+ size 200068904
runs/Apr11_22-49-38_deep-diver-main-rare-husky-1-0-0/events.out.tfevents.1712890281.deep-diver-main-rare-husky-1-0-0.520.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f9533a1e5b09043cf2b202b59d59cf89a93c9b47849c11735a807e0c6b99d65d
3
+ size 14482
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b8bd01b1aed0eccc61952c0117f4b0f1694e5f940bfc0eefb917e5f0275884f2
3
  size 5112
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5e40efaf1ad8aaee40eb10508cecfe994c7d5d8ef3fa5ed3a0c0e553833fe313
3
  size 5112