aisuko committed on
Commit
e3c3825
1 Parent(s): 8b63d76

End of training

Browse files
README.md CHANGED
@@ -35,15 +35,16 @@ More information needed
35
 
36
  The following hyperparameters were used during training:
37
  - learning_rate: 0.0002
38
- - train_batch_size: 4
39
  - eval_batch_size: 8
40
  - seed: 42
41
- - gradient_accumulation_steps: 4
42
- - total_train_batch_size: 16
43
  - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
44
  - lr_scheduler_type: linear
45
  - lr_scheduler_warmup_ratio: 0.3
46
- - num_epochs: 1
 
47
 
48
  ### Training results
49
 
 
35
 
36
  The following hyperparameters were used during training:
37
  - learning_rate: 0.0002
38
+ - train_batch_size: 2
39
  - eval_batch_size: 8
40
  - seed: 42
41
+ - gradient_accumulation_steps: 6
42
+ - total_train_batch_size: 12
43
  - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
44
  - lr_scheduler_type: linear
45
  - lr_scheduler_warmup_ratio: 0.3
46
+ - num_epochs: 0.5
47
+ - mixed_precision_training: Native AMP
48
 
49
  ### Training results
50
 
adapter_config.json CHANGED
@@ -19,12 +19,12 @@
19
  "rank_pattern": {},
20
  "revision": null,
21
  "target_modules": [
22
- "v_proj",
23
- "up_proj",
24
- "q_proj",
25
  "k_proj",
 
26
  "gate_proj",
27
- "o_proj"
 
 
28
  ],
29
  "task_type": "CAUSAL_LM"
30
  }
 
19
  "rank_pattern": {},
20
  "revision": null,
21
  "target_modules": [
 
 
 
22
  "k_proj",
23
+ "o_proj",
24
  "gate_proj",
25
+ "v_proj",
26
+ "up_proj",
27
+ "q_proj"
28
  ],
29
  "task_type": "CAUSAL_LM"
30
  }
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:df7b1734a2911736486068fcdd5e37c778ddc8cc2fe7c22c41206e2e0c3b8156
3
  size 32294376
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d9746eed984a839f3ddc00dcd0ee2bfce72abb6a4d0b758836c2173f569d1d21
3
  size 32294376
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f38b3629f392e31c7e03e3c2ef99e18d01de05a9525e160b1db4a8390c667150
3
- size 4283
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b8a39c5a3204a96f81eb104a00060bcae8ec777318c46103c7a86ae7111fdbad
3
+ size 4347