tanmoy-in committed on
Commit
9ef4831
1 Parent(s): 5d117e0

End of training

Browse files
README.md CHANGED
@@ -6,6 +6,7 @@ tags:
6
  model-index:
7
  - name: opt-350m_bn
8
  results: []
 
9
  ---
10
 
11
  <!-- This model card has been generated automatically according to the information the Trainer had access to. You
@@ -29,6 +30,17 @@ More information needed
29
 
30
  ## Training procedure
31
 
 
 
 
 
 
 
 
 
 
 
 
32
  ### Training hyperparameters
33
 
34
  The following hyperparameters were used during training:
@@ -49,6 +61,7 @@ The following hyperparameters were used during training:
49
 
50
  ### Framework versions
51
 
 
52
  - Transformers 4.32.0.dev0
53
  - Pytorch 2.0.1+cu118
54
  - Datasets 2.14.2
 
6
  model-index:
7
  - name: opt-350m_bn
8
  results: []
9
+ library_name: peft
10
  ---
11
 
12
  <!-- This model card has been generated automatically according to the information the Trainer had access to. You
 
30
 
31
  ## Training procedure
32
 
33
+
34
+ The following `bitsandbytes` quantization config was used during training:
35
+ - load_in_8bit: False
36
+ - load_in_4bit: True
37
+ - llm_int8_threshold: 6.0
38
+ - llm_int8_skip_modules: None
39
+ - llm_int8_enable_fp32_cpu_offload: False
40
+ - llm_int8_has_fp16_weight: False
41
+ - bnb_4bit_quant_type: nf4
42
+ - bnb_4bit_use_double_quant: True
43
+ - bnb_4bit_compute_dtype: bfloat16
44
  ### Training hyperparameters
45
 
46
  The following hyperparameters were used during training:
 
61
 
62
  ### Framework versions
63
 
64
+ - PEFT 0.5.0.dev0
65
  - Transformers 4.32.0.dev0
66
  - Pytorch 2.0.1+cu118
67
  - Datasets 2.14.2
adapter_config.json CHANGED
@@ -15,7 +15,11 @@
15
  "revision": null,
16
  "target_modules": [
17
  "k_proj",
18
- "v_proj"
 
 
 
 
19
  ],
20
  "task_type": "CAUSAL_LM"
21
  }
 
15
  "revision": null,
16
  "target_modules": [
17
  "k_proj",
18
+ "v_proj",
19
+ "q_proj",
20
+ "out_proj",
21
+ "fc1",
22
+ "fc2"
23
  ],
24
  "task_type": "CAUSAL_LM"
25
  }
adapter_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d412b0d72e6a70690ee3fed3154f4fc6d33316fd0adc637c54fc766f12b39551
3
- size 3180689
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:64ef366d4d230e77bb5b94082145d62968fd3e112cfc0184b430dd58ff0bee36
3
+ size 14260493
runs/Aug02_17-38-46_b282177827ba/events.out.tfevents.1690997929.b282177827ba.5153.3 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9803df683dd501f1233df9ea5b9c5624c9d2827213b3f4cbe4b5b7d60a80cbe5
3
+ size 5638
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:025f62ea332d9ec034ad4586e0372a4a0fe24e8db9e983bd775194db1763c29b
3
  size 3963
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:88c8560915f276db6070650b43ca82be3c68de10be316832ee1c18ced74bcd01
3
  size 3963