lucas0 committed on
Commit
824685b
1 Parent(s): c46421e

End of training

Browse files
Files changed (4) hide show
  1. README.md +13 -0
  2. adapter_config.json +2 -2
  3. adapter_model.bin +2 -2
  4. training_args.bin +1 -1
README.md CHANGED
@@ -6,6 +6,7 @@ tags:
6
  model-index:
7
  - name: empath-falcon-40b
8
  results: []
 
9
  ---
10
 
11
  <!-- This model card has been generated automatically according to the information the Trainer had access to. You
@@ -29,6 +30,17 @@ More information needed
29
 
30
  ## Training procedure
31
 
 
 
 
 
 
 
 
 
 
 
 
32
  ### Training hyperparameters
33
 
34
  The following hyperparameters were used during training:
@@ -49,6 +61,7 @@ The following hyperparameters were used during training:
49
 
50
  ### Framework versions
51
 
 
52
  - Transformers 4.32.0.dev0
53
  - Pytorch 2.0.1+cu117
54
  - Datasets 2.13.1
 
6
  model-index:
7
  - name: empath-falcon-40b
8
  results: []
9
+ library_name: peft
10
  ---
11
 
12
  <!-- This model card has been generated automatically according to the information the Trainer had access to. You
 
30
 
31
  ## Training procedure
32
 
33
+
34
+ The following `bitsandbytes` quantization config was used during training:
35
+ - load_in_8bit: False
36
+ - load_in_4bit: True
37
+ - llm_int8_threshold: 6.0
38
+ - llm_int8_skip_modules: None
39
+ - llm_int8_enable_fp32_cpu_offload: False
40
+ - llm_int8_has_fp16_weight: False
41
+ - bnb_4bit_quant_type: nf4
42
+ - bnb_4bit_use_double_quant: True
43
+ - bnb_4bit_compute_dtype: bfloat16
44
  ### Training hyperparameters
45
 
46
  The following hyperparameters were used during training:
 
61
 
62
  ### Framework versions
63
 
64
+ - PEFT 0.5.0.dev0
65
  - Transformers 4.32.0.dev0
66
  - Pytorch 2.0.1+cu117
67
  - Datasets 2.13.1
adapter_config.json CHANGED
@@ -7,11 +7,11 @@
7
  "init_lora_weights": true,
8
  "layers_pattern": null,
9
  "layers_to_transform": null,
10
- "lora_alpha": 32,
11
  "lora_dropout": 0.05,
12
  "modules_to_save": null,
13
  "peft_type": "LORA",
14
- "r": 16,
15
  "revision": null,
16
  "target_modules": [
17
  "query_key_value"
 
7
  "init_lora_weights": true,
8
  "layers_pattern": null,
9
  "layers_to_transform": null,
10
+ "lora_alpha": 16,
11
  "lora_dropout": 0.05,
12
  "modules_to_save": null,
13
  "peft_type": "LORA",
14
+ "r": 8,
15
  "revision": null,
16
  "target_modules": [
17
  "query_key_value"
adapter_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2cbc9f3b68b90f08988808b6f7ed038cfba0eed2f3bd2abbb7e99bfd3fab4633
3
- size 66891693
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:93fe090362ff55ab24beb1a0fdd2e430ab5191d4c3cb46716b2db91d12534475
3
+ size 33468333
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6274ce8cc7e2847f81a0e8d0e8e908a410ff83b628bc5a3ac1a00967ccc02e2b
3
  size 3963
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:316f9aa3c48e0068defab81ada070b2c4226de86bd2899e099977f0f6bce174d
3
  size 3963