nm-research committed on
Commit
553a419
1 Parent(s): ee09ad0

Upload folder using huggingface_hub

Browse files
Files changed (2) hide show
  1. generation_config.json +14 -0
  2. recipe.yaml +12 -0
generation_config.json ADDED
@@ -0,0 +1,14 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "bos_token_id": 151643,
3
+ "do_sample": true,
4
+ "eos_token_id": [
5
+ 151645,
6
+ 151643
7
+ ],
8
+ "pad_token_id": 151643,
9
+ "repetition_penalty": 1.05,
10
+ "temperature": 0.7,
11
+ "top_k": 20,
12
+ "top_p": 0.8,
13
+ "transformers_version": "4.45.1"
14
+ }
recipe.yaml ADDED
@@ -0,0 +1,12 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ quant_stage:
2
+ quant_modifiers:
3
+ GPTQModifier:
4
+ sequential_update: true
5
+ dampening_frac: 0.1
6
+ ignore: [lm_head]
7
+ config_groups:
8
+ group_0:
9
+ weights: {num_bits: 4, type: int, symmetric: true, strategy: group, group_size: 128,
10
+ actorder: group}
11
+ targets: [Linear]
12
+ observer: mse