marcsun13 HF staff committed on
Commit
78e0628
1 Parent(s): c200ffa

compatibility with transformers integration of awq

Browse files
Files changed (1) hide show
  1. config.json +8 -1
config.json CHANGED
@@ -22,5 +22,12 @@
22
  "transformers_version": "4.32.0.dev0",
23
  "use_cache": true,
24
  "vocab_size": 32000,
25
- "pad_token_id": 0
 
 
 
 
 
 
 
26
  }
 
22
  "transformers_version": "4.32.0.dev0",
23
  "use_cache": true,
24
  "vocab_size": 32000,
25
+ "pad_token_id": 0,
26
+ "quantization_config": {
27
+ "quant_method": "awq",
28
+ "zero_point": true,
29
+ "q_group_size": 128,
30
+ "w_bit": 4,
31
+ "version": "GEMM"
32
+ }
33
  }