AlanRobotics committed on
Commit
c22867e
1 Parent(s): 5636ffe

Create quant_config.json

Browse files
Files changed (1) hide show
  1. quant_config.json +13 -0
quant_config.json ADDED
@@ -0,0 +1,13 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "backend": "autoawq",
3
+ "bits": 4,
4
+ "do_fuse": false,
5
+ "exllama_config": null,
6
+ "fuse_max_seq_len": null,
7
+ "group_size": 128,
8
+ "modules_to_fuse": null,
9
+ "modules_to_not_convert": null,
10
+ "quant_method": "awq",
11
+ "version": "gemm",
12
+ "zero_point": true
13
+ }