TheBloke committed on
Commit
b01589c
1 Parent(s): b4306cd

Update for Transformers AWQ support

Browse files
Files changed (1) hide show
  1. config.json +9 -2
config.json CHANGED
@@ -40,5 +40,12 @@
40
  "unfreeze_mm_vision_tower": false,
41
  "use_cache": true,
42
  "use_mm_proj": true,
43
- "vocab_size": 32000
44
- }
 
 
 
 
 
 
 
 
40
  "unfreeze_mm_vision_tower": false,
41
  "use_cache": true,
42
  "use_mm_proj": true,
43
+ "vocab_size": 32000,
44
+ "quantization_config": {
45
+ "quant_method": "awq",
46
+ "zero_point": true,
47
+ "group_size": 128,
48
+ "bits": 4,
49
+ "version": "gemm"
50
+ }
51
+ }