TheBloke committed on
Commit
dcb46d7
1 Parent(s): 563e88c

Update for Transformers AWQ support

Browse files
Files changed (1) hide show
  1. config.json +9 -2
config.json CHANGED
@@ -34,5 +34,12 @@
34
  "torch_dtype": "float16",
35
  "transformers_version": "4.35.0",
36
  "use_cache": true,
37
- "vocab_size": 32000
38
- }
 
 
 
 
 
 
 
 
34
  "torch_dtype": "float16",
35
  "transformers_version": "4.35.0",
36
  "use_cache": true,
37
+ "vocab_size": 32000,
38
+ "quantization_config": {
39
+ "quant_method": "awq",
40
+ "zero_point": true,
41
+ "group_size": 128,
42
+ "bits": 4,
43
+ "version": "gemm"
44
+ }
45
+ }