Rahmat82 committed on
Commit
13a75f6
1 Parent(s): e180368

added quantization_config

Browse files
Files changed (1) hide show
  1. config.json +9 -0
config.json CHANGED
@@ -53,4 +53,13 @@
53
  "transformers_version": "4.16.2",
54
  "use_cache": true,
55
  "vocab_size": 96103
 
 
 
 
 
 
 
 
 
56
  }
 
53
  "transformers_version": "4.16.2",
54
  "use_cache": true,
55
  "vocab_size": 96103
56
+ },
57
+
58
+ "quantization_config": {
59
+ "quant_method": "awq",
60
+ "zero_point": true,
61
+ "group_size": 128,
62
+ "bits": 4,
63
+ "version": "gemm"
64
+ }
65
  }