Fix the vLLM "deepspeedfp" quantization config not found issue (add quant_config.json)

#9
Files changed (1) hide show
  1. quant_config.json +6 -0
quant_config.json ADDED
@@ -0,0 +1,6 @@
 
 
 
 
 
 
 
1
+ {
2
+ "bits": 8,
3
+ "rounding": "nearest",
4
+ "mantissa_bits": 3,
5
+ "group_size": 512
6
+ }