wyseow committed on
Commit
be280a1
1 Parent(s): 650741b

Change to 4-bit quantization config

Browse files
Files changed (1) hide show
  1. config.json +5 -5
config.json CHANGED
@@ -106,15 +106,15 @@
106
  "pad2square": false,
107
  "ps_version": "v2",
108
  "quantization_config": {
109
- "bnb_4bit_compute_dtype": "float32",
110
- "bnb_4bit_quant_type": "fp4",
111
- "bnb_4bit_use_double_quant": false,
112
  "llm_int8_enable_fp32_cpu_offload": true,
113
  "llm_int8_has_fp16_weight": false,
114
  "llm_int8_skip_modules": null,
115
  "llm_int8_threshold": 6.0,
116
- "load_in_4bit": false,
117
- "load_in_8bit": true,
118
  "quant_method": "bitsandbytes"
119
  },
120
  "select_layer": -1,
 
106
  "pad2square": false,
107
  "ps_version": "v2",
108
  "quantization_config": {
109
+ "bnb_4bit_compute_dtype": "bfloat16",
110
+ "bnb_4bit_quant_type": "nf4",
111
+ "bnb_4bit_use_double_quant": true,
112
  "llm_int8_enable_fp32_cpu_offload": true,
113
  "llm_int8_has_fp16_weight": false,
114
  "llm_int8_skip_modules": null,
115
  "llm_int8_threshold": 6.0,
116
+ "load_in_4bit": true,
117
+ "load_in_8bit": false,
118
  "quant_method": "bitsandbytes"
119
  },
120
  "select_layer": -1,