Chryslerx10's picture
Upload quantization_config.json with huggingface_hub
617f12f verified
raw
history blame
398 Bytes
{"quant_method": "bitsandbytes", "_load_in_8bit": true, "_load_in_4bit": false, "llm_int8_threshold": 6.0, "llm_int8_skip_modules": null, "llm_int8_enable_fp32_cpu_offload": false, "llm_int8_has_fp16_weight": false, "bnb_4bit_quant_type": "fp4", "bnb_4bit_use_double_quant": false, "bnb_4bit_compute_dtype": "float32", "bnb_4bit_quant_storage": "uint8", "load_in_4bit": false, "load_in_8bit": true}