chatglm3-6b-openvino-int4 / openvino_config.json
EntropyGenerator's picture
Add model files
e9e0260
raw
history blame
450 Bytes
{
"compression": null,
"dtype": "int4",
"input_info": null,
"optimum_version": "1.20.0",
"quantization_config": {
"all_layers": null,
"bits": 4,
"dataset": null,
"group_size": 128,
"ignored_scope": null,
"num_samples": null,
"quant_method": "default",
"ratio": 0.8,
"sensitivity_metric": null,
"sym": false,
"tokenizer": null
},
"save_onnx_model": false,
"transformers_version": "4.41.2"
}