{ "one_external_file": true, "opset": null, "optimization": {}, "optimum_version": "1.18.0.dev0", "quantization": { "activations_dtype": "QInt8", "activations_symmetric": true, "format": "QDQ", "is_static": true, "mode": "QLinearOps", "nodes_to_exclude": [], "nodes_to_quantize": [], "operators_to_quantize": [ "Conv", "ConvTranspose", "Gemm", "Clip", "Relu", "Reshape", "Transpose", "Squeeze", "Unsqueeze", "Resize", "MaxPool", "AveragePool", "MatMul", "Split", "Gather", "Where", "InstanceNormalization", "LayerNormalization" ], "per_channel": false, "qdq_add_pair_to_weight": true, "qdq_dedicated_pair": true, "qdq_op_type_per_channel_support_to_axis": { "MatMul": 1 }, "reduce_range": false, "weights_dtype": "QInt8", "weights_symmetric": true }, "transformers_version": "4.39.0.dev0", "use_external_data_format": true }