{ "compression": { "algorithm": "quantization", "export_to_onnx_standard_ops": false, "ignored_scopes": [ "{re}.*Embedding.*", "{re}.*add___.*", "{re}.*layer_norm_.*", "{re}.*matmul_1", "{re}.*__truediv__.*" ], "initializer": { "batchnorm_adaptation": { "num_bn_adaptation_samples": 0 }, "range": { "num_init_samples": 300, "type": "mean_min_max" } }, "overflow_fix": "enable", "preset": "mixed", "scope_overrides": { "activations": { "{re}.*matmul_0": { "mode": "symmetric" } } } }, "input_info": [ { "keyword": "input_ids", "sample_size": [ 1, 177 ], "type": "long" }, { "keyword": "token_type_ids", "sample_size": [ 1, 177 ], "type": "long" }, { "keyword": "attention_mask", "sample_size": [ 1, 177 ], "type": "long" } ], "optimum_version": "1.14.1", "save_onnx_model": false, "transformers_version": "4.35.2" }