{
  "compression": {
    "algorithm": "quantization",
    "export_to_onnx_standard_ops": false,
    "ignored_scopes": [
      "{re}.*Embedding.*",
      "{re}.*add___.*",
      "{re}.*layer_norm_.*",
      "{re}.*matmul_1",
      "{re}.*__truediv__.*"
    ],
    "initializer": {
      "batchnorm_adaptation": {
        "num_bn_adaptation_samples": 0
      },
      "range": {
        "num_init_samples": 300,
        "type": "mean_min_max"
      }
    },
    "overflow_fix": "disable",
    "preset": "mixed",
    "scope_overrides": {
      "activations": {
        "{re}.*matmul_0": {
          "mode": "symmetric"
        }
      }
    }
  },
  "input_info": null,
  "optimum_version": "1.10.0",
  "save_onnx_model": false,
  "transformers_version": "4.32.0.dev0"
}