{
  "one_external_file": true,
  "opset": null,
  "optimization": {},
  "optimum_version": "1.18.0.dev0",
  "quantization": {
    "activations_dtype": "QInt8",
    "activations_symmetric": true,
    "format": "QDQ",
    "is_static": true,
    "mode": "QLinearOps",
    "nodes_to_exclude": [],
    "nodes_to_quantize": [],
    "operators_to_quantize": [
      "Conv",
      "ConvTranspose",
      "Gemm",
      "Clip",
      "Relu",
      "Reshape",
      "Transpose",
      "Squeeze",
      "Unsqueeze",
      "Resize",
      "MaxPool",
      "AveragePool",
      "MatMul",
      "Split",
      "Gather",
      "Where",
      "InstanceNormalization",
      "LayerNormalization"
    ],
    "per_channel": false,
    "qdq_add_pair_to_weight": true,
    "qdq_dedicated_pair": true,
    "qdq_op_type_per_channel_support_to_axis": {
      "MatMul": 1
    },
    "reduce_range": false,
    "weights_dtype": "QInt8",
    "weights_symmetric": true
  },
  "transformers_version": "4.39.0.dev0",
  "use_external_data_format": true
}