| { | |
| "one_external_file": true, | |
| "opset": null, | |
| "optimization": {}, | |
| "optimum_version": "1.16.1", | |
| "quantization": { | |
| "activations_dtype": "QUInt8", | |
| "activations_symmetric": false, | |
| "format": "QOperator", | |
| "is_static": false, | |
| "mode": "IntegerOps", | |
| "nodes_to_exclude": [], | |
| "nodes_to_quantize": [], | |
| "operators_to_quantize": [ | |
| "Conv", | |
| "MatMul", | |
| "Attention", | |
| "LSTM", | |
| "Gather", | |
| "Transpose", | |
| "EmbedLayerNormalization" | |
| ], | |
| "per_channel": false, | |
| "qdq_add_pair_to_weight": false, | |
| "qdq_dedicated_pair": false, | |
| "qdq_op_type_per_channel_support_to_axis": { | |
| "MatMul": 1 | |
| }, | |
| "reduce_range": false, | |
| "weights_dtype": "QInt8", | |
| "weights_symmetric": true | |
| }, | |
| "transformers_version": "4.30.0", | |
| "use_external_data_format": false | |
| } | |
