multilingual-e5-large-instruct / ort_config.json
yashvardhan7's picture
Upload 2 files
c6655d8 verified
raw
history blame
1.04 kB
{
"one_external_file": true,
"opset": null,
"optimization": {},
"optimum_version": "1.18.1",
"quantization": {
"activations_dtype": "QUInt8",
"activations_symmetric": false,
"format": "QDQ",
"is_static": true,
"mode": "QLinearOps",
"nodes_to_exclude": [],
"nodes_to_quantize": [],
"operators_to_quantize": [
"Conv",
"ConvTranspose",
"Gemm",
"Clip",
"Relu",
"Reshape",
"Transpose",
"Squeeze",
"Unsqueeze",
"Resize",
"MaxPool",
"AveragePool",
"MatMul",
"Split",
"Gather",
"Softmax",
"Where",
"InstanceNormalization",
"LayerNormalization"
],
"per_channel": false,
"qdq_add_pair_to_weight": false,
"qdq_dedicated_pair": false,
"qdq_op_type_per_channel_support_to_axis": {
"MatMul": 1
},
"reduce_range": false,
"weights_dtype": "QInt8",
"weights_symmetric": true
},
"transformers_version": "4.38.2",
"use_external_data_format": false
}