{ "q8": { "per_model_config": { "text_encoder": { "op_types": [ "Abs", "Add", "Cast", "Concat", "Constant", "ConstantOfShape", "Div", "Gather", "Greater", "Less", "Log", "MatMul", "Min", "Mul", "Pow", "Range", "ReduceMean", "Relu", "Reshape", "Shape", "Softmax", "Sqrt", "Sub", "Transpose", "Unsqueeze", "Where" ], "weight_type": "QInt8" }, "decoder_with_past_model": { "op_types": [ "Add", "Cast", "Concat", "Constant", "Div", "Erf", "Gather", "MatMul", "Mul", "Pow", "Range", "ReduceMean", "Reshape", "Shape", "Softmax", "Sqrt", "Sub", "Transpose", "Unsqueeze" ], "weight_type": "QInt8" }, "decoder_model": { "op_types": [ "Add", "Cast", "Concat", "Constant", "ConstantOfShape", "Div", "Equal", "Erf", "Expand", "Gather", "Less", "MatMul", "Mul", "Pow", "Range", "ReduceMean", "Reshape", "Shape", "Slice", "Softmax", "Sqrt", "Squeeze", "Sub", "Transpose", "Unsqueeze", "Where" ], "weight_type": "QInt8" }, "encodec_decode": { "op_types": [ "Add", "Cast", "Ceil", "Concat", "Constant", "ConstantOfShape", "Conv", "ConvTranspose", "Div", "Elu", "Gather", "LSTM", "Pad", "Reshape", "Shape", "Slice", "Split", "Squeeze", "Sub", "Transpose", "Unsqueeze" ], "weight_type": "QUInt8" }, "encodec_encoder": { "op_types": [ "Add", "ArgMax", "Cast", "Ceil", "Concat", "ConcatFromSequence", "Constant", "ConstantOfShape", "Conv", "Div", "Elu", "Equal", "Expand", "Gather", "Identity", "If", "LSTM", "LessOrEqual", "Loop", "MatMul", "Max", "Mul", "Neg", "Pad", "Pow", "ReduceL2", "ReduceMin", "ReduceSum", "Reshape", "ScatterND", "SequenceEmpty", "SequenceInsert", "Shape", "Slice", "Squeeze", "Sub", "Transpose", "Unsqueeze", "Where" ], "weight_type": "QUInt8" }, "decoder_model_merged": { "op_types": [ "Add", "Cast", "Concat", "Constant", "ConstantOfShape", "Div", "Equal", "Erf", "Expand", "Gather", "If", "Less", "MatMul", "Mul", "Pow", "Range", "ReduceMean", "Reshape", "Shape", "Slice", "Softmax", "Sqrt", "Squeeze", "Sub", "Transpose", "Unsqueeze", "Where" ], "weight_type": "QInt8" } }, "per_channel": false, "reduce_range": false } }