{ "per_channel": false, "reduce_range": false, "per_model_config": { "decoder_model": { "op_types": [ "Reshape", "Unsqueeze", "Pow", "Where", "Split", "Sqrt", "Squeeze", "Slice", "Softmax", "Gather", "Shape", "ConstantOfShape", "Add", "Tanh", "ReduceMean", "Cast", "Mul", "Div", "Sub", "Range", "Transpose", "Concat", "Gemm", "Constant", "MatMul" ], "weight_type": "QInt8" }, "decoder_with_past_model": { "op_types": [ "Reshape", "Unsqueeze", "Pow", "Where", "Split", "Sqrt", "Squeeze", "Slice", "Softmax", "Gather", "Shape", "ConstantOfShape", "Add", "Tanh", "ReduceMean", "Cast", "Mul", "Div", "Sub", "Range", "Transpose", "Concat", "Gemm", "Constant", "MatMul" ], "weight_type": "QInt8" }, "decoder_model_merged": { "op_types": [ "Reshape", "Unsqueeze", "Pow", "Where", "Split", "Sqrt", "Squeeze", "Slice", "Softmax", "Gather", "Shape", "ConstantOfShape", "Add", "Tanh", "ReduceMean", "Cast", "Mul", "Div", "Sub", "Range", "Transpose", "Concat", "Gemm", "Constant", "MatMul", "If" ], "weight_type": "QInt8" } } }