{ "per_channel": true, "reduce_range": false, "use_external_data_format": true, "q_group_size": 128, "per_model_config": { "decoder_model_merged": { "op_types": [ "Constant", "Add", "Max", "ConstantOfShape", "Cast", "Gather", "Softmax", "Unsqueeze", "Expand", "Where", "Squeeze", "CumSum", "If", "Shape", "Reshape", "Equal", "Less", "Sub", "Transpose", "MatMul", "Mul", "Slice", "Range", "Pow", "Gemm", "Concat", "Sqrt", "Relu", "ReduceMean", "Div" ], "weight_type": "QInt8" } } }