01-Yi-6B-channel-mix-bpw-3.0 / quant_strategy.json
NicoNico6
update
b6b4d8f
{
"measurement": {
"model.layers.0": {
"accuracy": 0.9379796981811523,
"total_bits": 372683808,
"q_proj": {
"group_size": {
"4": 128,
"2": 128
},
"bits": [
4,
2
],
"bits_prop": [
0.05,
0.95
],
"scale_bits": 4
},
"k_proj": {
"group_size": {
"4": 128,
"2": 128
},
"bits": [
4,
2
],
"bits_prop": [
0.05,
0.95
],
"scale_bits": 4
},
"v_proj": {
"group_size": {
"4": 128,
"2": 128
},
"bits": [
4,
2
],
"bits_prop": [
0.05,
0.95
],
"scale_bits": 4
},
"o_proj": {
"group_size": {
"4": 128,
"2": 128
},
"bits": [
4,
2
],
"bits_prop": [
0.05,
0.95
],
"scale_bits": 4
},
"up_proj": {
"group_size": {
"4": 128,
"2": 128
},
"bits": [
4,
2
],
"bits_prop": [
0.05,
0.95
],
"scale_bits": 4
},
"gate_proj": {
"group_size": {
"4": 128,
"2": 128
},
"bits": [
4,
2
],
"bits_prop": [
0.05,
0.95
],
"scale_bits": 4
},
"down_proj": {
"group_size": {
"4": 128,
"2": 128
},
"bits": [
4,
2
],
"bits_prop": [
0.05,
0.95
],
"scale_bits": 4
}
},
"model.layers.1": {
"accuracy": 0.940488338470459,
"total_bits": 402699296,
"q_proj": {
"group_size": {
"4": 128,
"2": 128
},
"bits": [
4,
2
],
"bits_prop": [
0.1,
0.9
],
"scale_bits": 4
},
"k_proj": {
"group_size": {
"4": 128,
"2": 128
},
"bits": [
4,
2
],
"bits_prop": [
0.1,
0.9
],
"scale_bits": 4
},
"v_proj": {
"group_size": {
"4": 128,
"2": 128
},
"bits": [
4,
2
],
"bits_prop": [
0.2,
0.8
],
"scale_bits": 4
},
"o_proj": {
"group_size": {
"4": 128,
"2": 128
},
"bits": [
4,
2
],
"bits_prop": [
0.1,
0.9
],
"scale_bits": 4
},
"up_proj": {
"group_size": {
"4": 128,
"2": 128
},
"bits": [
4,
2
],
"bits_prop": [
0.1,
0.9
],
"scale_bits": 4
},
"gate_proj": {
"group_size": {
"4": 128,
"2": 128
},
"bits": [
4,
2
],
"bits_prop": [
0.1,
0.9
],
"scale_bits": 4
},
"down_proj": {
"group_size": {
"4": 128,
"2": 128
},
"bits": [
4,
2
],
"bits_prop": [
0.2,
0.8
],
"scale_bits": 4
}
},
"model.layers.2": {
"accuracy": 0.9580041170120239,
"total_bits": 634565664,
"q_proj": {
"group_size": {
"4": 128,
"2": 128
},
"bits": [
4,
2
],
"bits_prop": [
0.75,
0.25
],
"scale_bits": 4
},
"k_proj": {
"group_size": {
"4": 128,
"2": 128
},
"bits": [
4,
2
],
"bits_prop": [
0.75,
0.25
],
"scale_bits": 4
},
"v_proj": {
"group_size": {
"4": 128
},
"bits": [
4
],
"bits_prop": [
1.0
],
"scale_bits": 4
},
"o_proj": {
"group_size": {
"4": 128,
"2": 128
},
"bits": [
4,
2
],
"bits_prop": [
0.75,
0.25
],
"scale_bits": 4
},
"up_proj": {
"group_size": {
"4": 128,
"2": 128
},
"bits": [
4,
2
],
"bits_prop": [
0.75,
0.25
],
"scale_bits": 4
},
"gate_proj": {
"group_size": {
"4": 128,
"2": 128
},
"bits": [
4,
2
],
"bits_prop": [
0.75,
0.25
],
"scale_bits": 4
},
"down_proj": {
"group_size": {
"4": 128
},
"bits": [
4
],
"bits_prop": [
1.0
],
"scale_bits": 4
}
},
"model.layers.3": {
"accuracy": 0.9445068836212158,
"total_bits": 571651104,
"q_proj": {
"group_size": {
"4": 128,
"2": 128
},
"bits": [
4,
2
],
"bits_prop": [
0.5,
0.5
],
"scale_bits": 4
},
"k_proj": {
"group_size": {
"4": 128,
"2": 128
},
"bits": [
4,
2
],
"bits_prop": [
0.5,
0.5
],
"scale_bits": 4
},
"v_proj": {
"group_size": {
"4": 128
},
"bits": [
4
],
"bits_prop": [
1.0
],
"scale_bits": 4
},
"o_proj": {
"group_size": {
"4": 128,
"2": 128
},
"bits": [
4,
2
],
"bits_prop": [
0.5,
0.5
],
"scale_bits": 4
},
"up_proj": {
"group_size": {
"4": 128,
"2": 128
},
"bits": [
4,
2
],
"bits_prop": [
0.5,
0.5
],
"scale_bits": 4
},
"gate_proj": {
"group_size": {
"4": 128,
"2": 128
},
"bits": [
4,
2
],
"bits_prop": [
0.5,
0.5
],
"scale_bits": 4
},
"down_proj": {
"group_size": {
"4": 128
},
"bits": [
4
],
"bits_prop": [
1.0
],
"scale_bits": 4
}
},
"model.layers.4": {
"accuracy": 0.9742113351821899,
"total_bits": 697480224,
"q_proj": {
"group_size": {
"4": 128
},
"bits": [
4
],
"bits_prop": [
1
],
"scale_bits": 4
},
"k_proj": {
"group_size": {
"4": 128
},
"bits": [
4
],
"bits_prop": [
1
],
"scale_bits": 4
},
"v_proj": {
"group_size": {
"4": 128
},
"bits": [
4
],
"bits_prop": [
1
],
"scale_bits": 4
},
"o_proj": {
"group_size": {
"4": 128
},
"bits": [
4
],
"bits_prop": [
1
],
"scale_bits": 4
},
"up_proj": {
"group_size": {
"4": 128
},
"bits": [
4
],
"bits_prop": [
1
],
"scale_bits": 4
},
"gate_proj": {
"group_size": {
"4": 128
},
"bits": [
4
],
"bits_prop": [
1
],
"scale_bits": 4
},
"down_proj": {
"group_size": {
"4": 128
},
"bits": [
4
],
"bits_prop": [
1
],
"scale_bits": 4
}
},
"model.layers.5": {
"accuracy": 0.9720273017883301,
"total_bits": 697480224,
"q_proj": {
"group_size": {
"4": 128
},
"bits": [
4
],
"bits_prop": [
1
],
"scale_bits": 4
},
"k_proj": {
"group_size": {
"4": 128
},
"bits": [
4
],
"bits_prop": [
1
],
"scale_bits": 4
},
"v_proj": {
"group_size": {
"4": 128
},
"bits": [
4
],
"bits_prop": [
1
],
"scale_bits": 4
},
"o_proj": {
"group_size": {
"4": 128
},
"bits": [
4
],
"bits_prop": [
1
],
"scale_bits": 4
},
"up_proj": {
"group_size": {
"4": 128
},
"bits": [
4
],
"bits_prop": [
1
],
"scale_bits": 4
},
"gate_proj": {
"group_size": {
"4": 128
},
"bits": [
4
],
"bits_prop": [
1
],
"scale_bits": 4
},
"down_proj": {
"group_size": {
"4": 128
},
"bits": [
4
],
"bits_prop": [
1
],
"scale_bits": 4
}
},
"model.layers.6": {
"accuracy": 0.9702110290527344,
"total_bits": 697480224,
"q_proj": {
"group_size": {
"4": 128
},
"bits": [
4
],
"bits_prop": [
1
],
"scale_bits": 4
},
"k_proj": {
"group_size": {
"4": 128
},
"bits": [
4
],
"bits_prop": [
1
],
"scale_bits": 4
},
"v_proj": {
"group_size": {
"4": 128
},
"bits": [
4
],
"bits_prop": [
1
],
"scale_bits": 4
},
"o_proj": {
"group_size": {
"4": 128
},
"bits": [
4
],
"bits_prop": [
1
],
"scale_bits": 4
},
"up_proj": {
"group_size": {
"4": 128
},
"bits": [
4
],
"bits_prop": [
1
],
"scale_bits": 4
},
"gate_proj": {
"group_size": {
"4": 128
},
"bits": [
4
],
"bits_prop": [
1
],
"scale_bits": 4
},
"down_proj": {
"group_size": {
"4": 128
},
"bits": [
4
],
"bits_prop": [
1
],
"scale_bits": 4
}
},
"model.layers.7": {
"accuracy": 0.9707947969436646,
"total_bits": 697480224,
"q_proj": {
"group_size": {
"4": 128
},
"bits": [
4
],
"bits_prop": [
1
],
"scale_bits": 4
},
"k_proj": {
"group_size": {
"4": 128
},
"bits": [
4
],
"bits_prop": [
1
],
"scale_bits": 4
},
"v_proj": {
"group_size": {
"4": 128
},
"bits": [
4
],
"bits_prop": [
1
],
"scale_bits": 4
},
"o_proj": {
"group_size": {
"4": 128
},
"bits": [
4
],
"bits_prop": [
1
],
"scale_bits": 4
},
"up_proj": {
"group_size": {
"4": 128
},
"bits": [
4
],
"bits_prop": [
1
],
"scale_bits": 4
},
"gate_proj": {
"group_size": {
"4": 128
},
"bits": [
4
],
"bits_prop": [
1
],
"scale_bits": 4
},
"down_proj": {
"group_size": {
"4": 128
},
"bits": [
4
],
"bits_prop": [
1
],
"scale_bits": 4
}
},
"model.layers.8": {
"accuracy": 0.9378645420074463,
"total_bits": 508736544,
"q_proj": {
"group_size": {
"4": 128,
"2": 128
},
"bits": [
4,
2
],
"bits_prop": [
0.25,
0.75
],
"scale_bits": 4
},
"k_proj": {
"group_size": {
"4": 128,
"2": 128
},
"bits": [
4,
2
],
"bits_prop": [
0.25,
0.75
],
"scale_bits": 4
},
"v_proj": {
"group_size": {
"4": 128
},
"bits": [
4
],
"bits_prop": [
1.0
],
"scale_bits": 4
},
"o_proj": {
"group_size": {
"4": 128,
"2": 128
},
"bits": [
4,
2
],
"bits_prop": [
0.25,
0.75
],
"scale_bits": 4
},
"up_proj": {
"group_size": {
"4": 128,
"2": 128
},
"bits": [
4,
2
],
"bits_prop": [
0.25,
0.75
],
"scale_bits": 4
},
"gate_proj": {
"group_size": {
"4": 128,
"2": 128
},
"bits": [
4,
2
],
"bits_prop": [
0.25,
0.75
],
"scale_bits": 4
},
"down_proj": {
"group_size": {
"4": 128
},
"bits": [
4
],
"bits_prop": [
1
],
"scale_bits": 4
}
},
"model.layers.9": {
"accuracy": 0.9572443962097168,
"total_bits": 361673760,
"q_proj": {
"group_size": {
"4": 128,
"2": 128
},
"bits": [
4,
2
],
"bits_prop": [
0.01,
0.99
],
"scale_bits": 4
},
"k_proj": {
"group_size": {
"4": 128,
"2": 128
},
"bits": [
4,
2
],
"bits_prop": [
0.01,
0.99
],
"scale_bits": 4
},
"v_proj": {
"group_size": {
"4": 128,
"2": 128
},
"bits": [
4,
2
],
"bits_prop": [
0.05,
0.95
],
"scale_bits": 4
},
"o_proj": {
"group_size": {
"4": 128,
"2": 128
},
"bits": [
4,
2
],
"bits_prop": [
0.02,
0.98
],
"scale_bits": 4
},
"up_proj": {
"group_size": {
"4": 128,
"2": 128
},
"bits": [
4,
2
],
"bits_prop": [
0.01,
0.99
],
"scale_bits": 4
},
"gate_proj": {
"group_size": {
"4": 128,
"2": 128
},
"bits": [
4,
2
],
"bits_prop": [
0.01,
0.99
],
"scale_bits": 4
},
"down_proj": {
"group_size": {
"4": 128,
"2": 128
},
"bits": [
4,
2
],
"bits_prop": [
0.02,
0.98
],
"scale_bits": 4
}
},
"model.layers.10": {
"accuracy": 0.9557219743728638,
"total_bits": 372683808,
"q_proj": {
"group_size": {
"4": 128,
"2": 128
},
"bits": [
4,
2
],
"bits_prop": [
0.05,
0.95
],
"scale_bits": 4
},
"k_proj": {
"group_size": {
"4": 128,
"2": 128
},
"bits": [
4,
2
],
"bits_prop": [
0.05,
0.95
],
"scale_bits": 4
},
"v_proj": {
"group_size": {
"4": 128,
"2": 128
},
"bits": [
4,
2
],
"bits_prop": [
0.05,
0.95
],
"scale_bits": 4
},
"o_proj": {
"group_size": {
"4": 128,
"2": 128
},
"bits": [
4,
2
],
"bits_prop": [
0.05,
0.95
],
"scale_bits": 4
},
"up_proj": {
"group_size": {
"4": 128,
"2": 128
},
"bits": [
4,
2
],
"bits_prop": [
0.05,
0.95
],
"scale_bits": 4
},
"gate_proj": {
"group_size": {
"4": 128,
"2": 128
},
"bits": [
4,
2
],
"bits_prop": [
0.05,
0.95
],
"scale_bits": 4
},
"down_proj": {
"group_size": {
"4": 128,
"2": 128
},
"bits": [
4,
2
],
"bits_prop": [
0.05,
0.95
],
"scale_bits": 4
}
},
"model.layers.11": {
"accuracy": 0.954809308052063,
"total_bits": 405582880,
"q_proj": {
"group_size": {
"4": 128,
"2": 128
},
"bits": [
4,
2
],
"bits_prop": [
0.05,
0.95
],
"scale_bits": 4
},
"k_proj": {
"group_size": {
"4": 128,
"2": 128
},
"bits": [
4,
2
],
"bits_prop": [
0.05,
0.95
],
"scale_bits": 4
},
"v_proj": {
"group_size": {
"4": 128,
"2": 128
},
"bits": [
4,
2
],
"bits_prop": [
0.4,
0.6
],
"scale_bits": 4
},
"o_proj": {
"group_size": {
"4": 128,
"2": 128
},
"bits": [
4,
2
],
"bits_prop": [
0.05,
0.95
],
"scale_bits": 4
},
"up_proj": {
"group_size": {
"4": 128,
"2": 128
},
"bits": [
4,
2
],
"bits_prop": [
0.05,
0.95
],
"scale_bits": 4
},
"gate_proj": {
"group_size": {
"4": 128,
"2": 128
},
"bits": [
4,
2
],
"bits_prop": [
0.05,
0.95
],
"scale_bits": 4
},
"down_proj": {
"group_size": {
"4": 128,
"2": 128
},
"bits": [
4,
2
],
"bits_prop": [
0.4,
0.6
],
"scale_bits": 4
}
},
"model.layers.12": {
"accuracy": 0.9504133462905884,
"total_bits": 405582880,
"q_proj": {
"group_size": {
"4": 128,
"2": 128
},
"bits": [
4,
2
],
"bits_prop": [
0.05,
0.95
],
"scale_bits": 4
},
"k_proj": {
"group_size": {
"4": 128,
"2": 128
},
"bits": [
4,
2
],
"bits_prop": [
0.05,
0.95
],
"scale_bits": 4
},
"v_proj": {
"group_size": {
"4": 128,
"2": 128
},
"bits": [
4,
2
],
"bits_prop": [
0.4,
0.6
],
"scale_bits": 4
},
"o_proj": {
"group_size": {
"4": 128,
"2": 128
},
"bits": [
4,
2
],
"bits_prop": [
0.05,
0.95
],
"scale_bits": 4
},
"up_proj": {
"group_size": {
"4": 128,
"2": 128
},
"bits": [
4,
2
],
"bits_prop": [
0.05,
0.95
],
"scale_bits": 4
},
"gate_proj": {
"group_size": {
"4": 128,
"2": 128
},
"bits": [
4,
2
],
"bits_prop": [
0.05,
0.95
],
"scale_bits": 4
},
"down_proj": {
"group_size": {
"4": 128,
"2": 128
},
"bits": [
4,
2
],
"bits_prop": [
0.4,
0.6
],
"scale_bits": 4
}
},
"model.layers.13": {
"accuracy": 0.9481167793273926,
"total_bits": 405582880,
"q_proj": {
"group_size": {
"4": 128,
"2": 128
},
"bits": [
4,
2
],
"bits_prop": [
0.05,
0.95
],
"scale_bits": 4
},
"k_proj": {
"group_size": {
"4": 128,
"2": 128
},
"bits": [
4,
2
],
"bits_prop": [
0.05,
0.95
],
"scale_bits": 4
},
"v_proj": {
"group_size": {
"4": 128,
"2": 128
},
"bits": [
4,
2
],
"bits_prop": [
0.4,
0.6
],
"scale_bits": 4
},
"o_proj": {
"group_size": {
"4": 128,
"2": 128
},
"bits": [
4,
2
],
"bits_prop": [
0.05,
0.95
],
"scale_bits": 4
},
"up_proj": {
"group_size": {
"4": 128,
"2": 128
},
"bits": [
4,
2
],
"bits_prop": [
0.05,
0.95
],
"scale_bits": 4
},
"gate_proj": {
"group_size": {
"4": 128,
"2": 128
},
"bits": [
4,
2
],
"bits_prop": [
0.05,
0.95
],
"scale_bits": 4
},
"down_proj": {
"group_size": {
"4": 128,
"2": 128
},
"bits": [
4,
2
],
"bits_prop": [
0.4,
0.6
],
"scale_bits": 4
}
},
"model.layers.14": {
"accuracy": 0.9468015432357788,
"total_bits": 405582880,
"q_proj": {
"group_size": {
"4": 128,
"2": 128
},
"bits": [
4,
2
],
"bits_prop": [
0.05,
0.95
],
"scale_bits": 4
},
"k_proj": {
"group_size": {
"4": 128,
"2": 128
},
"bits": [
4,
2
],
"bits_prop": [
0.05,
0.95
],
"scale_bits": 4
},
"v_proj": {
"group_size": {
"4": 128,
"2": 128
},
"bits": [
4,
2
],
"bits_prop": [
0.4,
0.6
],
"scale_bits": 4
},
"o_proj": {
"group_size": {
"4": 128,
"2": 128
},
"bits": [
4,
2
],
"bits_prop": [
0.05,
0.95
],
"scale_bits": 4
},
"up_proj": {
"group_size": {
"4": 128,
"2": 128
},
"bits": [
4,
2
],
"bits_prop": [
0.05,
0.95
],
"scale_bits": 4
},
"gate_proj": {
"group_size": {
"4": 128,
"2": 128
},
"bits": [
4,
2
],
"bits_prop": [
0.05,
0.95
],
"scale_bits": 4
},
"down_proj": {
"group_size": {
"4": 128,
"2": 128
},
"bits": [
4,
2
],
"bits_prop": [
0.4,
0.6
],
"scale_bits": 4
}
},
"model.layers.15": {
"accuracy": 0.9613559246063232,
"total_bits": 508736544,
"q_proj": {
"group_size": {
"4": 128,
"2": 128
},
"bits": [
4,
2
],
"bits_prop": [
0.25,
0.75
],
"scale_bits": 4
},
"k_proj": {
"group_size": {
"4": 128,
"2": 128
},
"bits": [
4,
2
],
"bits_prop": [
0.25,
0.75
],
"scale_bits": 4
},
"v_proj": {
"group_size": {
"4": 128
},
"bits": [
4
],
"bits_prop": [
1.0
],
"scale_bits": 4
},
"o_proj": {
"group_size": {
"4": 128,
"2": 128
},
"bits": [
4,
2
],
"bits_prop": [
0.25,
0.75
],
"scale_bits": 4
},
"up_proj": {
"group_size": {
"4": 128,
"2": 128
},
"bits": [
4,
2
],
"bits_prop": [
0.25,
0.75
],
"scale_bits": 4
},
"gate_proj": {
"group_size": {
"4": 128,
"2": 128
},
"bits": [
4,
2
],
"bits_prop": [
0.25,
0.75
],
"scale_bits": 4
},
"down_proj": {
"group_size": {
"4": 128
},
"bits": [
4
],
"bits_prop": [
1
],
"scale_bits": 4
}
},
"model.layers.16": {
"accuracy": 0.960334300994873,
"total_bits": 508736544,
"q_proj": {
"group_size": {
"4": 128,
"2": 128
},
"bits": [
4,
2
],
"bits_prop": [
0.25,
0.75
],
"scale_bits": 4
},
"k_proj": {
"group_size": {
"4": 128,
"2": 128
},
"bits": [
4,
2
],
"bits_prop": [
0.25,
0.75
],
"scale_bits": 4
},
"v_proj": {
"group_size": {
"4": 128
},
"bits": [
4
],
"bits_prop": [
1.0
],
"scale_bits": 4
},
"o_proj": {
"group_size": {
"4": 128,
"2": 128
},
"bits": [
4,
2
],
"bits_prop": [
0.25,
0.75
],
"scale_bits": 4
},
"up_proj": {
"group_size": {
"4": 128,
"2": 128
},
"bits": [
4,
2
],
"bits_prop": [
0.25,
0.75
],
"scale_bits": 4
},
"gate_proj": {
"group_size": {
"4": 128,
"2": 128
},
"bits": [
4,
2
],
"bits_prop": [
0.25,
0.75
],
"scale_bits": 4
},
"down_proj": {
"group_size": {
"4": 128
},
"bits": [
4
],
"bits_prop": [
1
],
"scale_bits": 4
}
},
"model.layers.17": {
"accuracy": 0.9556019306182861,
"total_bits": 508736544,
"q_proj": {
"group_size": {
"4": 128,
"2": 128
},
"bits": [
4,
2
],
"bits_prop": [
0.25,
0.75
],
"scale_bits": 4
},
"k_proj": {
"group_size": {
"4": 128,
"2": 128
},
"bits": [
4,
2
],
"bits_prop": [
0.25,
0.75
],
"scale_bits": 4
},
"v_proj": {
"group_size": {
"4": 128
},
"bits": [
4
],
"bits_prop": [
1.0
],
"scale_bits": 4
},
"o_proj": {
"group_size": {
"4": 128,
"2": 128
},
"bits": [
4,
2
],
"bits_prop": [
0.25,
0.75
],
"scale_bits": 4
},
"up_proj": {
"group_size": {
"4": 128,
"2": 128
},
"bits": [
4,
2
],
"bits_prop": [
0.25,
0.75
],
"scale_bits": 4
},
"gate_proj": {
"group_size": {
"4": 128,
"2": 128
},
"bits": [
4,
2
],
"bits_prop": [
0.25,
0.75
],
"scale_bits": 4
},
"down_proj": {
"group_size": {
"4": 128
},
"bits": [
4
],
"bits_prop": [
1
],
"scale_bits": 4
}
},
"model.layers.18": {
"accuracy": 0.9482923746109009,
"total_bits": 508736544,
"q_proj": {
"group_size": {
"4": 128,
"2": 128
},
"bits": [
4,
2
],
"bits_prop": [
0.25,
0.75
],
"scale_bits": 4
},
"k_proj": {
"group_size": {
"4": 128,
"2": 128
},
"bits": [
4,
2
],
"bits_prop": [
0.25,
0.75
],
"scale_bits": 4
},
"v_proj": {
"group_size": {
"4": 128
},
"bits": [
4
],
"bits_prop": [
1.0
],
"scale_bits": 4
},
"o_proj": {
"group_size": {
"4": 128,
"2": 128
},
"bits": [
4,
2
],
"bits_prop": [
0.25,
0.75
],
"scale_bits": 4
},
"up_proj": {
"group_size": {
"4": 128,
"2": 128
},
"bits": [
4,
2
],
"bits_prop": [
0.25,
0.75
],
"scale_bits": 4
},
"gate_proj": {
"group_size": {
"4": 128,
"2": 128
},
"bits": [
4,
2
],
"bits_prop": [
0.25,
0.75
],
"scale_bits": 4
},
"down_proj": {
"group_size": {
"4": 128
},
"bits": [
4
],
"bits_prop": [
1
],
"scale_bits": 4
}
},
"model.layers.19": {
"accuracy": 0.9474902153015137,
"total_bits": 508736544,
"q_proj": {
"group_size": {
"4": 128,
"2": 128
},
"bits": [
4,
2
],
"bits_prop": [
0.25,
0.75
],
"scale_bits": 4
},
"k_proj": {
"group_size": {
"4": 128,
"2": 128
},
"bits": [
4,
2
],
"bits_prop": [
0.25,
0.75
],
"scale_bits": 4
},
"v_proj": {
"group_size": {
"4": 128
},
"bits": [
4
],
"bits_prop": [
1.0
],
"scale_bits": 4
},
"o_proj": {
"group_size": {
"4": 128,
"2": 128
},
"bits": [
4,
2
],
"bits_prop": [
0.25,
0.75
],
"scale_bits": 4
},
"up_proj": {
"group_size": {
"4": 128,
"2": 128
},
"bits": [
4,
2
],
"bits_prop": [
0.25,
0.75
],
"scale_bits": 4
},
"gate_proj": {
"group_size": {
"4": 128,
"2": 128
},
"bits": [
4,
2
],
"bits_prop": [
0.25,
0.75
],
"scale_bits": 4
},
"down_proj": {
"group_size": {
"4": 128
},
"bits": [
4
],
"bits_prop": [
1
],
"scale_bits": 4
}
},
"model.layers.20": {
"accuracy": 0.9444401264190674,
"total_bits": 508736544,
"q_proj": {
"group_size": {
"4": 128,
"2": 128
},
"bits": [
4,
2
],
"bits_prop": [
0.25,
0.75
],
"scale_bits": 4
},
"k_proj": {
"group_size": {
"4": 128,
"2": 128
},
"bits": [
4,
2
],
"bits_prop": [
0.25,
0.75
],
"scale_bits": 4
},
"v_proj": {
"group_size": {
"4": 128
},
"bits": [
4
],
"bits_prop": [
1.0
],
"scale_bits": 4
},
"o_proj": {
"group_size": {
"4": 128,
"2": 128
},
"bits": [
4,
2
],
"bits_prop": [
0.25,
0.75
],
"scale_bits": 4
},
"up_proj": {
"group_size": {
"4": 128,
"2": 128
},
"bits": [
4,
2
],
"bits_prop": [
0.25,
0.75
],
"scale_bits": 4
},
"gate_proj": {
"group_size": {
"4": 128,
"2": 128
},
"bits": [
4,
2
],
"bits_prop": [
0.25,
0.75
],
"scale_bits": 4
},
"down_proj": {
"group_size": {
"4": 128
},
"bits": [
4
],
"bits_prop": [
1
],
"scale_bits": 4
}
},
"model.layers.21": {
"accuracy": 0.9444293975830078,
"total_bits": 508736544,
"q_proj": {
"group_size": {
"4": 128,
"2": 128
},
"bits": [
4,
2
],
"bits_prop": [
0.25,
0.75
],
"scale_bits": 4
},
"k_proj": {
"group_size": {
"4": 128,
"2": 128
},
"bits": [
4,
2
],
"bits_prop": [
0.25,
0.75
],
"scale_bits": 4
},
"v_proj": {
"group_size": {
"4": 128
},
"bits": [
4
],
"bits_prop": [
1.0
],
"scale_bits": 4
},
"o_proj": {
"group_size": {
"4": 128,
"2": 128
},
"bits": [
4,
2
],
"bits_prop": [
0.25,
0.75
],
"scale_bits": 4
},
"up_proj": {
"group_size": {
"4": 128,
"2": 128
},
"bits": [
4,
2
],
"bits_prop": [
0.25,
0.75
],
"scale_bits": 4
},
"gate_proj": {
"group_size": {
"4": 128,
"2": 128
},
"bits": [
4,
2
],
"bits_prop": [
0.25,
0.75
],
"scale_bits": 4
},
"down_proj": {
"group_size": {
"4": 128
},
"bits": [
4
],
"bits_prop": [
1
],
"scale_bits": 4
}
},
"model.layers.22": {
"accuracy": 0.9623349905014038,
"total_bits": 634565664,
"q_proj": {
"group_size": {
"4": 128,
"2": 128
},
"bits": [
4,
2
],
"bits_prop": [
0.75,
0.25
],
"scale_bits": 4
},
"k_proj": {
"group_size": {
"4": 128,
"2": 128
},
"bits": [
4,
2
],
"bits_prop": [
0.75,
0.25
],
"scale_bits": 4
},
"v_proj": {
"group_size": {
"4": 128
},
"bits": [
4
],
"bits_prop": [
1.0
],
"scale_bits": 4
},
"o_proj": {
"group_size": {
"4": 128,
"2": 128
},
"bits": [
4,
2
],
"bits_prop": [
0.75,
0.25
],
"scale_bits": 4
},
"up_proj": {
"group_size": {
"4": 128,
"2": 128
},
"bits": [
4,
2
],
"bits_prop": [
0.75,
0.25
],
"scale_bits": 4
},
"gate_proj": {
"group_size": {
"4": 128,
"2": 128
},
"bits": [
4,
2
],
"bits_prop": [
0.75,
0.25
],
"scale_bits": 4
},
"down_proj": {
"group_size": {
"4": 128
},
"bits": [
4
],
"bits_prop": [
1.0
],
"scale_bits": 4
}
},
"model.layers.23": {
"accuracy": 0.9492499828338623,
"total_bits": 571651104,
"q_proj": {
"group_size": {
"4": 128,
"2": 128
},
"bits": [
4,
2
],
"bits_prop": [
0.5,
0.5
],
"scale_bits": 4
},
"k_proj": {
"group_size": {
"4": 128,
"2": 128
},
"bits": [
4,
2
],
"bits_prop": [
0.5,
0.5
],
"scale_bits": 4
},
"v_proj": {
"group_size": {
"4": 128
},
"bits": [
4
],
"bits_prop": [
1.0
],
"scale_bits": 4
},
"o_proj": {
"group_size": {
"4": 128,
"2": 128
},
"bits": [
4,
2
],
"bits_prop": [
0.5,
0.5
],
"scale_bits": 4
},
"up_proj": {
"group_size": {
"4": 128,
"2": 128
},
"bits": [
4,
2
],
"bits_prop": [
0.5,
0.5
],
"scale_bits": 4
},
"gate_proj": {
"group_size": {
"4": 128,
"2": 128
},
"bits": [
4,
2
],
"bits_prop": [
0.5,
0.5
],
"scale_bits": 4
},
"down_proj": {
"group_size": {
"4": 128
},
"bits": [
4
],
"bits_prop": [
1.0
],
"scale_bits": 4
}
},
"model.layers.24": {
"accuracy": 0.9491121768951416,
"total_bits": 571651104,
"q_proj": {
"group_size": {
"4": 128,
"2": 128
},
"bits": [
4,
2
],
"bits_prop": [
0.5,
0.5
],
"scale_bits": 4
},
"k_proj": {
"group_size": {
"4": 128,
"2": 128
},
"bits": [
4,
2
],
"bits_prop": [
0.5,
0.5
],
"scale_bits": 4
},
"v_proj": {
"group_size": {
"4": 128
},
"bits": [
4
],
"bits_prop": [
1.0
],
"scale_bits": 4
},
"o_proj": {
"group_size": {
"4": 128,
"2": 128
},
"bits": [
4,
2
],
"bits_prop": [
0.5,
0.5
],
"scale_bits": 4
},
"up_proj": {
"group_size": {
"4": 128,
"2": 128
},
"bits": [
4,
2
],
"bits_prop": [
0.5,
0.5
],
"scale_bits": 4
},
"gate_proj": {
"group_size": {
"4": 128,
"2": 128
},
"bits": [
4,
2
],
"bits_prop": [
0.5,
0.5
],
"scale_bits": 4
},
"down_proj": {
"group_size": {
"4": 128
},
"bits": [
4
],
"bits_prop": [
1.0
],
"scale_bits": 4
}
},
"model.layers.25": {
"accuracy": 0.9408369064331055,
"total_bits": 508736544,
"q_proj": {
"group_size": {
"4": 128,
"2": 128
},
"bits": [
4,
2
],
"bits_prop": [
0.25,
0.75
],
"scale_bits": 4
},
"k_proj": {
"group_size": {
"4": 128,
"2": 128
},
"bits": [
4,
2
],
"bits_prop": [
0.25,
0.75
],
"scale_bits": 4
},
"v_proj": {
"group_size": {
"4": 128
},
"bits": [
4
],
"bits_prop": [
1.0
],
"scale_bits": 4
},
"o_proj": {
"group_size": {
"4": 128,
"2": 128
},
"bits": [
4,
2
],
"bits_prop": [
0.25,
0.75
],
"scale_bits": 4
},
"up_proj": {
"group_size": {
"4": 128,
"2": 128
},
"bits": [
4,
2
],
"bits_prop": [
0.25,
0.75
],
"scale_bits": 4
},
"gate_proj": {
"group_size": {
"4": 128,
"2": 128
},
"bits": [
4,
2
],
"bits_prop": [
0.25,
0.75
],
"scale_bits": 4
},
"down_proj": {
"group_size": {
"4": 128
},
"bits": [
4
],
"bits_prop": [
1
],
"scale_bits": 4
}
},
"model.layers.26": {
"accuracy": 0.9524426460266113,
"total_bits": 571651104,
"q_proj": {
"group_size": {
"4": 128,
"2": 128
},
"bits": [
4,
2
],
"bits_prop": [
0.5,
0.5
],
"scale_bits": 4
},
"k_proj": {
"group_size": {
"4": 128,
"2": 128
},
"bits": [
4,
2
],
"bits_prop": [
0.5,
0.5
],
"scale_bits": 4
},
"v_proj": {
"group_size": {
"4": 128
},
"bits": [
4
],
"bits_prop": [
1.0
],
"scale_bits": 4
},
"o_proj": {
"group_size": {
"4": 128,
"2": 128
},
"bits": [
4,
2
],
"bits_prop": [
0.5,
0.5
],
"scale_bits": 4
},
"up_proj": {
"group_size": {
"4": 128,
"2": 128
},
"bits": [
4,
2
],
"bits_prop": [
0.5,
0.5
],
"scale_bits": 4
},
"gate_proj": {
"group_size": {
"4": 128,
"2": 128
},
"bits": [
4,
2
],
"bits_prop": [
0.5,
0.5
],
"scale_bits": 4
},
"down_proj": {
"group_size": {
"4": 128
},
"bits": [
4
],
"bits_prop": [
1.0
],
"scale_bits": 4
}
},
"model.layers.27": {
"accuracy": 0.9414148330688477,
"total_bits": 508736544,
"q_proj": {
"group_size": {
"4": 128,
"2": 128
},
"bits": [
4,
2
],
"bits_prop": [
0.25,
0.75
],
"scale_bits": 4
},
"k_proj": {
"group_size": {
"4": 128,
"2": 128
},
"bits": [
4,
2
],
"bits_prop": [
0.25,
0.75
],
"scale_bits": 4
},
"v_proj": {
"group_size": {
"4": 128
},
"bits": [
4
],
"bits_prop": [
1.0
],
"scale_bits": 4
},
"o_proj": {
"group_size": {
"4": 128,
"2": 128
},
"bits": [
4,
2
],
"bits_prop": [
0.25,
0.75
],
"scale_bits": 4
},
"up_proj": {
"group_size": {
"4": 128,
"2": 128
},
"bits": [
4,
2
],
"bits_prop": [
0.25,
0.75
],
"scale_bits": 4
},
"gate_proj": {
"group_size": {
"4": 128,
"2": 128
},
"bits": [
4,
2
],
"bits_prop": [
0.25,
0.75
],
"scale_bits": 4
},
"down_proj": {
"group_size": {
"4": 128
},
"bits": [
4
],
"bits_prop": [
1
],
"scale_bits": 4
}
},
"model.layers.28": {
"accuracy": 0.9438059329986572,
"total_bits": 508736544,
"q_proj": {
"group_size": {
"4": 128,
"2": 128
},
"bits": [
4,
2
],
"bits_prop": [
0.25,
0.75
],
"scale_bits": 4
},
"k_proj": {
"group_size": {
"4": 128,
"2": 128
},
"bits": [
4,
2
],
"bits_prop": [
0.25,
0.75
],
"scale_bits": 4
},
"v_proj": {
"group_size": {
"4": 128
},
"bits": [
4
],
"bits_prop": [
1.0
],
"scale_bits": 4
},
"o_proj": {
"group_size": {
"4": 128,
"2": 128
},
"bits": [
4,
2
],
"bits_prop": [
0.25,
0.75
],
"scale_bits": 4
},
"up_proj": {
"group_size": {
"4": 128,
"2": 128
},
"bits": [
4,
2
],
"bits_prop": [
0.25,
0.75
],
"scale_bits": 4
},
"gate_proj": {
"group_size": {
"4": 128,
"2": 128
},
"bits": [
4,
2
],
"bits_prop": [
0.25,
0.75
],
"scale_bits": 4
},
"down_proj": {
"group_size": {
"4": 128
},
"bits": [
4
],
"bits_prop": [
1
],
"scale_bits": 4
}
},
"model.layers.29": {
"accuracy": 0.9475662708282471,
"total_bits": 508736544,
"q_proj": {
"group_size": {
"4": 128,
"2": 128
},
"bits": [
4,
2
],
"bits_prop": [
0.25,
0.75
],
"scale_bits": 4
},
"k_proj": {
"group_size": {
"4": 128,
"2": 128
},
"bits": [
4,
2
],
"bits_prop": [
0.25,
0.75
],
"scale_bits": 4
},
"v_proj": {
"group_size": {
"4": 128
},
"bits": [
4
],
"bits_prop": [
1.0
],
"scale_bits": 4
},
"o_proj": {
"group_size": {
"4": 128,
"2": 128
},
"bits": [
4,
2
],
"bits_prop": [
0.25,
0.75
],
"scale_bits": 4
},
"up_proj": {
"group_size": {
"4": 128,
"2": 128
},
"bits": [
4,
2
],
"bits_prop": [
0.25,
0.75
],
"scale_bits": 4
},
"gate_proj": {
"group_size": {
"4": 128,
"2": 128
},
"bits": [
4,
2
],
"bits_prop": [
0.25,
0.75
],
"scale_bits": 4
},
"down_proj": {
"group_size": {
"4": 128
},
"bits": [
4
],
"bits_prop": [
1
],
"scale_bits": 4
}
},
"model.layers.30": {
"accuracy": 0.9529297351837158,
"total_bits": 508736544,
"q_proj": {
"group_size": {
"4": 128,
"2": 128
},
"bits": [
4,
2
],
"bits_prop": [
0.25,
0.75
],
"scale_bits": 4
},
"k_proj": {
"group_size": {
"4": 128,
"2": 128
},
"bits": [
4,
2
],
"bits_prop": [
0.25,
0.75
],
"scale_bits": 4
},
"v_proj": {
"group_size": {
"4": 128
},
"bits": [
4
],
"bits_prop": [
1.0
],
"scale_bits": 4
},
"o_proj": {
"group_size": {
"4": 128,
"2": 128
},
"bits": [
4,
2
],
"bits_prop": [
0.25,
0.75
],
"scale_bits": 4
},
"up_proj": {
"group_size": {
"4": 128,
"2": 128
},
"bits": [
4,
2
],
"bits_prop": [
0.25,
0.75
],
"scale_bits": 4
},
"gate_proj": {
"group_size": {
"4": 128,
"2": 128
},
"bits": [
4,
2
],
"bits_prop": [
0.25,
0.75
],
"scale_bits": 4
},
"down_proj": {
"group_size": {
"4": 128
},
"bits": [
4
],
"bits_prop": [
1
],
"scale_bits": 4
}
},
"model.layers.31": {
"accuracy": 0.9391093254089355,
"total_bits": 508736544,
"q_proj": {
"group_size": {
"4": 128,
"2": 128
},
"bits": [
4,
2
],
"bits_prop": [
0.25,
0.75
],
"scale_bits": 4
},
"k_proj": {
"group_size": {
"4": 128,
"2": 128
},
"bits": [
4,
2
],
"bits_prop": [
0.25,
0.75
],
"scale_bits": 4
},
"v_proj": {
"group_size": {
"4": 128
},
"bits": [
4
],
"bits_prop": [
1.0
],
"scale_bits": 4
},
"o_proj": {
"group_size": {
"4": 128,
"2": 128
},
"bits": [
4,
2
],
"bits_prop": [
0.25,
0.75
],
"scale_bits": 4
},
"up_proj": {
"group_size": {
"4": 128,
"2": 128
},
"bits": [
4,
2
],
"bits_prop": [
0.25,
0.75
],
"scale_bits": 4
},
"gate_proj": {
"group_size": {
"4": 128,
"2": 128
},
"bits": [
4,
2
],
"bits_prop": [
0.25,
0.75
],
"scale_bits": 4
},
"down_proj": {
"group_size": {
"4": 128
},
"bits": [
4
],
"bits_prop": [
1
],
"scale_bits": 4
}
}
}
}