{ "measurement": { "model.layers.0": { "accuracy": 0.9154543876647949, "total_bits": 539218464, "q_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "k_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "v_proj": { "group_size": { "4": 128 }, "bits": [ 4 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "o_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "up_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "gate_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "down_proj": { "group_size": { "4": 128 }, "bits": [ 4 ], "bits_prop": [ 1 ], "scale_bits": 4 } }, "model.layers.1": { "accuracy": 0.9234476089477539, "total_bits": 694042656, "q_proj": { "group_size": { "4": 128 }, "bits": [ 4 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "k_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "v_proj": { "group_size": { "4": 128 }, "bits": [ 4 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "o_proj": { "group_size": { "4": 128 }, "bits": [ 4 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "up_proj": { "group_size": { "4": 128 }, "bits": [ 4 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "gate_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "down_proj": { "group_size": { "4": 128 }, "bits": [ 4 ], "bits_prop": [ 1 ], "scale_bits": 4 } }, "model.layers.2": { "accuracy": 0.9642077088356018, "total_bits": 417425472, "q_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "k_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "v_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "o_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "up_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "gate_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "down_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 } }, "model.layers.3": { "accuracy": 0.9546152353286743, "total_bits": 417425472, "q_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "k_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "v_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "o_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "up_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "gate_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "down_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 } }, "model.layers.4": { "accuracy": 0.9506402015686035, "total_bits": 417425472, "q_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "k_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "v_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "o_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "up_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "gate_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "down_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 } }, "model.layers.5": { "accuracy": 0.9440557956695557, "total_bits": 417425472, "q_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "k_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "v_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "o_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "up_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "gate_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "down_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 } }, "model.layers.6": { "accuracy": 0.9394266605377197, "total_bits": 417425472, "q_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "k_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "v_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "o_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "up_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "gate_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "down_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 } }, "model.layers.7": { "accuracy": 0.9329638481140137, "total_bits": 417425472, "q_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "k_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "v_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "o_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "up_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "gate_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "down_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 } }, "model.layers.8": { "accuracy": 0.9258372783660889, "total_bits": 417425472, "q_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "k_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "v_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "o_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "up_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "gate_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "down_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 } }, "model.layers.9": { "accuracy": 0.9274423122406006, "total_bits": 417425472, "q_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "k_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "v_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "o_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "up_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "gate_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "down_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 } }, "model.layers.10": { "accuracy": 0.9295330047607422, "total_bits": 450454080, "q_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "k_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "v_proj": { "group_size": { "4": 128 }, "bits": [ 4 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "o_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "up_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "gate_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "down_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 } }, "model.layers.11": { "accuracy": 0.9301164150238037, "total_bits": 450454080, "q_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "k_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "v_proj": { "group_size": { "4": 128 }, "bits": [ 4 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "o_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "up_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "gate_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "down_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 } }, "model.layers.12": { "accuracy": 0.9286305904388428, "total_bits": 450454080, "q_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "k_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "v_proj": { "group_size": { "4": 128 }, "bits": [ 4 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "o_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "up_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "gate_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "down_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 } }, "model.layers.13": { "accuracy": 0.928272008895874, "total_bits": 450454080, "q_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "k_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "v_proj": { "group_size": { "4": 128 }, "bits": [ 4 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "o_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "up_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "gate_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "down_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 } }, "model.layers.14": { "accuracy": 0.9258906841278076, "total_bits": 450454080, "q_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "k_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "v_proj": { "group_size": { "4": 128 }, "bits": [ 4 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "o_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "up_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "gate_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "down_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 } }, "model.layers.15": { "accuracy": 0.9167225360870361, "total_bits": 417425472, "q_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "k_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "v_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "o_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "up_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "gate_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "down_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 } }, "model.layers.16": { "accuracy": 0.9192557334899902, "total_bits": 450454080, "q_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "k_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "v_proj": { "group_size": { "4": 128 }, "bits": [ 4 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "o_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "up_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "gate_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "down_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 } }, "model.layers.17": { "accuracy": 0.917506217956543, "total_bits": 417425472, "q_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "k_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "v_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "o_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "up_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "gate_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "down_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 } }, "model.layers.18": { "accuracy": 0.9152529239654541, "total_bits": 417425472, "q_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "k_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "v_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "o_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "up_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "gate_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "down_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 } }, "model.layers.19": { "accuracy": 0.9192636013031006, "total_bits": 417425472, "q_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "k_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "v_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "o_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "up_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "gate_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "down_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 } }, "model.layers.20": { "accuracy": 0.9172792434692383, "total_bits": 417425472, "q_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "k_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "v_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "o_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "up_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "gate_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "down_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 } }, "model.layers.21": { "accuracy": 0.9207854270935059, "total_bits": 417425472, "q_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "k_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "v_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "o_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "up_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "gate_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "down_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 } }, "model.layers.22": { "accuracy": 0.9163947105407715, "total_bits": 417425472, "q_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "k_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "v_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "o_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "up_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "gate_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "down_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 } }, "model.layers.23": { "accuracy": 0.919762372970581, "total_bits": 417425472, "q_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "k_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "v_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "o_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "up_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "gate_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "down_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 } }, "model.layers.24": { "accuracy": 0.9207882881164551, "total_bits": 417425472, "q_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "k_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "v_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "o_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "up_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "gate_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "down_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 } }, "model.layers.25": { "accuracy": 0.9172525405883789, "total_bits": 417425472, "q_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "k_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "v_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "o_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "up_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "gate_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "down_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 } }, "model.layers.26": { "accuracy": 0.9163837432861328, "total_bits": 417425472, "q_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "k_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "v_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "o_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "up_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "gate_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "down_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 } }, "model.layers.27": { "accuracy": 0.9160265922546387, "total_bits": 417425472, "q_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "k_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "v_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "o_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "up_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "gate_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "down_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 } }, "model.layers.28": { "accuracy": 0.9134340286254883, "total_bits": 417425472, "q_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "k_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "v_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "o_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "up_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "gate_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "down_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 } }, "model.layers.29": { "accuracy": 0.9112701416015625, "total_bits": 417425472, "q_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "k_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "v_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "o_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "up_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "gate_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "down_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 } }, "model.layers.30": { "accuracy": 0.9056534767150879, "total_bits": 506189856, "q_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "k_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "v_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "o_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "up_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "gate_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "down_proj": { "group_size": { "4": 128 }, "bits": [ 4 ], "bits_prop": [ 1 ], "scale_bits": 4 } }, "model.layers.31": { "accuracy": 0.9172563552856445, "total_bits": 605275680, "q_proj": { "group_size": { "4": 128 }, "bits": [ 4 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "k_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "v_proj": { "group_size": { "4": 128 }, "bits": [ 4 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "o_proj": { "group_size": { "4": 128 }, "bits": [ 4 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "up_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "gate_proj": { "group_size": { "2": 64 }, "bits": [ 2 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "down_proj": { "group_size": { "4": 128 }, "bits": [ 4 ], "bits_prop": [ 1 ], "scale_bits": 4 } } } }