{ "measurement": { "model.layers.0": { "accuracy": 0.9379796981811523, "total_bits": 372683808, "q_proj": { "group_size": { "4": 128, "2": 128 }, "bits": [ 4, 2 ], "bits_prop": [ 0.05, 0.95 ], "scale_bits": 4 }, "k_proj": { "group_size": { "4": 128, "2": 128 }, "bits": [ 4, 2 ], "bits_prop": [ 0.05, 0.95 ], "scale_bits": 4 }, "v_proj": { "group_size": { "4": 128, "2": 128 }, "bits": [ 4, 2 ], "bits_prop": [ 0.05, 0.95 ], "scale_bits": 4 }, "o_proj": { "group_size": { "4": 128, "2": 128 }, "bits": [ 4, 2 ], "bits_prop": [ 0.05, 0.95 ], "scale_bits": 4 }, "up_proj": { "group_size": { "4": 128, "2": 128 }, "bits": [ 4, 2 ], "bits_prop": [ 0.05, 0.95 ], "scale_bits": 4 }, "gate_proj": { "group_size": { "4": 128, "2": 128 }, "bits": [ 4, 2 ], "bits_prop": [ 0.05, 0.95 ], "scale_bits": 4 }, "down_proj": { "group_size": { "4": 128, "2": 128 }, "bits": [ 4, 2 ], "bits_prop": [ 0.05, 0.95 ], "scale_bits": 4 } }, "model.layers.1": { "accuracy": 0.940488338470459, "total_bits": 402699296, "q_proj": { "group_size": { "4": 128, "2": 128 }, "bits": [ 4, 2 ], "bits_prop": [ 0.1, 0.9 ], "scale_bits": 4 }, "k_proj": { "group_size": { "4": 128, "2": 128 }, "bits": [ 4, 2 ], "bits_prop": [ 0.1, 0.9 ], "scale_bits": 4 }, "v_proj": { "group_size": { "4": 128, "2": 128 }, "bits": [ 4, 2 ], "bits_prop": [ 0.2, 0.8 ], "scale_bits": 4 }, "o_proj": { "group_size": { "4": 128, "2": 128 }, "bits": [ 4, 2 ], "bits_prop": [ 0.1, 0.9 ], "scale_bits": 4 }, "up_proj": { "group_size": { "4": 128, "2": 128 }, "bits": [ 4, 2 ], "bits_prop": [ 0.1, 0.9 ], "scale_bits": 4 }, "gate_proj": { "group_size": { "4": 128, "2": 128 }, "bits": [ 4, 2 ], "bits_prop": [ 0.1, 0.9 ], "scale_bits": 4 }, "down_proj": { "group_size": { "4": 128, "2": 128 }, "bits": [ 4, 2 ], "bits_prop": [ 0.2, 0.8 ], "scale_bits": 4 } }, "model.layers.2": { "accuracy": 0.9580041170120239, "total_bits": 634565664, "q_proj": { "group_size": { "4": 128, "2": 128 }, "bits": [ 4, 2 ], "bits_prop": [ 0.75, 0.25 ], "scale_bits": 4 }, "k_proj": { "group_size": { "4": 128, "2": 128 }, "bits": [ 4, 2 ], "bits_prop": [ 0.75, 0.25 ], "scale_bits": 4 }, "v_proj": { "group_size": { "4": 128 }, "bits": [ 4 ], "bits_prop": [ 1.0 ], "scale_bits": 4 }, "o_proj": { "group_size": { "4": 128, "2": 128 }, "bits": [ 4, 2 ], "bits_prop": [ 0.75, 0.25 ], "scale_bits": 4 }, "up_proj": { "group_size": { "4": 128, "2": 128 }, "bits": [ 4, 2 ], "bits_prop": [ 0.75, 0.25 ], "scale_bits": 4 }, "gate_proj": { "group_size": { "4": 128, "2": 128 }, "bits": [ 4, 2 ], "bits_prop": [ 0.75, 0.25 ], "scale_bits": 4 }, "down_proj": { "group_size": { "4": 128 }, "bits": [ 4 ], "bits_prop": [ 1.0 ], "scale_bits": 4 } }, "model.layers.3": { "accuracy": 0.9445068836212158, "total_bits": 571651104, "q_proj": { "group_size": { "4": 128, "2": 128 }, "bits": [ 4, 2 ], "bits_prop": [ 0.5, 0.5 ], "scale_bits": 4 }, "k_proj": { "group_size": { "4": 128, "2": 128 }, "bits": [ 4, 2 ], "bits_prop": [ 0.5, 0.5 ], "scale_bits": 4 }, "v_proj": { "group_size": { "4": 128 }, "bits": [ 4 ], "bits_prop": [ 1.0 ], "scale_bits": 4 }, "o_proj": { "group_size": { "4": 128, "2": 128 }, "bits": [ 4, 2 ], "bits_prop": [ 0.5, 0.5 ], "scale_bits": 4 }, "up_proj": { "group_size": { "4": 128, "2": 128 }, "bits": [ 4, 2 ], "bits_prop": [ 0.5, 0.5 ], "scale_bits": 4 }, "gate_proj": { "group_size": { "4": 128, "2": 128 }, "bits": [ 4, 2 ], "bits_prop": [ 0.5, 0.5 ], "scale_bits": 4 }, "down_proj": { "group_size": { "4": 128 }, "bits": [ 4 ], "bits_prop": [ 1.0 ], "scale_bits": 4 } }, "model.layers.4": { "accuracy": 0.9742113351821899, "total_bits": 697480224, "q_proj": { "group_size": { "4": 128 }, "bits": [ 4 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "k_proj": { "group_size": { "4": 128 }, "bits": [ 4 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "v_proj": { "group_size": { "4": 128 }, "bits": [ 4 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "o_proj": { "group_size": { "4": 128 }, "bits": [ 4 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "up_proj": { "group_size": { "4": 128 }, "bits": [ 4 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "gate_proj": { "group_size": { "4": 128 }, "bits": [ 4 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "down_proj": { "group_size": { "4": 128 }, "bits": [ 4 ], "bits_prop": [ 1 ], "scale_bits": 4 } }, "model.layers.5": { "accuracy": 0.9720273017883301, "total_bits": 697480224, "q_proj": { "group_size": { "4": 128 }, "bits": [ 4 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "k_proj": { "group_size": { "4": 128 }, "bits": [ 4 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "v_proj": { "group_size": { "4": 128 }, "bits": [ 4 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "o_proj": { "group_size": { "4": 128 }, "bits": [ 4 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "up_proj": { "group_size": { "4": 128 }, "bits": [ 4 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "gate_proj": { "group_size": { "4": 128 }, "bits": [ 4 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "down_proj": { "group_size": { "4": 128 }, "bits": [ 4 ], "bits_prop": [ 1 ], "scale_bits": 4 } }, "model.layers.6": { "accuracy": 0.9702110290527344, "total_bits": 697480224, "q_proj": { "group_size": { "4": 128 }, "bits": [ 4 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "k_proj": { "group_size": { "4": 128 }, "bits": [ 4 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "v_proj": { "group_size": { "4": 128 }, "bits": [ 4 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "o_proj": { "group_size": { "4": 128 }, "bits": [ 4 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "up_proj": { "group_size": { "4": 128 }, "bits": [ 4 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "gate_proj": { "group_size": { "4": 128 }, "bits": [ 4 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "down_proj": { "group_size": { "4": 128 }, "bits": [ 4 ], "bits_prop": [ 1 ], "scale_bits": 4 } }, "model.layers.7": { "accuracy": 0.9707947969436646, "total_bits": 697480224, "q_proj": { "group_size": { "4": 128 }, "bits": [ 4 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "k_proj": { "group_size": { "4": 128 }, "bits": [ 4 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "v_proj": { "group_size": { "4": 128 }, "bits": [ 4 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "o_proj": { "group_size": { "4": 128 }, "bits": [ 4 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "up_proj": { "group_size": { "4": 128 }, "bits": [ 4 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "gate_proj": { "group_size": { "4": 128 }, "bits": [ 4 ], "bits_prop": [ 1 ], "scale_bits": 4 }, "down_proj": { "group_size": { "4": 128 }, "bits": [ 4 ], "bits_prop": [ 1 ], "scale_bits": 4 } }, "model.layers.8": { "accuracy": 0.9378645420074463, "total_bits": 508736544, "q_proj": { "group_size": { "4": 128, "2": 128 }, "bits": [ 4, 2 ], "bits_prop": [ 0.25, 0.75 ], "scale_bits": 4 }, "k_proj": { "group_size": { "4": 128, "2": 128 }, "bits": [ 4, 2 ], "bits_prop": [ 0.25, 0.75 ], "scale_bits": 4 }, "v_proj": { "group_size": { "4": 128 }, "bits": [ 4 ], "bits_prop": [ 1.0 ], "scale_bits": 4 }, "o_proj": { "group_size": { "4": 128, "2": 128 }, "bits": [ 4, 2 ], "bits_prop": [ 0.25, 0.75 ], "scale_bits": 4 }, "up_proj": { "group_size": { "4": 128, "2": 128 }, "bits": [ 4, 2 ], "bits_prop": [ 0.25, 0.75 ], "scale_bits": 4 }, "gate_proj": { "group_size": { "4": 128, "2": 128 }, "bits": [ 4, 2 ], "bits_prop": [ 0.25, 0.75 ], "scale_bits": 4 }, "down_proj": { "group_size": { "4": 128 }, "bits": [ 4 ], "bits_prop": [ 1 ], "scale_bits": 4 } }, "model.layers.9": { "accuracy": 0.9572443962097168, "total_bits": 361673760, "q_proj": { "group_size": { "4": 128, "2": 128 }, "bits": [ 4, 2 ], "bits_prop": [ 0.01, 0.99 ], "scale_bits": 4 }, "k_proj": { "group_size": { "4": 128, "2": 128 }, "bits": [ 4, 2 ], "bits_prop": [ 0.01, 0.99 ], "scale_bits": 4 }, "v_proj": { "group_size": { "4": 128, "2": 128 }, "bits": [ 4, 2 ], "bits_prop": [ 0.05, 0.95 ], "scale_bits": 4 }, "o_proj": { "group_size": { "4": 128, "2": 128 }, "bits": [ 4, 2 ], "bits_prop": [ 0.02, 0.98 ], "scale_bits": 4 }, "up_proj": { "group_size": { "4": 128, "2": 128 }, "bits": [ 4, 2 ], "bits_prop": [ 0.01, 0.99 ], "scale_bits": 4 }, "gate_proj": { "group_size": { "4": 128, "2": 128 }, "bits": [ 4, 2 ], "bits_prop": [ 0.01, 0.99 ], "scale_bits": 4 }, "down_proj": { "group_size": { "4": 128, "2": 128 }, "bits": [ 4, 2 ], "bits_prop": [ 0.02, 0.98 ], "scale_bits": 4 } }, "model.layers.10": { "accuracy": 0.9557219743728638, "total_bits": 372683808, "q_proj": { "group_size": { "4": 128, "2": 128 }, "bits": [ 4, 2 ], "bits_prop": [ 0.05, 0.95 ], "scale_bits": 4 }, "k_proj": { "group_size": { "4": 128, "2": 128 }, "bits": [ 4, 2 ], "bits_prop": [ 0.05, 0.95 ], "scale_bits": 4 }, "v_proj": { "group_size": { "4": 128, "2": 128 }, "bits": [ 4, 2 ], "bits_prop": [ 0.05, 0.95 ], "scale_bits": 4 }, "o_proj": { "group_size": { "4": 128, "2": 128 }, "bits": [ 4, 2 ], "bits_prop": [ 0.05, 0.95 ], "scale_bits": 4 }, "up_proj": { "group_size": { "4": 128, "2": 128 }, "bits": [ 4, 2 ], "bits_prop": [ 0.05, 0.95 ], "scale_bits": 4 }, "gate_proj": { "group_size": { "4": 128, "2": 128 }, "bits": [ 4, 2 ], "bits_prop": [ 0.05, 0.95 ], "scale_bits": 4 }, "down_proj": { "group_size": { "4": 128, "2": 128 }, "bits": [ 4, 2 ], "bits_prop": [ 0.05, 0.95 ], "scale_bits": 4 } }, "model.layers.11": { "accuracy": 0.954809308052063, "total_bits": 405582880, "q_proj": { "group_size": { "4": 128, "2": 128 }, "bits": [ 4, 2 ], "bits_prop": [ 0.05, 0.95 ], "scale_bits": 4 }, "k_proj": { "group_size": { "4": 128, "2": 128 }, "bits": [ 4, 2 ], "bits_prop": [ 0.05, 0.95 ], "scale_bits": 4 }, "v_proj": { "group_size": { "4": 128, "2": 128 }, "bits": [ 4, 2 ], "bits_prop": [ 0.4, 0.6 ], "scale_bits": 4 }, "o_proj": { "group_size": { "4": 128, "2": 128 }, "bits": [ 4, 2 ], "bits_prop": [ 0.05, 0.95 ], "scale_bits": 4 }, "up_proj": { "group_size": { "4": 128, "2": 128 }, "bits": [ 4, 2 ], "bits_prop": [ 0.05, 0.95 ], "scale_bits": 4 }, "gate_proj": { "group_size": { "4": 128, "2": 128 }, "bits": [ 4, 2 ], "bits_prop": [ 0.05, 0.95 ], "scale_bits": 4 }, "down_proj": { "group_size": { "4": 128, "2": 128 }, "bits": [ 4, 2 ], "bits_prop": [ 0.4, 0.6 ], "scale_bits": 4 } }, "model.layers.12": { "accuracy": 0.9504133462905884, "total_bits": 405582880, "q_proj": { "group_size": { "4": 128, "2": 128 }, "bits": [ 4, 2 ], "bits_prop": [ 0.05, 0.95 ], "scale_bits": 4 }, "k_proj": { "group_size": { "4": 128, "2": 128 }, "bits": [ 4, 2 ], "bits_prop": [ 0.05, 0.95 ], "scale_bits": 4 }, "v_proj": { "group_size": { "4": 128, "2": 128 }, "bits": [ 4, 2 ], "bits_prop": [ 0.4, 0.6 ], "scale_bits": 4 }, "o_proj": { "group_size": { "4": 128, "2": 128 }, "bits": [ 4, 2 ], "bits_prop": [ 0.05, 0.95 ], "scale_bits": 4 }, "up_proj": { "group_size": { "4": 128, "2": 128 }, "bits": [ 4, 2 ], "bits_prop": [ 0.05, 0.95 ], "scale_bits": 4 }, "gate_proj": { "group_size": { "4": 128, "2": 128 }, "bits": [ 4, 2 ], "bits_prop": [ 0.05, 0.95 ], "scale_bits": 4 }, "down_proj": { "group_size": { "4": 128, "2": 128 }, "bits": [ 4, 2 ], "bits_prop": [ 0.4, 0.6 ], "scale_bits": 4 } }, "model.layers.13": { "accuracy": 0.9481167793273926, "total_bits": 405582880, "q_proj": { "group_size": { "4": 128, "2": 128 }, "bits": [ 4, 2 ], "bits_prop": [ 0.05, 0.95 ], "scale_bits": 4 }, "k_proj": { "group_size": { "4": 128, "2": 128 }, "bits": [ 4, 2 ], "bits_prop": [ 0.05, 0.95 ], "scale_bits": 4 }, "v_proj": { "group_size": { "4": 128, "2": 128 }, "bits": [ 4, 2 ], "bits_prop": [ 0.4, 0.6 ], "scale_bits": 4 }, "o_proj": { "group_size": { "4": 128, "2": 128 }, "bits": [ 4, 2 ], "bits_prop": [ 0.05, 0.95 ], "scale_bits": 4 }, "up_proj": { "group_size": { "4": 128, "2": 128 }, "bits": [ 4, 2 ], "bits_prop": [ 0.05, 0.95 ], "scale_bits": 4 }, "gate_proj": { "group_size": { "4": 128, "2": 128 }, "bits": [ 4, 2 ], "bits_prop": [ 0.05, 0.95 ], "scale_bits": 4 }, "down_proj": { "group_size": { "4": 128, "2": 128 }, "bits": [ 4, 2 ], "bits_prop": [ 0.4, 0.6 ], "scale_bits": 4 } }, "model.layers.14": { "accuracy": 0.9468015432357788, "total_bits": 405582880, "q_proj": { "group_size": { "4": 128, "2": 128 }, "bits": [ 4, 2 ], "bits_prop": [ 0.05, 0.95 ], "scale_bits": 4 }, "k_proj": { "group_size": { "4": 128, "2": 128 }, "bits": [ 4, 2 ], "bits_prop": [ 0.05, 0.95 ], "scale_bits": 4 }, "v_proj": { "group_size": { "4": 128, "2": 128 }, "bits": [ 4, 2 ], "bits_prop": [ 0.4, 0.6 ], "scale_bits": 4 }, "o_proj": { "group_size": { "4": 128, "2": 128 }, "bits": [ 4, 2 ], "bits_prop": [ 0.05, 0.95 ], "scale_bits": 4 }, "up_proj": { "group_size": { "4": 128, "2": 128 }, "bits": [ 4, 2 ], "bits_prop": [ 0.05, 0.95 ], "scale_bits": 4 }, "gate_proj": { "group_size": { "4": 128, "2": 128 }, "bits": [ 4, 2 ], "bits_prop": [ 0.05, 0.95 ], "scale_bits": 4 }, "down_proj": { "group_size": { "4": 128, "2": 128 }, "bits": [ 4, 2 ], "bits_prop": [ 0.4, 0.6 ], "scale_bits": 4 } }, "model.layers.15": { "accuracy": 0.9613559246063232, "total_bits": 508736544, "q_proj": { "group_size": { "4": 128, "2": 128 }, "bits": [ 4, 2 ], "bits_prop": [ 0.25, 0.75 ], "scale_bits": 4 }, "k_proj": { "group_size": { "4": 128, "2": 128 }, "bits": [ 4, 2 ], "bits_prop": [ 0.25, 0.75 ], "scale_bits": 4 }, "v_proj": { "group_size": { "4": 128 }, "bits": [ 4 ], "bits_prop": [ 1.0 ], "scale_bits": 4 }, "o_proj": { "group_size": { "4": 128, "2": 128 }, "bits": [ 4, 2 ], "bits_prop": [ 0.25, 0.75 ], "scale_bits": 4 }, "up_proj": { "group_size": { "4": 128, "2": 128 }, "bits": [ 4, 2 ], "bits_prop": [ 0.25, 0.75 ], "scale_bits": 4 }, "gate_proj": { "group_size": { "4": 128, "2": 128 }, "bits": [ 4, 2 ], "bits_prop": [ 0.25, 0.75 ], "scale_bits": 4 }, "down_proj": { "group_size": { "4": 128 }, "bits": [ 4 ], "bits_prop": [ 1 ], "scale_bits": 4 } }, "model.layers.16": { "accuracy": 0.960334300994873, "total_bits": 508736544, "q_proj": { "group_size": { "4": 128, "2": 128 }, "bits": [ 4, 2 ], "bits_prop": [ 0.25, 0.75 ], "scale_bits": 4 }, "k_proj": { "group_size": { "4": 128, "2": 128 }, "bits": [ 4, 2 ], "bits_prop": [ 0.25, 0.75 ], "scale_bits": 4 }, "v_proj": { "group_size": { "4": 128 }, "bits": [ 4 ], "bits_prop": [ 1.0 ], "scale_bits": 4 }, "o_proj": { "group_size": { "4": 128, "2": 128 }, "bits": [ 4, 2 ], "bits_prop": [ 0.25, 0.75 ], "scale_bits": 4 }, "up_proj": { "group_size": { "4": 128, "2": 128 }, "bits": [ 4, 2 ], "bits_prop": [ 0.25, 0.75 ], "scale_bits": 4 }, "gate_proj": { "group_size": { "4": 128, "2": 128 }, "bits": [ 4, 2 ], "bits_prop": [ 0.25, 0.75 ], "scale_bits": 4 }, "down_proj": { "group_size": { "4": 128 }, "bits": [ 4 ], "bits_prop": [ 1 ], "scale_bits": 4 } }, "model.layers.17": { "accuracy": 0.9556019306182861, "total_bits": 508736544, "q_proj": { "group_size": { "4": 128, "2": 128 }, "bits": [ 4, 2 ], "bits_prop": [ 0.25, 0.75 ], "scale_bits": 4 }, "k_proj": { "group_size": { "4": 128, "2": 128 }, "bits": [ 4, 2 ], "bits_prop": [ 0.25, 0.75 ], "scale_bits": 4 }, "v_proj": { "group_size": { "4": 128 }, "bits": [ 4 ], "bits_prop": [ 1.0 ], "scale_bits": 4 }, "o_proj": { "group_size": { "4": 128, "2": 128 }, "bits": [ 4, 2 ], "bits_prop": [ 0.25, 0.75 ], "scale_bits": 4 }, "up_proj": { "group_size": { "4": 128, "2": 128 }, "bits": [ 4, 2 ], "bits_prop": [ 0.25, 0.75 ], "scale_bits": 4 }, "gate_proj": { "group_size": { "4": 128, "2": 128 }, "bits": [ 4, 2 ], "bits_prop": [ 0.25, 0.75 ], "scale_bits": 4 }, "down_proj": { "group_size": { "4": 128 }, "bits": [ 4 ], "bits_prop": [ 1 ], "scale_bits": 4 } }, "model.layers.18": { "accuracy": 0.9482923746109009, "total_bits": 508736544, "q_proj": { "group_size": { "4": 128, "2": 128 }, "bits": [ 4, 2 ], "bits_prop": [ 0.25, 0.75 ], "scale_bits": 4 }, "k_proj": { "group_size": { "4": 128, "2": 128 }, "bits": [ 4, 2 ], "bits_prop": [ 0.25, 0.75 ], "scale_bits": 4 }, "v_proj": { "group_size": { "4": 128 }, "bits": [ 4 ], "bits_prop": [ 1.0 ], "scale_bits": 4 }, "o_proj": { "group_size": { "4": 128, "2": 128 }, "bits": [ 4, 2 ], "bits_prop": [ 0.25, 0.75 ], "scale_bits": 4 }, "up_proj": { "group_size": { "4": 128, "2": 128 }, "bits": [ 4, 2 ], "bits_prop": [ 0.25, 0.75 ], "scale_bits": 4 }, "gate_proj": { "group_size": { "4": 128, "2": 128 }, "bits": [ 4, 2 ], "bits_prop": [ 0.25, 0.75 ], "scale_bits": 4 }, "down_proj": { "group_size": { "4": 128 }, "bits": [ 4 ], "bits_prop": [ 1 ], "scale_bits": 4 } }, "model.layers.19": { "accuracy": 0.9474902153015137, "total_bits": 508736544, "q_proj": { "group_size": { "4": 128, "2": 128 }, "bits": [ 4, 2 ], "bits_prop": [ 0.25, 0.75 ], "scale_bits": 4 }, "k_proj": { "group_size": { "4": 128, "2": 128 }, "bits": [ 4, 2 ], "bits_prop": [ 0.25, 0.75 ], "scale_bits": 4 }, "v_proj": { "group_size": { "4": 128 }, "bits": [ 4 ], "bits_prop": [ 1.0 ], "scale_bits": 4 }, "o_proj": { "group_size": { "4": 128, "2": 128 }, "bits": [ 4, 2 ], "bits_prop": [ 0.25, 0.75 ], "scale_bits": 4 }, "up_proj": { "group_size": { "4": 128, "2": 128 }, "bits": [ 4, 2 ], "bits_prop": [ 0.25, 0.75 ], "scale_bits": 4 }, "gate_proj": { "group_size": { "4": 128, "2": 128 }, "bits": [ 4, 2 ], "bits_prop": [ 0.25, 0.75 ], "scale_bits": 4 }, "down_proj": { "group_size": { "4": 128 }, "bits": [ 4 ], "bits_prop": [ 1 ], "scale_bits": 4 } }, "model.layers.20": { "accuracy": 0.9444401264190674, "total_bits": 508736544, "q_proj": { "group_size": { "4": 128, "2": 128 }, "bits": [ 4, 2 ], "bits_prop": [ 0.25, 0.75 ], "scale_bits": 4 }, "k_proj": { "group_size": { "4": 128, "2": 128 }, "bits": [ 4, 2 ], "bits_prop": [ 0.25, 0.75 ], "scale_bits": 4 }, "v_proj": { "group_size": { "4": 128 }, "bits": [ 4 ], "bits_prop": [ 1.0 ], "scale_bits": 4 }, "o_proj": { "group_size": { "4": 128, "2": 128 }, "bits": [ 4, 2 ], "bits_prop": [ 0.25, 0.75 ], "scale_bits": 4 }, "up_proj": { "group_size": { "4": 128, "2": 128 }, "bits": [ 4, 2 ], "bits_prop": [ 0.25, 0.75 ], "scale_bits": 4 }, "gate_proj": { "group_size": { "4": 128, "2": 128 }, "bits": [ 4, 2 ], "bits_prop": [ 0.25, 0.75 ], "scale_bits": 4 }, "down_proj": { "group_size": { "4": 128 }, "bits": [ 4 ], "bits_prop": [ 1 ], "scale_bits": 4 } }, "model.layers.21": { "accuracy": 0.9444293975830078, "total_bits": 508736544, "q_proj": { "group_size": { "4": 128, "2": 128 }, "bits": [ 4, 2 ], "bits_prop": [ 0.25, 0.75 ], "scale_bits": 4 }, "k_proj": { "group_size": { "4": 128, "2": 128 }, "bits": [ 4, 2 ], "bits_prop": [ 0.25, 0.75 ], "scale_bits": 4 }, "v_proj": { "group_size": { "4": 128 }, "bits": [ 4 ], "bits_prop": [ 1.0 ], "scale_bits": 4 }, "o_proj": { "group_size": { "4": 128, "2": 128 }, "bits": [ 4, 2 ], "bits_prop": [ 0.25, 0.75 ], "scale_bits": 4 }, "up_proj": { "group_size": { "4": 128, "2": 128 }, "bits": [ 4, 2 ], "bits_prop": [ 0.25, 0.75 ], "scale_bits": 4 }, "gate_proj": { "group_size": { "4": 128, "2": 128 }, "bits": [ 4, 2 ], "bits_prop": [ 0.25, 0.75 ], "scale_bits": 4 }, "down_proj": { "group_size": { "4": 128 }, "bits": [ 4 ], "bits_prop": [ 1 ], "scale_bits": 4 } }, "model.layers.22": { "accuracy": 0.9623349905014038, "total_bits": 634565664, "q_proj": { "group_size": { "4": 128, "2": 128 }, "bits": [ 4, 2 ], "bits_prop": [ 0.75, 0.25 ], "scale_bits": 4 }, "k_proj": { "group_size": { "4": 128, "2": 128 }, "bits": [ 4, 2 ], "bits_prop": [ 0.75, 0.25 ], "scale_bits": 4 }, "v_proj": { "group_size": { "4": 128 }, "bits": [ 4 ], "bits_prop": [ 1.0 ], "scale_bits": 4 }, "o_proj": { "group_size": { "4": 128, "2": 128 }, "bits": [ 4, 2 ], "bits_prop": [ 0.75, 0.25 ], "scale_bits": 4 }, "up_proj": { "group_size": { "4": 128, "2": 128 }, "bits": [ 4, 2 ], "bits_prop": [ 0.75, 0.25 ], "scale_bits": 4 }, "gate_proj": { "group_size": { "4": 128, "2": 128 }, "bits": [ 4, 2 ], "bits_prop": [ 0.75, 0.25 ], "scale_bits": 4 }, "down_proj": { "group_size": { "4": 128 }, "bits": [ 4 ], "bits_prop": [ 1.0 ], "scale_bits": 4 } }, "model.layers.23": { "accuracy": 0.9492499828338623, "total_bits": 571651104, "q_proj": { "group_size": { "4": 128, "2": 128 }, "bits": [ 4, 2 ], "bits_prop": [ 0.5, 0.5 ], "scale_bits": 4 }, "k_proj": { "group_size": { "4": 128, "2": 128 }, "bits": [ 4, 2 ], "bits_prop": [ 0.5, 0.5 ], "scale_bits": 4 }, "v_proj": { "group_size": { "4": 128 }, "bits": [ 4 ], "bits_prop": [ 1.0 ], "scale_bits": 4 }, "o_proj": { "group_size": { "4": 128, "2": 128 }, "bits": [ 4, 2 ], "bits_prop": [ 0.5, 0.5 ], "scale_bits": 4 }, "up_proj": { "group_size": { "4": 128, "2": 128 }, "bits": [ 4, 2 ], "bits_prop": [ 0.5, 0.5 ], "scale_bits": 4 }, "gate_proj": { "group_size": { "4": 128, "2": 128 }, "bits": [ 4, 2 ], "bits_prop": [ 0.5, 0.5 ], "scale_bits": 4 }, "down_proj": { "group_size": { "4": 128 }, "bits": [ 4 ], "bits_prop": [ 1.0 ], "scale_bits": 4 } }, "model.layers.24": { "accuracy": 0.9491121768951416, "total_bits": 571651104, "q_proj": { "group_size": { "4": 128, "2": 128 }, "bits": [ 4, 2 ], "bits_prop": [ 0.5, 0.5 ], "scale_bits": 4 }, "k_proj": { "group_size": { "4": 128, "2": 128 }, "bits": [ 4, 2 ], "bits_prop": [ 0.5, 0.5 ], "scale_bits": 4 }, "v_proj": { "group_size": { "4": 128 }, "bits": [ 4 ], "bits_prop": [ 1.0 ], "scale_bits": 4 }, "o_proj": { "group_size": { "4": 128, "2": 128 }, "bits": [ 4, 2 ], "bits_prop": [ 0.5, 0.5 ], "scale_bits": 4 }, "up_proj": { "group_size": { "4": 128, "2": 128 }, "bits": [ 4, 2 ], "bits_prop": [ 0.5, 0.5 ], "scale_bits": 4 }, "gate_proj": { "group_size": { "4": 128, "2": 128 }, "bits": [ 4, 2 ], "bits_prop": [ 0.5, 0.5 ], "scale_bits": 4 }, "down_proj": { "group_size": { "4": 128 }, "bits": [ 4 ], "bits_prop": [ 1.0 ], "scale_bits": 4 } }, "model.layers.25": { "accuracy": 0.9408369064331055, "total_bits": 508736544, "q_proj": { "group_size": { "4": 128, "2": 128 }, "bits": [ 4, 2 ], "bits_prop": [ 0.25, 0.75 ], "scale_bits": 4 }, "k_proj": { "group_size": { "4": 128, "2": 128 }, "bits": [ 4, 2 ], "bits_prop": [ 0.25, 0.75 ], "scale_bits": 4 }, "v_proj": { "group_size": { "4": 128 }, "bits": [ 4 ], "bits_prop": [ 1.0 ], "scale_bits": 4 }, "o_proj": { "group_size": { "4": 128, "2": 128 }, "bits": [ 4, 2 ], "bits_prop": [ 0.25, 0.75 ], "scale_bits": 4 }, "up_proj": { "group_size": { "4": 128, "2": 128 }, "bits": [ 4, 2 ], "bits_prop": [ 0.25, 0.75 ], "scale_bits": 4 }, "gate_proj": { "group_size": { "4": 128, "2": 128 }, "bits": [ 4, 2 ], "bits_prop": [ 0.25, 0.75 ], "scale_bits": 4 }, "down_proj": { "group_size": { "4": 128 }, "bits": [ 4 ], "bits_prop": [ 1 ], "scale_bits": 4 } }, "model.layers.26": { "accuracy": 0.9524426460266113, "total_bits": 571651104, "q_proj": { "group_size": { "4": 128, "2": 128 }, "bits": [ 4, 2 ], "bits_prop": [ 0.5, 0.5 ], "scale_bits": 4 }, "k_proj": { "group_size": { "4": 128, "2": 128 }, "bits": [ 4, 2 ], "bits_prop": [ 0.5, 0.5 ], "scale_bits": 4 }, "v_proj": { "group_size": { "4": 128 }, "bits": [ 4 ], "bits_prop": [ 1.0 ], "scale_bits": 4 }, "o_proj": { "group_size": { "4": 128, "2": 128 }, "bits": [ 4, 2 ], "bits_prop": [ 0.5, 0.5 ], "scale_bits": 4 }, "up_proj": { "group_size": { "4": 128, "2": 128 }, "bits": [ 4, 2 ], "bits_prop": [ 0.5, 0.5 ], "scale_bits": 4 }, "gate_proj": { "group_size": { "4": 128, "2": 128 }, "bits": [ 4, 2 ], "bits_prop": [ 0.5, 0.5 ], "scale_bits": 4 }, "down_proj": { "group_size": { "4": 128 }, "bits": [ 4 ], "bits_prop": [ 1.0 ], "scale_bits": 4 } }, "model.layers.27": { "accuracy": 0.9414148330688477, "total_bits": 508736544, "q_proj": { "group_size": { "4": 128, "2": 128 }, "bits": [ 4, 2 ], "bits_prop": [ 0.25, 0.75 ], "scale_bits": 4 }, "k_proj": { "group_size": { "4": 128, "2": 128 }, "bits": [ 4, 2 ], "bits_prop": [ 0.25, 0.75 ], "scale_bits": 4 }, "v_proj": { "group_size": { "4": 128 }, "bits": [ 4 ], "bits_prop": [ 1.0 ], "scale_bits": 4 }, "o_proj": { "group_size": { "4": 128, "2": 128 }, "bits": [ 4, 2 ], "bits_prop": [ 0.25, 0.75 ], "scale_bits": 4 }, "up_proj": { "group_size": { "4": 128, "2": 128 }, "bits": [ 4, 2 ], "bits_prop": [ 0.25, 0.75 ], "scale_bits": 4 }, "gate_proj": { "group_size": { "4": 128, "2": 128 }, "bits": [ 4, 2 ], "bits_prop": [ 0.25, 0.75 ], "scale_bits": 4 }, "down_proj": { "group_size": { "4": 128 }, "bits": [ 4 ], "bits_prop": [ 1 ], "scale_bits": 4 } }, "model.layers.28": { "accuracy": 0.9438059329986572, "total_bits": 508736544, "q_proj": { "group_size": { "4": 128, "2": 128 }, "bits": [ 4, 2 ], "bits_prop": [ 0.25, 0.75 ], "scale_bits": 4 }, "k_proj": { "group_size": { "4": 128, "2": 128 }, "bits": [ 4, 2 ], "bits_prop": [ 0.25, 0.75 ], "scale_bits": 4 }, "v_proj": { "group_size": { "4": 128 }, "bits": [ 4 ], "bits_prop": [ 1.0 ], "scale_bits": 4 }, "o_proj": { "group_size": { "4": 128, "2": 128 }, "bits": [ 4, 2 ], "bits_prop": [ 0.25, 0.75 ], "scale_bits": 4 }, "up_proj": { "group_size": { "4": 128, "2": 128 }, "bits": [ 4, 2 ], "bits_prop": [ 0.25, 0.75 ], "scale_bits": 4 }, "gate_proj": { "group_size": { "4": 128, "2": 128 }, "bits": [ 4, 2 ], "bits_prop": [ 0.25, 0.75 ], "scale_bits": 4 }, "down_proj": { "group_size": { "4": 128 }, "bits": [ 4 ], "bits_prop": [ 1 ], "scale_bits": 4 } }, "model.layers.29": { "accuracy": 0.9475662708282471, "total_bits": 508736544, "q_proj": { "group_size": { "4": 128, "2": 128 }, "bits": [ 4, 2 ], "bits_prop": [ 0.25, 0.75 ], "scale_bits": 4 }, "k_proj": { "group_size": { "4": 128, "2": 128 }, "bits": [ 4, 2 ], "bits_prop": [ 0.25, 0.75 ], "scale_bits": 4 }, "v_proj": { "group_size": { "4": 128 }, "bits": [ 4 ], "bits_prop": [ 1.0 ], "scale_bits": 4 }, "o_proj": { "group_size": { "4": 128, "2": 128 }, "bits": [ 4, 2 ], "bits_prop": [ 0.25, 0.75 ], "scale_bits": 4 }, "up_proj": { "group_size": { "4": 128, "2": 128 }, "bits": [ 4, 2 ], "bits_prop": [ 0.25, 0.75 ], "scale_bits": 4 }, "gate_proj": { "group_size": { "4": 128, "2": 128 }, "bits": [ 4, 2 ], "bits_prop": [ 0.25, 0.75 ], "scale_bits": 4 }, "down_proj": { "group_size": { "4": 128 }, "bits": [ 4 ], "bits_prop": [ 1 ], "scale_bits": 4 } }, "model.layers.30": { "accuracy": 0.9529297351837158, "total_bits": 508736544, "q_proj": { "group_size": { "4": 128, "2": 128 }, "bits": [ 4, 2 ], "bits_prop": [ 0.25, 0.75 ], "scale_bits": 4 }, "k_proj": { "group_size": { "4": 128, "2": 128 }, "bits": [ 4, 2 ], "bits_prop": [ 0.25, 0.75 ], "scale_bits": 4 }, "v_proj": { "group_size": { "4": 128 }, "bits": [ 4 ], "bits_prop": [ 1.0 ], "scale_bits": 4 }, "o_proj": { "group_size": { "4": 128, "2": 128 }, "bits": [ 4, 2 ], "bits_prop": [ 0.25, 0.75 ], "scale_bits": 4 }, "up_proj": { "group_size": { "4": 128, "2": 128 }, "bits": [ 4, 2 ], "bits_prop": [ 0.25, 0.75 ], "scale_bits": 4 }, "gate_proj": { "group_size": { "4": 128, "2": 128 }, "bits": [ 4, 2 ], "bits_prop": [ 0.25, 0.75 ], "scale_bits": 4 }, "down_proj": { "group_size": { "4": 128 }, "bits": [ 4 ], "bits_prop": [ 1 ], "scale_bits": 4 } }, "model.layers.31": { "accuracy": 0.9391093254089355, "total_bits": 508736544, "q_proj": { "group_size": { "4": 128, "2": 128 }, "bits": [ 4, 2 ], "bits_prop": [ 0.25, 0.75 ], "scale_bits": 4 }, "k_proj": { "group_size": { "4": 128, "2": 128 }, "bits": [ 4, 2 ], "bits_prop": [ 0.25, 0.75 ], "scale_bits": 4 }, "v_proj": { "group_size": { "4": 128 }, "bits": [ 4 ], "bits_prop": [ 1.0 ], "scale_bits": 4 }, "o_proj": { "group_size": { "4": 128, "2": 128 }, "bits": [ 4, 2 ], "bits_prop": [ 0.25, 0.75 ], "scale_bits": 4 }, "up_proj": { "group_size": { "4": 128, "2": 128 }, "bits": [ 4, 2 ], "bits_prop": [ 0.25, 0.75 ], "scale_bits": 4 }, "gate_proj": { "group_size": { "4": 128, "2": 128 }, "bits": [ 4, 2 ], "bits_prop": [ 0.25, 0.75 ], "scale_bits": 4 }, "down_proj": { "group_size": { "4": 128 }, "bits": [ 4 ], "bits_prop": [ 1 ], "scale_bits": 4 } } } }