{ "last_module_idx": 66, "measurement": { "lm_head.linear": null, "model.layers.0.mlp": [ { "accuracy": 0.8730959892272949, "down_proj": { "bits": [ 6, 3, 2 ], "bits_prop": [ 0.05, 0.2, 0.75 ], "group_size": { "2": 64, "3": 64, "6": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 395461696, "up_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.8765948822623805, "down_proj": { "bits": [ 6, 3, 2 ], "bits_prop": [ 0.05, 0.2, 0.75 ], "group_size": { "2": 64, "3": 64, "6": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 409224256, "up_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9008018468555651, "down_proj": { "bits": [ 5, 3 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "3": 32, "5": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 457272320, "up_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.3, 0.7 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9091151325326217, "down_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 512977920, "up_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.3, 0.7 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9383227511456138, "down_proj": { "bits": [ 8, 4, 3 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "3": 128, "4": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "total_bits": 578397280, "up_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9430453024412456, "down_proj": { "bits": [ 8, 4, 3 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "3": 32, "4": 32, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 32, "4": 32 }, "scale_bits": 4 }, "total_bits": 592872448, "up_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "3": 32, "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9541262105891579, "down_proj": { "bits": [ 8, 4 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "4": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 32, "4": 32 }, "scale_bits": 4 }, "total_bits": 637454432, "up_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "3": 32, "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.967287330250991, "down_proj": { "bits": [ 8, 4 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "4": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "total_bits": 728741472, "up_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9705746393454703, "down_proj": { "bits": [ 8, 4 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "4": 32, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 }, "total_bits": 739476480, "up_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9686516084169087, "down_proj": { "bits": [ 8, 5, 4 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "4": 128, "5": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 128, "5": 128 }, "scale_bits": 4 }, "total_bits": 751543392, "up_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "4": 128, "5": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9724578041779367, "down_proj": { "bits": [ 8, 5, 4 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "4": 32, "5": 32, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 }, "total_bits": 766018560, "up_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9839151925162265, "down_proj": { "bits": [ 8, 6, 5 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "5": 128, "6": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 128, "6": 128 }, "scale_bits": 4 }, "total_bits": 924689504, "up_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "5": 128, "6": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9862229855437028, "down_proj": { "bits": [ 8, 6, 5 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "5": 32, "6": 32, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 32, "6": 32 }, "scale_bits": 4 }, "total_bits": 939164672, "up_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "5": 32, "6": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9911635784726394, "down_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "6": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 }, "total_bits": 1069524064, "up_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 } }, { "accuracy": 0.991809930456312, "down_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.15, 0.85 ], "group_size": { "6": 128, "8": 128 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "6": 128, "8": 128 }, "scale_bits": 4 }, "total_bits": 1110384896, "up_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "6": 128, "8": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9943504980520198, "down_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "6": 128, "8": 128 }, "scale_bits": 4 }, "total_bits": 1209999616, "up_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "6": 128, "8": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9975439762990725, "down_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "total_bits": 1415520512, "up_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 } } ], "model.layers.0.self_attn": [ { "accuracy": 0.8612700261567768, "k_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 89665536, "v_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.8801858550623843, "k_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 92221440, "v_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.8964802340457314, "k_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 95758848, "v_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9275430315419247, "k_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 112272384, "v_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9324118526358354, "k_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "total_bits": 132913152, "v_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 } }, { "accuracy": 0.936788000558552, "k_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "total_bits": 132980224, "v_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 64, "4": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9488437646313718, "k_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "total_bits": 169613312, "v_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9539904186600133, "k_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "total_bits": 169745920, "v_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 64 }, "scale_bits": 4 } }, { "accuracy": 0.95904982403705, "k_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 64 }, "scale_bits": 4 }, "total_bits": 171195392, "v_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9602722902047007, "k_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 }, "total_bits": 173563904, "v_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9684275137750726, "k_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 128, "5": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 128, "5": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 128, "5": 128 }, "scale_bits": 4 }, "total_bits": 174923264, "v_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9708843701764157, "k_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "total_bits": 175750144, "v_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9720264077186584, "k_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "total_bits": 179253248, "v_proj": { "bits": [ 5 ], "bits_prop": [ 1 ], "group_size": { "5": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9750477028520483, "k_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 }, "o_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 }, "q_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 }, "total_bits": 181592064, "v_proj": { "bits": [ 5 ], "bits_prop": [ 1 ], "group_size": { "5": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9844950923794195, "k_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 128, "6": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 128, "6": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 128, "6": 128 }, "scale_bits": 4 }, "total_bits": 220469248, "v_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9873687522976022, "k_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 32, "6": 32 }, "scale_bits": 4 }, "o_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 32, "6": 32 }, "scale_bits": 4 }, "q_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 32, "6": 32 }, "scale_bits": 4 }, "total_bits": 223535104, "v_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9874392010663685, "k_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 }, "total_bits": 253499392, "v_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9930800646543503, "k_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 32 }, "scale_bits": 4 }, "o_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 32 }, "scale_bits": 4 }, "q_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 32 }, "scale_bits": 4 }, "total_bits": 265838592, "v_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9966272558820876, "k_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "total_bits": 337385472, "v_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 } } ], "model.layers.1.mlp": [ { "accuracy": 0.921179263215316, "down_proj": { "bits": [ 6, 3, 2 ], "bits_prop": [ 0.05, 0.2, 0.75 ], "group_size": { "2": 64, "3": 64, "6": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 395461696, "up_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9251238986065513, "down_proj": { "bits": [ 6, 3, 2 ], "bits_prop": [ 0.05, 0.2, 0.75 ], "group_size": { "2": 64, "3": 64, "6": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 409224256, "up_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9440461334429289, "down_proj": { "bits": [ 5, 3 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "3": 32, "5": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 457272320, "up_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.3, 0.7 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9526504905600297, "down_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 512977920, "up_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.3, 0.7 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9602508921372264, "down_proj": { "bits": [ 8, 4, 3 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "3": 128, "4": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "total_bits": 578397280, "up_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9633890327654386, "down_proj": { "bits": [ 8, 4, 3 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "3": 32, "4": 32, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 32, "4": 32 }, "scale_bits": 4 }, "total_bits": 592872448, "up_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "3": 32, "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9730549329205563, "down_proj": { "bits": [ 8, 4 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "4": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 32, "4": 32 }, "scale_bits": 4 }, "total_bits": 637454432, "up_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "3": 32, "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9778280760112562, "down_proj": { "bits": [ 8, 4 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "4": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "total_bits": 728741472, "up_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9804605982805553, "down_proj": { "bits": [ 8, 4 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "4": 32, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 }, "total_bits": 739476480, "up_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9794345498085022, "down_proj": { "bits": [ 8, 5, 4 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "4": 128, "5": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 128, "5": 128 }, "scale_bits": 4 }, "total_bits": 751543392, "up_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "4": 128, "5": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9818635724092785, "down_proj": { "bits": [ 8, 5, 4 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "4": 32, "5": 32, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 }, "total_bits": 766018560, "up_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9892690675823312, "down_proj": { "bits": [ 8, 6, 5 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "5": 128, "6": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 128, "6": 128 }, "scale_bits": 4 }, "total_bits": 924689504, "up_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "5": 128, "6": 128 }, "scale_bits": 4 } }, { "accuracy": 0.990749152083146, "down_proj": { "bits": [ 8, 6, 5 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "5": 32, "6": 32, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 32, "6": 32 }, "scale_bits": 4 }, "total_bits": 939164672, "up_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "5": 32, "6": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9938022353147206, "down_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "6": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 }, "total_bits": 1069524064, "up_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9944066299419654, "down_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.15, 0.85 ], "group_size": { "6": 128, "8": 128 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "6": 128, "8": 128 }, "scale_bits": 4 }, "total_bits": 1110384896, "up_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "6": 128, "8": 128 }, "scale_bits": 4 } }, { "accuracy": 0.996457904969391, "down_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "6": 128, "8": 128 }, "scale_bits": 4 }, "total_bits": 1209999616, "up_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "6": 128, "8": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9976953624894744, "down_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "total_bits": 1415520512, "up_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 } } ], "model.layers.1.self_attn": [ { "accuracy": 0.8895263295424611, "k_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 89665536, "v_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.8989138477726987, "k_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 92221440, "v_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9080119697671187, "k_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 95758848, "v_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9444709577058491, "k_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 112272384, "v_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9459643928628219, "k_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "total_bits": 132913152, "v_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9472815488514147, "k_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "total_bits": 132980224, "v_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 64, "4": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9646844958004198, "k_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "total_bits": 169613312, "v_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9667092624463534, "k_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "total_bits": 169745920, "v_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9688348864254198, "k_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 64 }, "scale_bits": 4 }, "total_bits": 171195392, "v_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9703405468087447, "k_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 }, "total_bits": 173563904, "v_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.972328637775622, "k_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 128, "5": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 128, "5": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 128, "5": 128 }, "scale_bits": 4 }, "total_bits": 174923264, "v_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9737888056980936, "k_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "total_bits": 175750144, "v_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9751590082519933, "k_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "total_bits": 179253248, "v_proj": { "bits": [ 5 ], "bits_prop": [ 1 ], "group_size": { "5": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9769504493788669, "k_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 }, "o_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 }, "q_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 }, "total_bits": 181592064, "v_proj": { "bits": [ 5 ], "bits_prop": [ 1 ], "group_size": { "5": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9861624287931543, "k_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 128, "6": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 128, "6": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 128, "6": 128 }, "scale_bits": 4 }, "total_bits": 220469248, "v_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9882780823268389, "k_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 32, "6": 32 }, "scale_bits": 4 }, "o_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 32, "6": 32 }, "scale_bits": 4 }, "q_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 32, "6": 32 }, "scale_bits": 4 }, "total_bits": 223535104, "v_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9901950657367706, "k_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 }, "total_bits": 253499392, "v_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9939727481258543, "k_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 32 }, "scale_bits": 4 }, "o_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 32 }, "scale_bits": 4 }, "q_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 32 }, "scale_bits": 4 }, "total_bits": 265838592, "v_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9973834441288522, "k_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "total_bits": 337385472, "v_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 } } ], "model.layers.10.mlp": [ { "accuracy": 0.9849354107128946, "down_proj": { "bits": [ 6, 3, 2 ], "bits_prop": [ 0.05, 0.2, 0.75 ], "group_size": { "2": 64, "3": 64, "6": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 395461696, "up_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9853180317502273, "down_proj": { "bits": [ 6, 3, 2 ], "bits_prop": [ 0.05, 0.2, 0.75 ], "group_size": { "2": 64, "3": 64, "6": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 409224256, "up_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.987446674390843, "down_proj": { "bits": [ 5, 3 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "3": 32, "5": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 457272320, "up_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.3, 0.7 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9880191848466271, "down_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 512977920, "up_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.3, 0.7 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9924242810199135, "down_proj": { "bits": [ 8, 4, 3 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "3": 128, "4": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "total_bits": 578397280, "up_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 } }, { "accuracy": 0.993029302672336, "down_proj": { "bits": [ 8, 4, 3 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "3": 32, "4": 32, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 32, "4": 32 }, "scale_bits": 4 }, "total_bits": 592872448, "up_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "3": 32, "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9938914732713449, "down_proj": { "bits": [ 8, 4 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "4": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 32, "4": 32 }, "scale_bits": 4 }, "total_bits": 637454432, "up_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "3": 32, "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9960943005586925, "down_proj": { "bits": [ 8, 4 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "4": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "total_bits": 728741472, "up_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9964303766426287, "down_proj": { "bits": [ 8, 4 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "4": 32, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 }, "total_bits": 739476480, "up_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9961118329512445, "down_proj": { "bits": [ 8, 5, 4 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "4": 128, "5": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 128, "5": 128 }, "scale_bits": 4 }, "total_bits": 751543392, "up_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "4": 128, "5": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9965932667255402, "down_proj": { "bits": [ 8, 5, 4 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "4": 32, "5": 32, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 }, "total_bits": 766018560, "up_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9979988258135947, "down_proj": { "bits": [ 8, 6, 5 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "5": 128, "6": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 128, "6": 128 }, "scale_bits": 4 }, "total_bits": 924689504, "up_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "5": 128, "6": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9982863278373292, "down_proj": { "bits": [ 8, 6, 5 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "5": 32, "6": 32, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 32, "6": 32 }, "scale_bits": 4 }, "total_bits": 939164672, "up_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "5": 32, "6": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9989109550063547, "down_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "6": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 }, "total_bits": 1069524064, "up_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9989581531599948, "down_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.15, 0.85 ], "group_size": { "6": 128, "8": 128 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "6": 128, "8": 128 }, "scale_bits": 4 }, "total_bits": 1110384896, "up_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "6": 128, "8": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9991326865397001, "down_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "6": 128, "8": 128 }, "scale_bits": 4 }, "total_bits": 1209999616, "up_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "6": 128, "8": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9996643284776885, "down_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "total_bits": 1415520512, "up_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 } } ], "model.layers.10.self_attn": [ { "accuracy": 0.9771387059437601, "k_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 89665536, "v_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9778942277556971, "k_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 92221440, "v_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9835380551062132, "k_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 95758848, "v_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9884021564533836, "k_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 112272384, "v_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9887103642288008, "k_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "total_bits": 132913152, "v_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 } }, { "accuracy": 0.988973656767293, "k_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "total_bits": 132980224, "v_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 64, "4": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9939168789669087, "k_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "total_bits": 169613312, "v_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9942014703625127, "k_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "total_bits": 169745920, "v_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9946116346277689, "k_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 64 }, "scale_bits": 4 }, "total_bits": 171195392, "v_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9947829842567444, "k_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 }, "total_bits": 173563904, "v_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9944499338928022, "k_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 128, "5": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 128, "5": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 128, "5": 128 }, "scale_bits": 4 }, "total_bits": 174923264, "v_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9948025173262546, "k_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "total_bits": 175750144, "v_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9959197048293916, "k_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "total_bits": 179253248, "v_proj": { "bits": [ 5 ], "bits_prop": [ 1 ], "group_size": { "5": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9962523932519712, "k_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 }, "o_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 }, "q_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 }, "total_bits": 181592064, "v_proj": { "bits": [ 5 ], "bits_prop": [ 1 ], "group_size": { "5": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9977493497886156, "k_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 128, "6": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 128, "6": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 128, "6": 128 }, "scale_bits": 4 }, "total_bits": 220469248, "v_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9981071756858575, "k_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 32, "6": 32 }, "scale_bits": 4 }, "o_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 32, "6": 32 }, "scale_bits": 4 }, "q_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 32, "6": 32 }, "scale_bits": 4 }, "total_bits": 223535104, "v_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9983996254833121, "k_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 }, "total_bits": 253499392, "v_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9991033832101446, "k_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 32 }, "scale_bits": 4 }, "o_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 32 }, "scale_bits": 4 }, "q_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 32 }, "scale_bits": 4 }, "total_bits": 265838592, "v_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9995300099743825, "k_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "total_bits": 337385472, "v_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 } } ], "model.layers.11.mlp": [ { "accuracy": 0.9859543427040702, "down_proj": { "bits": [ 6, 3, 2 ], "bits_prop": [ 0.05, 0.2, 0.75 ], "group_size": { "2": 64, "3": 64, "6": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 395461696, "up_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9862959212378452, "down_proj": { "bits": [ 6, 3, 2 ], "bits_prop": [ 0.05, 0.2, 0.75 ], "group_size": { "2": 64, "3": 64, "6": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 409224256, "up_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9882800014395463, "down_proj": { "bits": [ 5, 3 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "3": 32, "5": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 457272320, "up_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.3, 0.7 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9888158636657816, "down_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 512977920, "up_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.3, 0.7 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9928998860873675, "down_proj": { "bits": [ 8, 4, 3 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "3": 128, "4": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "total_bits": 578397280, "up_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 } }, { "accuracy": 0.993491740603196, "down_proj": { "bits": [ 8, 4, 3 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "3": 32, "4": 32, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 32, "4": 32 }, "scale_bits": 4 }, "total_bits": 592872448, "up_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "3": 32, "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9942958696108115, "down_proj": { "bits": [ 8, 4 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "4": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 32, "4": 32 }, "scale_bits": 4 }, "total_bits": 637454432, "up_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "3": 32, "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9963369577338821, "down_proj": { "bits": [ 8, 4 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "4": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "total_bits": 728741472, "up_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9966613093489095, "down_proj": { "bits": [ 8, 4 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "4": 32, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 }, "total_bits": 739476480, "up_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9963486073048491, "down_proj": { "bits": [ 8, 5, 4 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "4": 128, "5": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 128, "5": 128 }, "scale_bits": 4 }, "total_bits": 751543392, "up_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "4": 128, "5": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9968122039970598, "down_proj": { "bits": [ 8, 5, 4 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "4": 32, "5": 32, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 }, "total_bits": 766018560, "up_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 } }, { "accuracy": 0.998116803404532, "down_proj": { "bits": [ 8, 6, 5 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "5": 128, "6": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 128, "6": 128 }, "scale_bits": 4 }, "total_bits": 924689504, "up_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "5": 128, "6": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9983931272045562, "down_proj": { "bits": [ 8, 6, 5 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "5": 32, "6": 32, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 32, "6": 32 }, "scale_bits": 4 }, "total_bits": 939164672, "up_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "5": 32, "6": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9989744676767212, "down_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "6": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 }, "total_bits": 1069524064, "up_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9990163237640732, "down_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.15, 0.85 ], "group_size": { "6": 128, "8": 128 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "6": 128, "8": 128 }, "scale_bits": 4 }, "total_bits": 1110384896, "up_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "6": 128, "8": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9991798620965135, "down_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "6": 128, "8": 128 }, "scale_bits": 4 }, "total_bits": 1209999616, "up_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "6": 128, "8": 128 }, "scale_bits": 4 } }, { "accuracy": 0.999680617530095, "down_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "total_bits": 1415520512, "up_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 } } ], "model.layers.11.self_attn": [ { "accuracy": 0.9796387317933535, "k_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 89665536, "v_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.980279803276062, "k_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 92221440, "v_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9855955525448448, "k_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 95758848, "v_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9895809402591303, "k_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 112272384, "v_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9898469887281719, "k_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "total_bits": 132913152, "v_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 } }, { "accuracy": 0.990122106514479, "k_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "total_bits": 132980224, "v_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 64, "4": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9945248933999162, "k_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "total_bits": 169613312, "v_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9947771265318519, "k_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "total_bits": 169745920, "v_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9951673334366397, "k_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 64 }, "scale_bits": 4 }, "total_bits": 171195392, "v_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9953059373717559, "k_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 }, "total_bits": 173563904, "v_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9949972394265627, "k_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 128, "5": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 128, "5": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 128, "5": 128 }, "scale_bits": 4 }, "total_bits": 174923264, "v_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9953392191152823, "k_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "total_bits": 175750144, "v_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9964303393897257, "k_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "total_bits": 179253248, "v_proj": { "bits": [ 5 ], "bits_prop": [ 1 ], "group_size": { "5": 64 }, "scale_bits": 4 } }, { "accuracy": 0.996719733664864, "k_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 }, "o_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 }, "q_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 }, "total_bits": 181592064, "v_proj": { "bits": [ 5 ], "bits_prop": [ 1 ], "group_size": { "5": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9980387871986941, "k_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 128, "6": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 128, "6": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 128, "6": 128 }, "scale_bits": 4 }, "total_bits": 220469248, "v_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9983452495775724, "k_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 32, "6": 32 }, "scale_bits": 4 }, "o_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 32, "6": 32 }, "scale_bits": 4 }, "q_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 32, "6": 32 }, "scale_bits": 4 }, "total_bits": 223535104, "v_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 32 }, "scale_bits": 4 } }, { "accuracy": 0.998566523390381, "k_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 }, "total_bits": 253499392, "v_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9992265873343537, "k_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 32 }, "scale_bits": 4 }, "o_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 32 }, "scale_bits": 4 }, "q_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 32 }, "scale_bits": 4 }, "total_bits": 265838592, "v_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 32 }, "scale_bits": 4 } }, { "accuracy": 0.999575499396183, "k_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "total_bits": 337385472, "v_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 } } ], "model.layers.12.mlp": [ { "accuracy": 0.9870107487628335, "down_proj": { "bits": [ 6, 3, 2 ], "bits_prop": [ 0.05, 0.2, 0.75 ], "group_size": { "2": 64, "3": 64, "6": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 395461696, "up_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9873435144361696, "down_proj": { "bits": [ 6, 3, 2 ], "bits_prop": [ 0.05, 0.2, 0.75 ], "group_size": { "2": 64, "3": 64, "6": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 409224256, "up_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9891195665848883, "down_proj": { "bits": [ 5, 3 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "3": 32, "5": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 457272320, "up_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.3, 0.7 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9896084085891121, "down_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 512977920, "up_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.3, 0.7 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.993410565351185, "down_proj": { "bits": [ 8, 4, 3 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "3": 128, "4": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "total_bits": 578397280, "up_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9939762161750543, "down_proj": { "bits": [ 8, 4, 3 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "3": 32, "4": 32, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 32, "4": 32 }, "scale_bits": 4 }, "total_bits": 592872448, "up_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "3": 32, "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9946996499049036, "down_proj": { "bits": [ 8, 4 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "4": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 32, "4": 32 }, "scale_bits": 4 }, "total_bits": 637454432, "up_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "3": 32, "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.996606760119137, "down_proj": { "bits": [ 8, 4 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "4": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "total_bits": 728741472, "up_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9968994965678767, "down_proj": { "bits": [ 8, 4 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "4": 32, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 }, "total_bits": 739476480, "up_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9965946599841118, "down_proj": { "bits": [ 8, 5, 4 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "4": 128, "5": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 128, "5": 128 }, "scale_bits": 4 }, "total_bits": 751543392, "up_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "4": 128, "5": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9970486691515696, "down_proj": { "bits": [ 8, 5, 4 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "4": 32, "5": 32, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 }, "total_bits": 766018560, "up_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 } }, { "accuracy": 0.998242580184811, "down_proj": { "bits": [ 8, 6, 5 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "5": 128, "6": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 128, "6": 128 }, "scale_bits": 4 }, "total_bits": 924689504, "up_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "5": 128, "6": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9985055241145586, "down_proj": { "bits": [ 8, 6, 5 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "5": 32, "6": 32, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 32, "6": 32 }, "scale_bits": 4 }, "total_bits": 939164672, "up_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "5": 32, "6": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9990344101465062, "down_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "6": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 }, "total_bits": 1069524064, "up_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9990775612624068, "down_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.15, 0.85 ], "group_size": { "6": 128, "8": 128 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "6": 128, "8": 128 }, "scale_bits": 4 }, "total_bits": 1110384896, "up_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "6": 128, "8": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9992230173788572, "down_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "6": 128, "8": 128 }, "scale_bits": 4 }, "total_bits": 1209999616, "up_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "6": 128, "8": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9996897902976918, "down_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "total_bits": 1415520512, "up_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 } } ], "model.layers.12.self_attn": [ { "accuracy": 0.9794774667212838, "k_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 89665536, "v_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9802057241138659, "k_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 92221440, "v_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9853892232242384, "k_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 95758848, "v_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9894587609328722, "k_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 112272384, "v_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9898038459451575, "k_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "total_bits": 132913152, "v_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9900459882460142, "k_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "total_bits": 132980224, "v_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 64, "4": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9944545120785111, "k_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "total_bits": 169613312, "v_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9947199327381033, "k_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "total_bits": 169745920, "v_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9951626203562084, "k_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 64 }, "scale_bits": 4 }, "total_bits": 171195392, "v_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9952975052751993, "k_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 }, "total_bits": 173563904, "v_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9949743877116003, "k_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 128, "5": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 128, "5": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 128, "5": 128 }, "scale_bits": 4 }, "total_bits": 174923264, "v_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9953298066791735, "k_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "total_bits": 175750144, "v_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9964052172083604, "k_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "total_bits": 179253248, "v_proj": { "bits": [ 5 ], "bits_prop": [ 1 ], "group_size": { "5": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9967132371507192, "k_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 }, "o_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 }, "q_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 }, "total_bits": 181592064, "v_proj": { "bits": [ 5 ], "bits_prop": [ 1 ], "group_size": { "5": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9980125244902937, "k_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 128, "6": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 128, "6": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 128, "6": 128 }, "scale_bits": 4 }, "total_bits": 220469248, "v_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9983352761911718, "k_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 32, "6": 32 }, "scale_bits": 4 }, "o_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 32, "6": 32 }, "scale_bits": 4 }, "q_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 32, "6": 32 }, "scale_bits": 4 }, "total_bits": 223535104, "v_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9985426062423932, "k_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 }, "total_bits": 253499392, "v_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9992257214004272, "k_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 32 }, "scale_bits": 4 }, "o_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 32 }, "scale_bits": 4 }, "q_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 32 }, "scale_bits": 4 }, "total_bits": 265838592, "v_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9995722048670838, "k_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "total_bits": 337385472, "v_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 } } ], "model.layers.13.mlp": [ { "accuracy": 0.987623354322032, "down_proj": { "bits": [ 6, 3, 2 ], "bits_prop": [ 0.05, 0.2, 0.75 ], "group_size": { "2": 64, "3": 64, "6": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 395461696, "up_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9879512151605204, "down_proj": { "bits": [ 6, 3, 2 ], "bits_prop": [ 0.05, 0.2, 0.75 ], "group_size": { "2": 64, "3": 64, "6": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 409224256, "up_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9896331186357298, "down_proj": { "bits": [ 5, 3 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "3": 32, "5": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 457272320, "up_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.3, 0.7 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9900776845844168, "down_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 512977920, "up_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.3, 0.7 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9937244002756319, "down_proj": { "bits": [ 8, 4, 3 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "3": 128, "4": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "total_bits": 578397280, "up_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9942926811544519, "down_proj": { "bits": [ 8, 4, 3 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "3": 32, "4": 32, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 32, "4": 32 }, "scale_bits": 4 }, "total_bits": 592872448, "up_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "3": 32, "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9949640067000138, "down_proj": { "bits": [ 8, 4 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "4": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 32, "4": 32 }, "scale_bits": 4 }, "total_bits": 637454432, "up_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "3": 32, "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9967787318715924, "down_proj": { "bits": [ 8, 4 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "4": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "total_bits": 728741472, "up_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9970653935482627, "down_proj": { "bits": [ 8, 4 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "4": 32, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 }, "total_bits": 739476480, "up_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.996767032695444, "down_proj": { "bits": [ 8, 5, 4 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "4": 128, "5": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 128, "5": 128 }, "scale_bits": 4 }, "total_bits": 751543392, "up_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "4": 128, "5": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9971982093625947, "down_proj": { "bits": [ 8, 5, 4 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "4": 32, "5": 32, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 }, "total_bits": 766018560, "up_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9983276103280092, "down_proj": { "bits": [ 8, 6, 5 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "5": 128, "6": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 128, "6": 128 }, "scale_bits": 4 }, "total_bits": 924689504, "up_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "5": 128, "6": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9985852405232819, "down_proj": { "bits": [ 8, 6, 5 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "5": 32, "6": 32, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 32, "6": 32 }, "scale_bits": 4 }, "total_bits": 939164672, "up_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "5": 32, "6": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9990856257316313, "down_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "6": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 }, "total_bits": 1069524064, "up_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9991190861910582, "down_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.15, 0.85 ], "group_size": { "6": 128, "8": 128 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "6": 128, "8": 128 }, "scale_bits": 4 }, "total_bits": 1110384896, "up_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "6": 128, "8": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9992483475882756, "down_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "6": 128, "8": 128 }, "scale_bits": 4 }, "total_bits": 1209999616, "up_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "6": 128, "8": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9997067060566655, "down_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "total_bits": 1415520512, "up_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 } } ], "model.layers.13.self_attn": [ { "accuracy": 0.9828554783996782, "k_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 89665536, "v_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9834067774446387, "k_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 92221440, "v_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9879215955734253, "k_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 95758848, "v_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9910149958572889, "k_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 112272384, "v_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9916526455628244, "k_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "total_bits": 132913152, "v_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9918705773980994, "k_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "total_bits": 132980224, "v_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 64, "4": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9955159751208205, "k_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "total_bits": 169613312, "v_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9957430539162535, "k_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "total_bits": 169745920, "v_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9960923469380328, "k_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 64 }, "scale_bits": 4 }, "total_bits": 171195392, "v_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9962013371680912, "k_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 }, "total_bits": 173563904, "v_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9959250072899618, "k_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 128, "5": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 128, "5": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 128, "5": 128 }, "scale_bits": 4 }, "total_bits": 174923264, "v_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9962140102135507, "k_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "total_bits": 175750144, "v_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9971167011872718, "k_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "total_bits": 179253248, "v_proj": { "bits": [ 5 ], "bits_prop": [ 1 ], "group_size": { "5": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9973495433989324, "k_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 }, "o_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 }, "q_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 }, "total_bits": 181592064, "v_proj": { "bits": [ 5 ], "bits_prop": [ 1 ], "group_size": { "5": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9984122467668433, "k_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 128, "6": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 128, "6": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 128, "6": 128 }, "scale_bits": 4 }, "total_bits": 220469248, "v_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9986572687171007, "k_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 32, "6": 32 }, "scale_bits": 4 }, "o_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 32, "6": 32 }, "scale_bits": 4 }, "q_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 32, "6": 32 }, "scale_bits": 4 }, "total_bits": 223535104, "v_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9988320752194053, "k_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 }, "total_bits": 253499392, "v_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9993663337571841, "k_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 32 }, "scale_bits": 4 }, "o_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 32 }, "scale_bits": 4 }, "q_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 32 }, "scale_bits": 4 }, "total_bits": 265838592, "v_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9996400609563448, "k_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "total_bits": 337385472, "v_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 } } ], "model.layers.14.mlp": [ { "accuracy": 0.9875233157684928, "down_proj": { "bits": [ 6, 3, 2 ], "bits_prop": [ 0.05, 0.2, 0.75 ], "group_size": { "2": 64, "3": 64, "6": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 395461696, "up_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9878479265852979, "down_proj": { "bits": [ 6, 3, 2 ], "bits_prop": [ 0.05, 0.2, 0.75 ], "group_size": { "2": 64, "3": 64, "6": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 409224256, "up_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9895368751726652, "down_proj": { "bits": [ 5, 3 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "3": 32, "5": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 457272320, "up_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.3, 0.7 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9899993993734059, "down_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 512977920, "up_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.3, 0.7 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.993670018487855, "down_proj": { "bits": [ 8, 4, 3 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "3": 128, "4": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "total_bits": 578397280, "up_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9942215884986677, "down_proj": { "bits": [ 8, 4, 3 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "3": 32, "4": 32, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 32, "4": 32 }, "scale_bits": 4 }, "total_bits": 592872448, "up_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "3": 32, "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9949082202817264, "down_proj": { "bits": [ 8, 4 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "4": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 32, "4": 32 }, "scale_bits": 4 }, "total_bits": 637454432, "up_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "3": 32, "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9967446970312219, "down_proj": { "bits": [ 8, 4 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "4": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "total_bits": 728741472, "up_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9970247843547871, "down_proj": { "bits": [ 8, 4 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "4": 32, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 }, "total_bits": 739476480, "up_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9967384052119757, "down_proj": { "bits": [ 8, 5, 4 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "4": 128, "5": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 128, "5": 128 }, "scale_bits": 4 }, "total_bits": 751543392, "up_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "4": 128, "5": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9971630753655183, "down_proj": { "bits": [ 8, 5, 4 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "4": 32, "5": 32, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 }, "total_bits": 766018560, "up_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9983114574692751, "down_proj": { "bits": [ 8, 6, 5 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "5": 128, "6": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 128, "6": 128 }, "scale_bits": 4 }, "total_bits": 924689504, "up_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "5": 128, "6": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9985628125110739, "down_proj": { "bits": [ 8, 6, 5 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "5": 32, "6": 32, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 32, "6": 32 }, "scale_bits": 4 }, "total_bits": 939164672, "up_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "5": 32, "6": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9990688124181408, "down_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "6": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 }, "total_bits": 1069524064, "up_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9991110992666922, "down_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.15, 0.85 ], "group_size": { "6": 128, "8": 128 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "6": 128, "8": 128 }, "scale_bits": 4 }, "total_bits": 1110384896, "up_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "6": 128, "8": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9992442513865075, "down_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "6": 128, "8": 128 }, "scale_bits": 4 }, "total_bits": 1209999616, "up_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "6": 128, "8": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9996968482277895, "down_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "total_bits": 1415520512, "up_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 } } ], "model.layers.14.self_attn": [ { "accuracy": 0.9838174518785978, "k_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 89665536, "v_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9843719727114627, "k_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 92221440, "v_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9887045284635142, "k_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 95758848, "v_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9914546130519164, "k_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 112272384, "v_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9918653510118786, "k_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "total_bits": 132913152, "v_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9921123667767173, "k_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "total_bits": 132980224, "v_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 64, "4": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9955721293625078, "k_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "total_bits": 169613312, "v_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9958132850496393, "k_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "total_bits": 169745920, "v_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9961087554693222, "k_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 64 }, "scale_bits": 4 }, "total_bits": 171195392, "v_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9962163759689582, "k_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 }, "total_bits": 173563904, "v_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.996002895659522, "k_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 128, "5": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 128, "5": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 128, "5": 128 }, "scale_bits": 4 }, "total_bits": 174923264, "v_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9962843621247693, "k_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "total_bits": 175750144, "v_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9971789945113031, "k_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "total_bits": 179253248, "v_proj": { "bits": [ 5 ], "bits_prop": [ 1 ], "group_size": { "5": 64 }, "scale_bits": 4 } }, { "accuracy": 0.997416727048786, "k_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 }, "o_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 }, "q_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 }, "total_bits": 181592064, "v_proj": { "bits": [ 5 ], "bits_prop": [ 1 ], "group_size": { "5": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9984408949354762, "k_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 128, "6": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 128, "6": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 128, "6": 128 }, "scale_bits": 4 }, "total_bits": 220469248, "v_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9986861550102109, "k_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 32, "6": 32 }, "scale_bits": 4 }, "o_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 32, "6": 32 }, "scale_bits": 4 }, "q_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 32, "6": 32 }, "scale_bits": 4 }, "total_bits": 223535104, "v_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9988319963020714, "k_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 }, "total_bits": 253499392, "v_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 } }, { "accuracy": 0.99938597490913, "k_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 32 }, "scale_bits": 4 }, "o_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 32 }, "scale_bits": 4 }, "q_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 32 }, "scale_bits": 4 }, "total_bits": 265838592, "v_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9996462815049055, "k_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "total_bits": 337385472, "v_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 } } ], "model.layers.15.mlp": [ { "accuracy": 0.9882000120062577, "down_proj": { "bits": [ 6, 3, 2 ], "bits_prop": [ 0.05, 0.2, 0.75 ], "group_size": { "2": 64, "3": 64, "6": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 395461696, "up_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9885095122613405, "down_proj": { "bits": [ 6, 3, 2 ], "bits_prop": [ 0.05, 0.2, 0.75 ], "group_size": { "2": 64, "3": 64, "6": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 409224256, "up_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9901390922696967, "down_proj": { "bits": [ 5, 3 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "3": 32, "5": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 457272320, "up_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.3, 0.7 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9905651133311423, "down_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 512977920, "up_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.3, 0.7 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9940665262310129, "down_proj": { "bits": [ 8, 4, 3 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "3": 128, "4": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "total_bits": 578397280, "up_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9945779082022215, "down_proj": { "bits": [ 8, 4, 3 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "3": 32, "4": 32, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 32, "4": 32 }, "scale_bits": 4 }, "total_bits": 592872448, "up_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "3": 32, "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9952104381824795, "down_proj": { "bits": [ 8, 4 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "4": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 32, "4": 32 }, "scale_bits": 4 }, "total_bits": 637454432, "up_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "3": 32, "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9969584867358208, "down_proj": { "bits": [ 8, 4 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "4": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "total_bits": 728741472, "up_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9972118480425132, "down_proj": { "bits": [ 8, 4 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "4": 32, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 }, "total_bits": 739476480, "up_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9969432953941194, "down_proj": { "bits": [ 8, 5, 4 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "4": 128, "5": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 128, "5": 128 }, "scale_bits": 4 }, "total_bits": 751543392, "up_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "4": 128, "5": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9973416069620534, "down_proj": { "bits": [ 8, 5, 4 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "4": 32, "5": 32, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 }, "total_bits": 766018560, "up_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9984195449046398, "down_proj": { "bits": [ 8, 6, 5 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "5": 128, "6": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 128, "6": 128 }, "scale_bits": 4 }, "total_bits": 924689504, "up_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "5": 128, "6": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9986543961261448, "down_proj": { "bits": [ 8, 6, 5 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "5": 32, "6": 32, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 32, "6": 32 }, "scale_bits": 4 }, "total_bits": 939164672, "up_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "5": 32, "6": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9991310028065192, "down_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "6": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 }, "total_bits": 1069524064, "up_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9991681857132598, "down_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.15, 0.85 ], "group_size": { "6": 128, "8": 128 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "6": 128, "8": 128 }, "scale_bits": 4 }, "total_bits": 1110384896, "up_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "6": 128, "8": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9992899579535189, "down_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "6": 128, "8": 128 }, "scale_bits": 4 }, "total_bits": 1209999616, "up_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "6": 128, "8": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9997181078468106, "down_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "total_bits": 1415520512, "up_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 } } ], "model.layers.15.self_attn": [ { "accuracy": 0.9853537082672119, "k_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 89665536, "v_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9859135260707453, "k_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 92221440, "v_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.989625019462485, "k_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 95758848, "v_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9922217765921041, "k_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 112272384, "v_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9927457649456827, "k_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "total_bits": 132913152, "v_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 } }, { "accuracy": 0.992907171186648, "k_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "total_bits": 132980224, "v_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 64, "4": 64 }, "scale_bits": 4 } }, { "accuracy": 0.996068970545342, "k_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "total_bits": 169613312, "v_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9962714479157799, "k_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "total_bits": 169745920, "v_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9965135682570306, "k_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 64 }, "scale_bits": 4 }, "total_bits": 171195392, "v_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9966247920927248, "k_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 }, "total_bits": 173563904, "v_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9964421787544301, "k_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 128, "5": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 128, "5": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 128, "5": 128 }, "scale_bits": 4 }, "total_bits": 174923264, "v_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9966720444591421, "k_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "total_bits": 175750144, "v_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9974600588412661, "k_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "total_bits": 179253248, "v_proj": { "bits": [ 5 ], "bits_prop": [ 1 ], "group_size": { "5": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9976655446777218, "k_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 }, "o_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 }, "q_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 }, "total_bits": 181592064, "v_proj": { "bits": [ 5 ], "bits_prop": [ 1 ], "group_size": { "5": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9985932309768701, "k_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 128, "6": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 128, "6": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 128, "6": 128 }, "scale_bits": 4 }, "total_bits": 220469248, "v_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9988174711010958, "k_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 32, "6": 32 }, "scale_bits": 4 }, "o_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 32, "6": 32 }, "scale_bits": 4 }, "q_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 32, "6": 32 }, "scale_bits": 4 }, "total_bits": 223535104, "v_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9989604161758172, "k_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 }, "total_bits": 253499392, "v_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9994376788504029, "k_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 32 }, "scale_bits": 4 }, "o_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 32 }, "scale_bits": 4 }, "q_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 32 }, "scale_bits": 4 }, "total_bits": 265838592, "v_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9996740988357679, "k_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "total_bits": 337385472, "v_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 } } ], "model.layers.16.mlp": [ { "accuracy": 0.9893458658143094, "down_proj": { "bits": [ 6, 3, 2 ], "bits_prop": [ 0.05, 0.2, 0.75 ], "group_size": { "2": 64, "3": 64, "6": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 395461696, "up_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9895959684723302, "down_proj": { "bits": [ 6, 3, 2 ], "bits_prop": [ 0.05, 0.2, 0.75 ], "group_size": { "2": 64, "3": 64, "6": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 409224256, "up_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9910526385432795, "down_proj": { "bits": [ 5, 3 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "3": 32, "5": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 457272320, "up_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.3, 0.7 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9914410247614509, "down_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 512977920, "up_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.3, 0.7 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9946083414711451, "down_proj": { "bits": [ 8, 4, 3 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "3": 128, "4": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "total_bits": 578397280, "up_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9950692045845484, "down_proj": { "bits": [ 8, 4, 3 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "3": 32, "4": 32, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 32, "4": 32 }, "scale_bits": 4 }, "total_bits": 592872448, "up_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "3": 32, "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9956511004190696, "down_proj": { "bits": [ 8, 4 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "4": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 32, "4": 32 }, "scale_bits": 4 }, "total_bits": 637454432, "up_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "3": 32, "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9972384309298113, "down_proj": { "bits": [ 8, 4 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "4": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "total_bits": 728741472, "up_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9974701265363317, "down_proj": { "bits": [ 8, 4 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "4": 32, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 }, "total_bits": 739476480, "up_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9972266358764548, "down_proj": { "bits": [ 8, 5, 4 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "4": 128, "5": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 128, "5": 128 }, "scale_bits": 4 }, "total_bits": 751543392, "up_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "4": 128, "5": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9975864961743355, "down_proj": { "bits": [ 8, 5, 4 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "4": 32, "5": 32, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 }, "total_bits": 766018560, "up_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9985627785913254, "down_proj": { "bits": [ 8, 6, 5 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "5": 128, "6": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 128, "6": 128 }, "scale_bits": 4 }, "total_bits": 924689504, "up_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "5": 128, "6": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9987755586442194, "down_proj": { "bits": [ 8, 6, 5 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "5": 32, "6": 32, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 32, "6": 32 }, "scale_bits": 4 }, "total_bits": 939164672, "up_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "5": 32, "6": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9992064898343462, "down_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "6": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 }, "total_bits": 1069524064, "up_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9992397114340412, "down_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.15, 0.85 ], "group_size": { "6": 128, "8": 128 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "6": 128, "8": 128 }, "scale_bits": 4 }, "total_bits": 1110384896, "up_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "6": 128, "8": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9993506253844029, "down_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "6": 128, "8": 128 }, "scale_bits": 4 }, "total_bits": 1209999616, "up_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "6": 128, "8": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9997363893903399, "down_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "total_bits": 1415520512, "up_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 } } ], "model.layers.16.self_attn": [ { "accuracy": 0.9865257238086901, "k_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 89665536, "v_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9870655850360268, "k_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 92221440, "v_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9904793751867194, "k_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 95758848, "v_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9928415903919622, "k_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 112272384, "v_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9932580794158735, "k_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "total_bits": 132913152, "v_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9934131628588626, "k_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "total_bits": 132980224, "v_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 64, "4": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9962535582874951, "k_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "total_bits": 169613312, "v_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9964618118185746, "k_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "total_bits": 169745920, "v_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9967471127839465, "k_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 64 }, "scale_bits": 4 }, "total_bits": 171195392, "v_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9968351717842253, "k_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 }, "total_bits": 173563904, "v_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9967037309941492, "k_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 128, "5": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 128, "5": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 128, "5": 128 }, "scale_bits": 4 }, "total_bits": 174923264, "v_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9969354577754673, "k_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "total_bits": 175750144, "v_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9976420824072862, "k_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "total_bits": 179253248, "v_proj": { "bits": [ 5 ], "bits_prop": [ 1 ], "group_size": { "5": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9978411754495219, "k_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 }, "o_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 }, "q_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 }, "total_bits": 181592064, "v_proj": { "bits": [ 5 ], "bits_prop": [ 1 ], "group_size": { "5": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9986936175509503, "k_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 128, "6": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 128, "6": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 128, "6": 128 }, "scale_bits": 4 }, "total_bits": 220469248, "v_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9989057820486394, "k_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 32, "6": 32 }, "scale_bits": 4 }, "o_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 32, "6": 32 }, "scale_bits": 4 }, "q_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 32, "6": 32 }, "scale_bits": 4 }, "total_bits": 223535104, "v_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9990166619812187, "k_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 }, "total_bits": 253499392, "v_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9994790970690941, "k_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 32 }, "scale_bits": 4 }, "o_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 32 }, "scale_bits": 4 }, "q_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 32 }, "scale_bits": 4 }, "total_bits": 265838592, "v_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9996907184096543, "k_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "total_bits": 337385472, "v_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 } } ], "model.layers.17.mlp": [ { "accuracy": 0.9897267928248957, "down_proj": { "bits": [ 6, 3, 2 ], "bits_prop": [ 0.05, 0.2, 0.75 ], "group_size": { "2": 64, "3": 64, "6": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 395461696, "up_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9899528842223319, "down_proj": { "bits": [ 6, 3, 2 ], "bits_prop": [ 0.05, 0.2, 0.75 ], "group_size": { "2": 64, "3": 64, "6": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 409224256, "up_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9914044439792633, "down_proj": { "bits": [ 5, 3 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "3": 32, "5": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 457272320, "up_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.3, 0.7 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.991797514651951, "down_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 512977920, "up_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.3, 0.7 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9947872601057354, "down_proj": { "bits": [ 8, 4, 3 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "3": 128, "4": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "total_bits": 578397280, "up_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9952365658000896, "down_proj": { "bits": [ 8, 4, 3 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "3": 32, "4": 32, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 32, "4": 32 }, "scale_bits": 4 }, "total_bits": 592872448, "up_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "3": 32, "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9958259671142227, "down_proj": { "bits": [ 8, 4 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "4": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 32, "4": 32 }, "scale_bits": 4 }, "total_bits": 637454432, "up_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "3": 32, "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9973235530288596, "down_proj": { "bits": [ 8, 4 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "4": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "total_bits": 728741472, "up_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9975615282984156, "down_proj": { "bits": [ 8, 4 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "4": 32, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 }, "total_bits": 739476480, "up_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9973176941275597, "down_proj": { "bits": [ 8, 5, 4 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "4": 128, "5": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 128, "5": 128 }, "scale_bits": 4 }, "total_bits": 751543392, "up_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "4": 128, "5": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9976620013384443, "down_proj": { "bits": [ 8, 5, 4 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "4": 32, "5": 32, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 }, "total_bits": 766018560, "up_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9986071402305051, "down_proj": { "bits": [ 8, 6, 5 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "5": 128, "6": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 128, "6": 128 }, "scale_bits": 4 }, "total_bits": 924689504, "up_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "5": 128, "6": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9988167626097014, "down_proj": { "bits": [ 8, 6, 5 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "5": 32, "6": 32, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 32, "6": 32 }, "scale_bits": 4 }, "total_bits": 939164672, "up_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "5": 32, "6": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9992339001772436, "down_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "6": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 }, "total_bits": 1069524064, "up_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 } }, { "accuracy": 0.99926495973609, "down_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.15, 0.85 ], "group_size": { "6": 128, "8": 128 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "6": 128, "8": 128 }, "scale_bits": 4 }, "total_bits": 1110384896, "up_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "6": 128, "8": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9993770516134406, "down_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "6": 128, "8": 128 }, "scale_bits": 4 }, "total_bits": 1209999616, "up_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "6": 128, "8": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9997475628594035, "down_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "total_bits": 1415520512, "up_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 } } ], "model.layers.17.self_attn": [ { "accuracy": 0.9886449018591329, "k_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 89665536, "v_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9891612255259564, "k_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 92221440, "v_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9921635969689018, "k_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 95758848, "v_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 } }, { "accuracy": 0.993950290115256, "k_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 112272384, "v_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9943691464631181, "k_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "total_bits": 132913152, "v_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9944795087764138, "k_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "total_bits": 132980224, "v_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 64, "4": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9969525437213873, "k_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "total_bits": 169613312, "v_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9970880876246252, "k_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "total_bits": 169745920, "v_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 64 }, "scale_bits": 4 } }, { "accuracy": 0.99732908253607, "k_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 64 }, "scale_bits": 4 }, "total_bits": 171195392, "v_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9973922760078782, "k_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 }, "total_bits": 173563904, "v_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9972340709676868, "k_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 128, "5": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 128, "5": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 128, "5": 128 }, "scale_bits": 4 }, "total_bits": 174923264, "v_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9974341131746769, "k_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "total_bits": 175750144, "v_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9980946502795345, "k_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "total_bits": 179253248, "v_proj": { "bits": [ 5 ], "bits_prop": [ 1 ], "group_size": { "5": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9982492666887609, "k_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 }, "o_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 }, "q_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 }, "total_bits": 181592064, "v_proj": { "bits": [ 5 ], "bits_prop": [ 1 ], "group_size": { "5": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9989442581212834, "k_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 128, "6": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 128, "6": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 128, "6": 128 }, "scale_bits": 4 }, "total_bits": 220469248, "v_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9991107380115672, "k_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 32, "6": 32 }, "scale_bits": 4 }, "o_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 32, "6": 32 }, "scale_bits": 4 }, "q_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 32, "6": 32 }, "scale_bits": 4 }, "total_bits": 223535104, "v_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9991999070993379, "k_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 }, "total_bits": 253499392, "v_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9995751509835061, "k_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 32 }, "scale_bits": 4 }, "o_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 32 }, "scale_bits": 4 }, "q_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 32 }, "scale_bits": 4 }, "total_bits": 265838592, "v_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9997397776153919, "k_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "total_bits": 337385472, "v_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 } } ], "model.layers.18.mlp": [ { "accuracy": 0.9891724594329533, "down_proj": { "bits": [ 6, 3, 2 ], "bits_prop": [ 0.05, 0.2, 0.75 ], "group_size": { "2": 64, "3": 64, "6": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 395461696, "up_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9893685767525121, "down_proj": { "bits": [ 6, 3, 2 ], "bits_prop": [ 0.05, 0.2, 0.75 ], "group_size": { "2": 64, "3": 64, "6": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 409224256, "up_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9910712642105002, "down_proj": { "bits": [ 5, 3 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "3": 32, "5": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 457272320, "up_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.3, 0.7 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9915990217735893, "down_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 512977920, "up_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.3, 0.7 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9945086954455626, "down_proj": { "bits": [ 8, 4, 3 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "3": 128, "4": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "total_bits": 578397280, "up_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9949573717619243, "down_proj": { "bits": [ 8, 4, 3 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "3": 32, "4": 32, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 32, "4": 32 }, "scale_bits": 4 }, "total_bits": 592872448, "up_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "3": 32, "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9957504950855908, "down_proj": { "bits": [ 8, 4 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "4": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 32, "4": 32 }, "scale_bits": 4 }, "total_bits": 637454432, "up_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "3": 32, "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9971308437617201, "down_proj": { "bits": [ 8, 4 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "4": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "total_bits": 728741472, "up_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.997401583351587, "down_proj": { "bits": [ 8, 4 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "4": 32, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 }, "total_bits": 739476480, "up_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.997146016280902, "down_proj": { "bits": [ 8, 5, 4 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "4": 128, "5": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 128, "5": 128 }, "scale_bits": 4 }, "total_bits": 751543392, "up_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "4": 128, "5": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9975201028742289, "down_proj": { "bits": [ 8, 5, 4 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "4": 32, "5": 32, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 }, "total_bits": 766018560, "up_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9985156167102488, "down_proj": { "bits": [ 8, 6, 5 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "5": 128, "6": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 128, "6": 128 }, "scale_bits": 4 }, "total_bits": 924689504, "up_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "5": 128, "6": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9987299474642465, "down_proj": { "bits": [ 8, 6, 5 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "5": 32, "6": 32, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 32, "6": 32 }, "scale_bits": 4 }, "total_bits": 939164672, "up_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "5": 32, "6": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9991644729713076, "down_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "6": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 }, "total_bits": 1069524064, "up_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9992069929446045, "down_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.15, 0.85 ], "group_size": { "6": 128, "8": 128 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "6": 128, "8": 128 }, "scale_bits": 4 }, "total_bits": 1110384896, "up_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "6": 128, "8": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9993538156053737, "down_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "6": 128, "8": 128 }, "scale_bits": 4 }, "total_bits": 1209999616, "up_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "6": 128, "8": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9996845768274445, "down_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "total_bits": 1415520512, "up_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 } } ], "model.layers.18.self_attn": [ { "accuracy": 0.9889059780459655, "k_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 89665536, "v_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9893004807986712, "k_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 92221440, "v_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9922221710807398, "k_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 95758848, "v_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9939199882118326, "k_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 112272384, "v_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9943547762538257, "k_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "total_bits": 132913152, "v_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9945436935675772, "k_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "total_bits": 132980224, "v_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 64, "4": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9968924018505373, "k_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "total_bits": 169613312, "v_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9970508141345099, "k_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "total_bits": 169745920, "v_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9973028966862905, "k_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 64 }, "scale_bits": 4 }, "total_bits": 171195392, "v_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9973666095419934, "k_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 }, "total_bits": 173563904, "v_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9972681769807088, "k_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 128, "5": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 128, "5": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 128, "5": 128 }, "scale_bits": 4 }, "total_bits": 174923264, "v_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9974800565917241, "k_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "total_bits": 175750144, "v_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9980883045416129, "k_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "total_bits": 179253248, "v_proj": { "bits": [ 5 ], "bits_prop": [ 1 ], "group_size": { "5": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9982407877319738, "k_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 }, "o_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 }, "q_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 }, "total_bits": 181592064, "v_proj": { "bits": [ 5 ], "bits_prop": [ 1 ], "group_size": { "5": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9989417998218223, "k_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 128, "6": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 128, "6": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 128, "6": 128 }, "scale_bits": 4 }, "total_bits": 220469248, "v_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9991059720908341, "k_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 32, "6": 32 }, "scale_bits": 4 }, "o_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 32, "6": 32 }, "scale_bits": 4 }, "q_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 32, "6": 32 }, "scale_bits": 4 }, "total_bits": 223535104, "v_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9991892392894155, "k_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 }, "total_bits": 253499392, "v_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9995719495376474, "k_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 32 }, "scale_bits": 4 }, "o_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 32 }, "scale_bits": 4 }, "q_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 32 }, "scale_bits": 4 }, "total_bits": 265838592, "v_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9997385811354769, "k_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "total_bits": 337385472, "v_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 } } ], "model.layers.19.mlp": [ { "accuracy": 0.9902032543169824, "down_proj": { "bits": [ 6, 3, 2 ], "bits_prop": [ 0.05, 0.2, 0.75 ], "group_size": { "2": 64, "3": 64, "6": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 395461696, "up_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9904165613023859, "down_proj": { "bits": [ 6, 3, 2 ], "bits_prop": [ 0.05, 0.2, 0.75 ], "group_size": { "2": 64, "3": 64, "6": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 409224256, "up_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9917339392398533, "down_proj": { "bits": [ 5, 3 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "3": 32, "5": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 457272320, "up_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.3, 0.7 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9920873194932938, "down_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 512977920, "up_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.3, 0.7 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9950326551732264, "down_proj": { "bits": [ 8, 4, 3 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "3": 128, "4": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "total_bits": 578397280, "up_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9954507782271034, "down_proj": { "bits": [ 8, 4, 3 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "3": 32, "4": 32, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 32, "4": 32 }, "scale_bits": 4 }, "total_bits": 592872448, "up_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "3": 32, "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9959858236344237, "down_proj": { "bits": [ 8, 4 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "4": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 32, "4": 32 }, "scale_bits": 4 }, "total_bits": 637454432, "up_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "3": 32, "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9974483098638686, "down_proj": { "bits": [ 8, 4 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "4": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "total_bits": 728741472, "up_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9976797758748657, "down_proj": { "bits": [ 8, 4 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "4": 32, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 }, "total_bits": 739476480, "up_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9974413349440223, "down_proj": { "bits": [ 8, 5, 4 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "4": 128, "5": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 128, "5": 128 }, "scale_bits": 4 }, "total_bits": 751543392, "up_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "4": 128, "5": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9977723330651459, "down_proj": { "bits": [ 8, 5, 4 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "4": 32, "5": 32, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 }, "total_bits": 766018560, "up_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9986741869269233, "down_proj": { "bits": [ 8, 6, 5 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "5": 128, "6": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 128, "6": 128 }, "scale_bits": 4 }, "total_bits": 924689504, "up_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "5": 128, "6": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9988692217555485, "down_proj": { "bits": [ 8, 6, 5 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "5": 32, "6": 32, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 32, "6": 32 }, "scale_bits": 4 }, "total_bits": 939164672, "up_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "5": 32, "6": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9992718798549551, "down_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "6": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 }, "total_bits": 1069524064, "up_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9992985039655315, "down_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.15, 0.85 ], "group_size": { "6": 128, "8": 128 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "6": 128, "8": 128 }, "scale_bits": 4 }, "total_bits": 1110384896, "up_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "6": 128, "8": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9993958580062577, "down_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "6": 128, "8": 128 }, "scale_bits": 4 }, "total_bits": 1209999616, "up_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "6": 128, "8": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9997637082920655, "down_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "total_bits": 1415520512, "up_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 } } ], "model.layers.19.self_attn": [ { "accuracy": 0.9899442784096065, "k_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 89665536, "v_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9904114580468127, "k_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 92221440, "v_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9929309903006804, "k_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 95758848, "v_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9943358772679379, "k_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 112272384, "v_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9949542880058289, "k_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "total_bits": 132913152, "v_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9951300797493834, "k_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "total_bits": 132980224, "v_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 64, "4": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9972042125698767, "k_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "total_bits": 169613312, "v_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9973608171077151, "k_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "total_bits": 169745920, "v_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9976215125306657, "k_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 64 }, "scale_bits": 4 }, "total_bits": 171195392, "v_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9976868149089185, "k_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 }, "total_bits": 173563904, "v_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.99758438452294, "k_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 128, "5": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 128, "5": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 128, "5": 128 }, "scale_bits": 4 }, "total_bits": 174923264, "v_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9977698159453116, "k_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "total_bits": 175750144, "v_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9983355873509457, "k_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "total_bits": 179253248, "v_proj": { "bits": [ 5 ], "bits_prop": [ 1 ], "group_size": { "5": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9984699382789826, "k_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 }, "o_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 }, "q_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 }, "total_bits": 181592064, "v_proj": { "bits": [ 5 ], "bits_prop": [ 1 ], "group_size": { "5": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9990822985572251, "k_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 128, "6": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 128, "6": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 128, "6": 128 }, "scale_bits": 4 }, "total_bits": 220469248, "v_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9992158507045946, "k_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 32, "6": 32 }, "scale_bits": 4 }, "o_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 32, "6": 32 }, "scale_bits": 4 }, "q_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 32, "6": 32 }, "scale_bits": 4 }, "total_bits": 223535104, "v_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9992867486649438, "k_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 }, "total_bits": 253499392, "v_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 } }, { "accuracy": 0.999630064997626, "k_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 32 }, "scale_bits": 4 }, "o_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 32 }, "scale_bits": 4 }, "q_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 32 }, "scale_bits": 4 }, "total_bits": 265838592, "v_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 32 }, "scale_bits": 4 } }, { "accuracy": 0.999766306044828, "k_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "total_bits": 337385472, "v_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 } } ], "model.layers.2.mlp": [ { "accuracy": 0.9645276477462367, "down_proj": { "bits": [ 6, 3, 2 ], "bits_prop": [ 0.05, 0.2, 0.75 ], "group_size": { "2": 64, "3": 64, "6": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 395461696, "up_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.965232180921655, "down_proj": { "bits": [ 6, 3, 2 ], "bits_prop": [ 0.05, 0.2, 0.75 ], "group_size": { "2": 64, "3": 64, "6": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 409224256, "up_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9711361370588604, "down_proj": { "bits": [ 5, 3 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "3": 32, "5": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 457272320, "up_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.3, 0.7 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9729378286160921, "down_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 512977920, "up_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.3, 0.7 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9818323144787237, "down_proj": { "bits": [ 8, 4, 3 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "3": 128, "4": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "total_bits": 578397280, "up_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9833754254014868, "down_proj": { "bits": [ 8, 4, 3 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "3": 32, "4": 32, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 32, "4": 32 }, "scale_bits": 4 }, "total_bits": 592872448, "up_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "3": 32, "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9859896568875564, "down_proj": { "bits": [ 8, 4 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "4": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 32, "4": 32 }, "scale_bits": 4 }, "total_bits": 637454432, "up_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "3": 32, "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9905942600024374, "down_proj": { "bits": [ 8, 4 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "4": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "total_bits": 728741472, "up_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9915031273114053, "down_proj": { "bits": [ 8, 4 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "4": 32, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 }, "total_bits": 739476480, "up_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9906871365873438, "down_proj": { "bits": [ 8, 5, 4 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "4": 128, "5": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 128, "5": 128 }, "scale_bits": 4 }, "total_bits": 751543392, "up_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "4": 128, "5": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9918833923967261, "down_proj": { "bits": [ 8, 5, 4 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "4": 32, "5": 32, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 }, "total_bits": 766018560, "up_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9952232022034494, "down_proj": { "bits": [ 8, 6, 5 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "5": 128, "6": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 128, "6": 128 }, "scale_bits": 4 }, "total_bits": 924689504, "up_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "5": 128, "6": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9959380042396093, "down_proj": { "bits": [ 8, 6, 5 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "5": 32, "6": 32, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 32, "6": 32 }, "scale_bits": 4 }, "total_bits": 939164672, "up_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "5": 32, "6": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9974319478006739, "down_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "6": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 }, "total_bits": 1069524064, "up_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9975541612427485, "down_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.15, 0.85 ], "group_size": { "6": 128, "8": 128 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "6": 128, "8": 128 }, "scale_bits": 4 }, "total_bits": 1110384896, "up_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "6": 128, "8": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9980885855069286, "down_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "6": 128, "8": 128 }, "scale_bits": 4 }, "total_bits": 1209999616, "up_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "6": 128, "8": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9992834124223966, "down_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "total_bits": 1415520512, "up_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 } } ], "model.layers.2.self_attn": [ { "accuracy": 0.9237543093530756, "k_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 89665536, "v_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9276719720740068, "k_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 92221440, "v_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9363078192660683, "k_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 95758848, "v_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 } }, { "accuracy": 0.959135607669228, "k_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 112272384, "v_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9623121901562339, "k_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "total_bits": 132913152, "v_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 } }, { "accuracy": 0.962625149049257, "k_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "total_bits": 132980224, "v_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 64, "4": 64 }, "scale_bits": 4 } }, { "accuracy": 0.978696490588941, "k_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "total_bits": 169613312, "v_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9790957648503152, "k_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "total_bits": 169745920, "v_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9804453771365317, "k_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 64 }, "scale_bits": 4 }, "total_bits": 171195392, "v_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9814739729228773, "k_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 }, "total_bits": 173563904, "v_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9808463077796133, "k_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 128, "5": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 128, "5": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 128, "5": 128 }, "scale_bits": 4 }, "total_bits": 174923264, "v_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9819487741118983, "k_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "total_bits": 175750144, "v_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9837646280464373, "k_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "total_bits": 179253248, "v_proj": { "bits": [ 5 ], "bits_prop": [ 1 ], "group_size": { "5": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9849483637433303, "k_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 }, "o_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 }, "q_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 }, "total_bits": 181592064, "v_proj": { "bits": [ 5 ], "bits_prop": [ 1 ], "group_size": { "5": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9911041416619953, "k_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 128, "6": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 128, "6": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 128, "6": 128 }, "scale_bits": 4 }, "total_bits": 220469248, "v_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 } }, { "accuracy": 0.99239439948609, "k_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 32, "6": 32 }, "scale_bits": 4 }, "o_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 32, "6": 32 }, "scale_bits": 4 }, "q_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 32, "6": 32 }, "scale_bits": 4 }, "total_bits": 223535104, "v_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9943860690844687, "k_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 }, "total_bits": 253499392, "v_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9960547422892169, "k_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 32 }, "scale_bits": 4 }, "o_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 32 }, "scale_bits": 4 }, "q_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 32 }, "scale_bits": 4 }, "total_bits": 265838592, "v_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9984863251447678, "k_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "total_bits": 337385472, "v_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 } } ], "model.layers.20.mlp": [ { "accuracy": 0.9890060738513344, "down_proj": { "bits": [ 6, 3, 2 ], "bits_prop": [ 0.05, 0.2, 0.75 ], "group_size": { "2": 64, "3": 64, "6": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 395461696, "up_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9892624483296746, "down_proj": { "bits": [ 6, 3, 2 ], "bits_prop": [ 0.05, 0.2, 0.75 ], "group_size": { "2": 64, "3": 64, "6": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 409224256, "up_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9913419618418342, "down_proj": { "bits": [ 5, 3 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "3": 32, "5": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 457272320, "up_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.3, 0.7 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9920650501000253, "down_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 512977920, "up_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.3, 0.7 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9943055236025861, "down_proj": { "bits": [ 8, 4, 3 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "3": 128, "4": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "total_bits": 578397280, "up_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 } }, { "accuracy": 0.99479189593541, "down_proj": { "bits": [ 8, 4, 3 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "3": 32, "4": 32, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 32, "4": 32 }, "scale_bits": 4 }, "total_bits": 592872448, "up_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "3": 32, "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.995808377077705, "down_proj": { "bits": [ 8, 4 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "4": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 32, "4": 32 }, "scale_bits": 4 }, "total_bits": 637454432, "up_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "3": 32, "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9970046842568799, "down_proj": { "bits": [ 8, 4 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "4": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "total_bits": 728741472, "up_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9973210964940096, "down_proj": { "bits": [ 8, 4 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "4": 32, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 }, "total_bits": 739476480, "up_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9970653319829389, "down_proj": { "bits": [ 8, 5, 4 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "4": 128, "5": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 128, "5": 128 }, "scale_bits": 4 }, "total_bits": 751543392, "up_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "4": 128, "5": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9974443020397111, "down_proj": { "bits": [ 8, 5, 4 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "4": 32, "5": 32, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 }, "total_bits": 766018560, "up_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9984775022848656, "down_proj": { "bits": [ 8, 6, 5 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "5": 128, "6": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 128, "6": 128 }, "scale_bits": 4 }, "total_bits": 924689504, "up_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "5": 128, "6": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9987037738687113, "down_proj": { "bits": [ 8, 6, 5 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "5": 32, "6": 32, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 32, "6": 32 }, "scale_bits": 4 }, "total_bits": 939164672, "up_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "5": 32, "6": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9991606553330233, "down_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "6": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 }, "total_bits": 1069524064, "up_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9991998552883926, "down_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.15, 0.85 ], "group_size": { "6": 128, "8": 128 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "6": 128, "8": 128 }, "scale_bits": 4 }, "total_bits": 1110384896, "up_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "6": 128, "8": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9993949229583928, "down_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "6": 128, "8": 128 }, "scale_bits": 4 }, "total_bits": 1209999616, "up_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "6": 128, "8": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9997174779051229, "down_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "total_bits": 1415520512, "up_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 } } ], "model.layers.20.self_attn": [ { "accuracy": 0.989389128590885, "k_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 89665536, "v_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9899768609749643, "k_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 92221440, "v_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9924891214621695, "k_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 95758848, "v_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9941255611024404, "k_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 112272384, "v_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9947114853482497, "k_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "total_bits": 132913152, "v_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9948525722873839, "k_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "total_bits": 132980224, "v_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 64, "4": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9970268171868826, "k_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "total_bits": 169613312, "v_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9971417870960737, "k_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "total_bits": 169745920, "v_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9974139491586309, "k_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 64 }, "scale_bits": 4 }, "total_bits": 171195392, "v_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9974898272439053, "k_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 }, "total_bits": 173563904, "v_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9974413645502768, "k_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 128, "5": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 128, "5": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 128, "5": 128 }, "scale_bits": 4 }, "total_bits": 174923264, "v_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 } }, { "accuracy": 0.997613892743462, "k_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "total_bits": 175750144, "v_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9981670273762, "k_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "total_bits": 179253248, "v_proj": { "bits": [ 5 ], "bits_prop": [ 1 ], "group_size": { "5": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9983376378291532, "k_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 }, "o_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 }, "q_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 }, "total_bits": 181592064, "v_proj": { "bits": [ 5 ], "bits_prop": [ 1 ], "group_size": { "5": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9989859425511799, "k_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 128, "6": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 128, "6": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 128, "6": 128 }, "scale_bits": 4 }, "total_bits": 220469248, "v_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9991421266213844, "k_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 32, "6": 32 }, "scale_bits": 4 }, "o_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 32, "6": 32 }, "scale_bits": 4 }, "q_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 32, "6": 32 }, "scale_bits": 4 }, "total_bits": 223535104, "v_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9992281499956, "k_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 }, "total_bits": 253499392, "v_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9995698522482264, "k_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 32 }, "scale_bits": 4 }, "o_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 32 }, "scale_bits": 4 }, "q_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 32 }, "scale_bits": 4 }, "total_bits": 265838592, "v_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9997479860964966, "k_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "total_bits": 337385472, "v_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 } } ], "model.layers.21.mlp": [ { "accuracy": 0.9903992939936487, "down_proj": { "bits": [ 6, 3, 2 ], "bits_prop": [ 0.05, 0.2, 0.75 ], "group_size": { "2": 64, "3": 64, "6": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 395461696, "up_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9906064326825895, "down_proj": { "bits": [ 6, 3, 2 ], "bits_prop": [ 0.05, 0.2, 0.75 ], "group_size": { "2": 64, "3": 64, "6": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 409224256, "up_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9918473441349832, "down_proj": { "bits": [ 5, 3 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "3": 32, "5": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 457272320, "up_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.3, 0.7 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9921871204125253, "down_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 512977920, "up_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.3, 0.7 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.995114442157118, "down_proj": { "bits": [ 8, 4, 3 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "3": 128, "4": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "total_bits": 578397280, "up_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9955413639545441, "down_proj": { "bits": [ 8, 4, 3 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "3": 32, "4": 32, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 32, "4": 32 }, "scale_bits": 4 }, "total_bits": 592872448, "up_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "3": 32, "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9960627006857019, "down_proj": { "bits": [ 8, 4 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "4": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 32, "4": 32 }, "scale_bits": 4 }, "total_bits": 637454432, "up_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "3": 32, "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9974657267724213, "down_proj": { "bits": [ 8, 4 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "4": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "total_bits": 728741472, "up_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9977150549621958, "down_proj": { "bits": [ 8, 4 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "4": 32, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 }, "total_bits": 739476480, "up_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9974824137201435, "down_proj": { "bits": [ 8, 5, 4 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "4": 128, "5": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 128, "5": 128 }, "scale_bits": 4 }, "total_bits": 751543392, "up_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "4": 128, "5": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9978174529969692, "down_proj": { "bits": [ 8, 5, 4 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "4": 32, "5": 32, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 }, "total_bits": 766018560, "up_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9986909325969847, "down_proj": { "bits": [ 8, 6, 5 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "5": 128, "6": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 128, "6": 128 }, "scale_bits": 4 }, "total_bits": 924689504, "up_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "5": 128, "6": 128 }, "scale_bits": 4 } }, { "accuracy": 0.998886980704571, "down_proj": { "bits": [ 8, 6, 5 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "5": 32, "6": 32, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 32, "6": 32 }, "scale_bits": 4 }, "total_bits": 939164672, "up_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "5": 32, "6": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9992717835856112, "down_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "6": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 }, "total_bits": 1069524064, "up_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9993079650754991, "down_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.15, 0.85 ], "group_size": { "6": 128, "8": 128 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "6": 128, "8": 128 }, "scale_bits": 4 }, "total_bits": 1110384896, "up_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "6": 128, "8": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9994025735282585, "down_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "6": 128, "8": 128 }, "scale_bits": 4 }, "total_bits": 1209999616, "up_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "6": 128, "8": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9997552397758945, "down_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "total_bits": 1415520512, "up_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 } } ], "model.layers.21.self_attn": [ { "accuracy": 0.9897454208449313, "k_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 89665536, "v_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9901039286663658, "k_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 92221440, "v_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9923692988721948, "k_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 95758848, "v_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 } }, { "accuracy": 0.994056155022822, "k_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 112272384, "v_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9949007646033639, "k_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "total_bits": 132913152, "v_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 } }, { "accuracy": 0.995028421674904, "k_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "total_bits": 132980224, "v_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 64, "4": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9971694193388286, "k_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "total_bits": 169613312, "v_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9973240394733454, "k_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "total_bits": 169745920, "v_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9975245838102541, "k_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 64 }, "scale_bits": 4 }, "total_bits": 171195392, "v_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9975989076652025, "k_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 }, "total_bits": 173563904, "v_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9975412746793345, "k_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 128, "5": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 128, "5": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 128, "5": 128 }, "scale_bits": 4 }, "total_bits": 174923264, "v_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9977078324085787, "k_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "total_bits": 175750144, "v_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9981883634862146, "k_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "total_bits": 179253248, "v_proj": { "bits": [ 5 ], "bits_prop": [ 1 ], "group_size": { "5": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9983305213482756, "k_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 }, "o_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 }, "q_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 }, "total_bits": 181592064, "v_proj": { "bits": [ 5 ], "bits_prop": [ 1 ], "group_size": { "5": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9990027330227589, "k_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 128, "6": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 128, "6": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 128, "6": 128 }, "scale_bits": 4 }, "total_bits": 220469248, "v_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9991424721910765, "k_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 32, "6": 32 }, "scale_bits": 4 }, "o_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 32, "6": 32 }, "scale_bits": 4 }, "q_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 32, "6": 32 }, "scale_bits": 4 }, "total_bits": 223535104, "v_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9992566013610676, "k_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 }, "total_bits": 253499392, "v_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9995739650177328, "k_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 32 }, "scale_bits": 4 }, "o_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 32 }, "scale_bits": 4 }, "q_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 32 }, "scale_bits": 4 }, "total_bits": 265838592, "v_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9997482070650318, "k_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "total_bits": 337385472, "v_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 } } ], "model.layers.22.mlp": [ { "accuracy": 0.9899730196124629, "down_proj": { "bits": [ 6, 3, 2 ], "bits_prop": [ 0.05, 0.2, 0.75 ], "group_size": { "2": 64, "3": 64, "6": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 395461696, "up_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9902052400927794, "down_proj": { "bits": [ 6, 3, 2 ], "bits_prop": [ 0.05, 0.2, 0.75 ], "group_size": { "2": 64, "3": 64, "6": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 409224256, "up_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.991534768750793, "down_proj": { "bits": [ 5, 3 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "3": 32, "5": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 457272320, "up_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.3, 0.7 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9919028486076155, "down_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 512977920, "up_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.3, 0.7 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9948992156668713, "down_proj": { "bits": [ 8, 4, 3 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "3": 128, "4": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "total_bits": 578397280, "up_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9953280095207063, "down_proj": { "bits": [ 8, 4, 3 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "3": 32, "4": 32, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 32, "4": 32 }, "scale_bits": 4 }, "total_bits": 592872448, "up_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "3": 32, "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9958950461525666, "down_proj": { "bits": [ 8, 4 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "4": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 32, "4": 32 }, "scale_bits": 4 }, "total_bits": 637454432, "up_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "3": 32, "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9973623789846897, "down_proj": { "bits": [ 8, 4 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "4": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "total_bits": 728741472, "up_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9976130563177561, "down_proj": { "bits": [ 8, 4 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "4": 32, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 }, "total_bits": 739476480, "up_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9973780457910738, "down_proj": { "bits": [ 8, 5, 4 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "4": 128, "5": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 128, "5": 128 }, "scale_bits": 4 }, "total_bits": 751543392, "up_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "4": 128, "5": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9977141797150436, "down_proj": { "bits": [ 8, 5, 4 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "4": 32, "5": 32, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 }, "total_bits": 766018560, "up_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9986393627171454, "down_proj": { "bits": [ 8, 6, 5 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "5": 128, "6": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 128, "6": 128 }, "scale_bits": 4 }, "total_bits": 924689504, "up_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "5": 128, "6": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9988375999229518, "down_proj": { "bits": [ 8, 6, 5 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "5": 32, "6": 32, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 32, "6": 32 }, "scale_bits": 4 }, "total_bits": 939164672, "up_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "5": 32, "6": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9992496966825504, "down_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "6": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 }, "total_bits": 1069524064, "up_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9992812349902171, "down_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.15, 0.85 ], "group_size": { "6": 128, "8": 128 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "6": 128, "8": 128 }, "scale_bits": 4 }, "total_bits": 1110384896, "up_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "6": 128, "8": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9993848222258844, "down_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "6": 128, "8": 128 }, "scale_bits": 4 }, "total_bits": 1209999616, "up_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "6": 128, "8": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9997536087849814, "down_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "total_bits": 1415520512, "up_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 } } ], "model.layers.22.self_attn": [ { "accuracy": 0.9902591140646684, "k_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 89665536, "v_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9905542448947304, "k_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 92221440, "v_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9930853467238577, "k_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 95758848, "v_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9944551983161977, "k_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 112272384, "v_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9951472564747459, "k_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "total_bits": 132913152, "v_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9953178716333289, "k_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "total_bits": 132980224, "v_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 64, "4": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9972812041248146, "k_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "total_bits": 169613312, "v_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 } }, { "accuracy": 0.997440910849132, "k_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "total_bits": 169745920, "v_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9976792508050015, "k_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 64 }, "scale_bits": 4 }, "total_bits": 171195392, "v_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9977406282958231, "k_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 }, "total_bits": 173563904, "v_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9976605294566405, "k_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 128, "5": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 128, "5": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 128, "5": 128 }, "scale_bits": 4 }, "total_bits": 174923264, "v_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9978491979602137, "k_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "total_bits": 175750144, "v_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9983302564605286, "k_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "total_bits": 179253248, "v_proj": { "bits": [ 5 ], "bits_prop": [ 1 ], "group_size": { "5": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9984773316077495, "k_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 }, "o_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 }, "q_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 }, "total_bits": 181592064, "v_proj": { "bits": [ 5 ], "bits_prop": [ 1 ], "group_size": { "5": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9990748337617046, "k_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 128, "6": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 128, "6": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 128, "6": 128 }, "scale_bits": 4 }, "total_bits": 220469248, "v_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9992224040784334, "k_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 32, "6": 32 }, "scale_bits": 4 }, "o_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 32, "6": 32 }, "scale_bits": 4 }, "q_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 32, "6": 32 }, "scale_bits": 4 }, "total_bits": 223535104, "v_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9992876899379649, "k_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 }, "total_bits": 253499392, "v_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 } }, { "accuracy": 0.999613924834289, "k_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 32 }, "scale_bits": 4 }, "o_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 32 }, "scale_bits": 4 }, "q_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 32 }, "scale_bits": 4 }, "total_bits": 265838592, "v_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9997601158867934, "k_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "total_bits": 337385472, "v_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 } } ], "model.layers.23.mlp": [ { "accuracy": 0.9889686837008125, "down_proj": { "bits": [ 6, 3, 2 ], "bits_prop": [ 0.05, 0.2, 0.75 ], "group_size": { "2": 64, "3": 64, "6": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 395461696, "up_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9891947358846664, "down_proj": { "bits": [ 6, 3, 2 ], "bits_prop": [ 0.05, 0.2, 0.75 ], "group_size": { "2": 64, "3": 64, "6": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 409224256, "up_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9905904625591478, "down_proj": { "bits": [ 5, 3 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "3": 32, "5": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 457272320, "up_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.3, 0.7 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9909770951459282, "down_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 512977920, "up_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.3, 0.7 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9943621444859003, "down_proj": { "bits": [ 8, 4, 3 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "3": 128, "4": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "total_bits": 578397280, "up_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9948567038303927, "down_proj": { "bits": [ 8, 4, 3 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "3": 32, "4": 32, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 32, "4": 32 }, "scale_bits": 4 }, "total_bits": 592872448, "up_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "3": 32, "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9954520487471631, "down_proj": { "bits": [ 8, 4 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "4": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 32, "4": 32 }, "scale_bits": 4 }, "total_bits": 637454432, "up_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "3": 32, "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9970748204933969, "down_proj": { "bits": [ 8, 4 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "4": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "total_bits": 728741472, "up_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9973747510659067, "down_proj": { "bits": [ 8, 4 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "4": 32, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 }, "total_bits": 739476480, "up_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9971028564399794, "down_proj": { "bits": [ 8, 5, 4 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "4": 128, "5": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 128, "5": 128 }, "scale_bits": 4 }, "total_bits": 751543392, "up_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "4": 128, "5": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9974856013922315, "down_proj": { "bits": [ 8, 5, 4 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "4": 32, "5": 32, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 }, "total_bits": 766018560, "up_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9984958778674665, "down_proj": { "bits": [ 8, 6, 5 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "5": 128, "6": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 128, "6": 128 }, "scale_bits": 4 }, "total_bits": 924689504, "up_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "5": 128, "6": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9987215607574111, "down_proj": { "bits": [ 8, 6, 5 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "5": 32, "6": 32, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 32, "6": 32 }, "scale_bits": 4 }, "total_bits": 939164672, "up_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "5": 32, "6": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9991709133119959, "down_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "6": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 }, "total_bits": 1069524064, "up_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9992074572824334, "down_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.15, 0.85 ], "group_size": { "6": 128, "8": 128 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "6": 128, "8": 128 }, "scale_bits": 4 }, "total_bits": 1110384896, "up_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "6": 128, "8": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9993144681089019, "down_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "6": 128, "8": 128 }, "scale_bits": 4 }, "total_bits": 1209999616, "up_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "6": 128, "8": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9997293661887708, "down_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "total_bits": 1415520512, "up_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 } } ], "model.layers.23.self_attn": [ { "accuracy": 0.989592894911766, "k_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 89665536, "v_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9899579545384959, "k_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 92221440, "v_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9925546120656165, "k_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 95758848, "v_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 } }, { "accuracy": 0.994034690292258, "k_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 112272384, "v_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9948168585174962, "k_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "total_bits": 132913152, "v_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9949440073810125, "k_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "total_bits": 132980224, "v_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 64, "4": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9971520292915796, "k_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "total_bits": 169613312, "v_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9973252025481901, "k_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "total_bits": 169745920, "v_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9975376536971644, "k_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 64 }, "scale_bits": 4 }, "total_bits": 171195392, "v_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9976255330992373, "k_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 }, "total_bits": 173563904, "v_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9975607036367843, "k_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 128, "5": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 128, "5": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 128, "5": 128 }, "scale_bits": 4 }, "total_bits": 174923264, "v_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9977127474389578, "k_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "total_bits": 175750144, "v_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 } }, { "accuracy": 0.998229216392103, "k_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "total_bits": 179253248, "v_proj": { "bits": [ 5 ], "bits_prop": [ 1 ], "group_size": { "5": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9983826286502575, "k_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 }, "o_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 }, "q_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 }, "total_bits": 181592064, "v_proj": { "bits": [ 5 ], "bits_prop": [ 1 ], "group_size": { "5": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9990248029169283, "k_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 128, "6": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 128, "6": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 128, "6": 128 }, "scale_bits": 4 }, "total_bits": 220469248, "v_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9991625051357245, "k_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 32, "6": 32 }, "scale_bits": 4 }, "o_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 32, "6": 32 }, "scale_bits": 4 }, "q_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 32, "6": 32 }, "scale_bits": 4 }, "total_bits": 223535104, "v_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 32 }, "scale_bits": 4 } }, { "accuracy": 0.99925824274358, "k_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 }, "total_bits": 253499392, "v_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9995899818543541, "k_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 32 }, "scale_bits": 4 }, "o_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 32 }, "scale_bits": 4 }, "q_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 32 }, "scale_bits": 4 }, "total_bits": 265838592, "v_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9997508915043191, "k_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "total_bits": 337385472, "v_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 } } ], "model.layers.24.mlp": [ { "accuracy": 0.9876262412259453, "down_proj": { "bits": [ 6, 3, 2 ], "bits_prop": [ 0.05, 0.2, 0.75 ], "group_size": { "2": 64, "3": 64, "6": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 395461696, "up_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9878866217638317, "down_proj": { "bits": [ 6, 3, 2 ], "bits_prop": [ 0.05, 0.2, 0.75 ], "group_size": { "2": 64, "3": 64, "6": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 409224256, "up_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.989540525172886, "down_proj": { "bits": [ 5, 3 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "3": 32, "5": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 457272320, "up_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.3, 0.7 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9900428417481875, "down_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 512977920, "up_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.3, 0.7 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9936250436462855, "down_proj": { "bits": [ 8, 4, 3 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "3": 128, "4": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "total_bits": 578397280, "up_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9941586612870819, "down_proj": { "bits": [ 8, 4, 3 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "3": 32, "4": 32, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 32, "4": 32 }, "scale_bits": 4 }, "total_bits": 592872448, "up_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "3": 32, "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9949140325188637, "down_proj": { "bits": [ 8, 4 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "4": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 32, "4": 32 }, "scale_bits": 4 }, "total_bits": 637454432, "up_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "3": 32, "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9966689669772199, "down_proj": { "bits": [ 8, 4 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "4": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "total_bits": 728741472, "up_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9970015238382315, "down_proj": { "bits": [ 8, 4 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "4": 32, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 }, "total_bits": 739476480, "up_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9967169008756939, "down_proj": { "bits": [ 8, 5, 4 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "4": 128, "5": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 128, "5": 128 }, "scale_bits": 4 }, "total_bits": 751543392, "up_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "4": 128, "5": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9971424143173193, "down_proj": { "bits": [ 8, 5, 4 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "4": 32, "5": 32, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 }, "total_bits": 766018560, "up_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 } }, { "accuracy": 0.998300920191564, "down_proj": { "bits": [ 8, 6, 5 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "5": 128, "6": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 128, "6": 128 }, "scale_bits": 4 }, "total_bits": 924689504, "up_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "5": 128, "6": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9985513763600274, "down_proj": { "bits": [ 8, 6, 5 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "5": 32, "6": 32, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 32, "6": 32 }, "scale_bits": 4 }, "total_bits": 939164672, "up_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "5": 32, "6": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9990595538953417, "down_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "6": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 }, "total_bits": 1069524064, "up_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9991081193285553, "down_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.15, 0.85 ], "group_size": { "6": 128, "8": 128 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "6": 128, "8": 128 }, "scale_bits": 4 }, "total_bits": 1110384896, "up_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "6": 128, "8": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9992492648429776, "down_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "6": 128, "8": 128 }, "scale_bits": 4 }, "total_bits": 1209999616, "up_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "6": 128, "8": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9996957090732298, "down_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "total_bits": 1415520512, "up_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 } } ], "model.layers.24.self_attn": [ { "accuracy": 0.9889004983400044, "k_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 89665536, "v_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9894250113713113, "k_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 92221440, "v_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9919391415621105, "k_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 95758848, "v_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9937304446571752, "k_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 112272384, "v_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9944762230703705, "k_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "total_bits": 132913152, "v_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9946464578572073, "k_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "total_bits": 132980224, "v_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 64, "4": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9969530287933978, "k_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "total_bits": 169613312, "v_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9971033866076093, "k_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "total_bits": 169745920, "v_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 64 }, "scale_bits": 4 } }, { "accuracy": 0.997318610745041, "k_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 64 }, "scale_bits": 4 }, "total_bits": 171195392, "v_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9974069265942824, "k_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 }, "total_bits": 173563904, "v_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9973535418118301, "k_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 128, "5": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 128, "5": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 128, "5": 128 }, "scale_bits": 4 }, "total_bits": 174923264, "v_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 } }, { "accuracy": 0.997522447454302, "k_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "total_bits": 175750144, "v_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9980449217714762, "k_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "total_bits": 179253248, "v_proj": { "bits": [ 5 ], "bits_prop": [ 1 ], "group_size": { "5": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9981900506505841, "k_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 }, "o_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 }, "q_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 }, "total_bits": 181592064, "v_proj": { "bits": [ 5 ], "bits_prop": [ 1 ], "group_size": { "5": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9989118587813879, "k_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 128, "6": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 128, "6": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 128, "6": 128 }, "scale_bits": 4 }, "total_bits": 220469248, "v_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9990766208226743, "k_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 32, "6": 32 }, "scale_bits": 4 }, "o_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 32, "6": 32 }, "scale_bits": 4 }, "q_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 32, "6": 32 }, "scale_bits": 4 }, "total_bits": 223535104, "v_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9991921051650455, "k_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 }, "total_bits": 253499392, "v_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9995352733684214, "k_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 32 }, "scale_bits": 4 }, "o_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 32 }, "scale_bits": 4 }, "q_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 32 }, "scale_bits": 4 }, "total_bits": 265838592, "v_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9997263715455407, "k_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "total_bits": 337385472, "v_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 } } ], "model.layers.25.mlp": [ { "accuracy": 0.9867914742545077, "down_proj": { "bits": [ 6, 3, 2 ], "bits_prop": [ 0.05, 0.2, 0.75 ], "group_size": { "2": 64, "3": 64, "6": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 395461696, "up_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9870394382037615, "down_proj": { "bits": [ 6, 3, 2 ], "bits_prop": [ 0.05, 0.2, 0.75 ], "group_size": { "2": 64, "3": 64, "6": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 409224256, "up_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9890362439971221, "down_proj": { "bits": [ 5, 3 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "3": 32, "5": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 457272320, "up_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.3, 0.7 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9897196057595705, "down_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 512977920, "up_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.3, 0.7 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9931248332324781, "down_proj": { "bits": [ 8, 4, 3 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "3": 128, "4": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "total_bits": 578397280, "up_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9936614875730715, "down_proj": { "bits": [ 8, 4, 3 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "3": 32, "4": 32, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 32, "4": 32 }, "scale_bits": 4 }, "total_bits": 592872448, "up_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "3": 32, "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9946174872548956, "down_proj": { "bits": [ 8, 4 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "4": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 32, "4": 32 }, "scale_bits": 4 }, "total_bits": 637454432, "up_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "3": 32, "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9963529427584848, "down_proj": { "bits": [ 8, 4 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "4": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "total_bits": 728741472, "up_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9967212028017169, "down_proj": { "bits": [ 8, 4 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "4": 32, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 }, "total_bits": 739476480, "up_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9964555027453523, "down_proj": { "bits": [ 8, 5, 4 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "4": 128, "5": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 128, "5": 128 }, "scale_bits": 4 }, "total_bits": 751543392, "up_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "4": 128, "5": 128 }, "scale_bits": 4 } }, { "accuracy": 0.996896356540291, "down_proj": { "bits": [ 8, 5, 4 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "4": 32, "5": 32, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 }, "total_bits": 766018560, "up_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9981637004958955, "down_proj": { "bits": [ 8, 6, 5 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "5": 128, "6": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 128, "6": 128 }, "scale_bits": 4 }, "total_bits": 924689504, "up_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "5": 128, "6": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9984223748508253, "down_proj": { "bits": [ 8, 6, 5 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "5": 32, "6": 32, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 32, "6": 32 }, "scale_bits": 4 }, "total_bits": 939164672, "up_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "5": 32, "6": 32 }, "scale_bits": 4 } }, { "accuracy": 0.998972020259029, "down_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "6": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 }, "total_bits": 1069524064, "up_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9990320825263074, "down_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.15, 0.85 ], "group_size": { "6": 128, "8": 128 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "6": 128, "8": 128 }, "scale_bits": 4 }, "total_bits": 1110384896, "up_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "6": 128, "8": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9992111722301495, "down_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "6": 128, "8": 128 }, "scale_bits": 4 }, "total_bits": 1209999616, "up_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "6": 128, "8": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9996593787677979, "down_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "total_bits": 1415520512, "up_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 } } ], "model.layers.25.self_attn": [ { "accuracy": 0.9889322848696458, "k_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 89665536, "v_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.989354448883157, "k_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 92221440, "v_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9915782542605149, "k_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 95758848, "v_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9934531109113443, "k_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 112272384, "v_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 } }, { "accuracy": 0.994444990628644, "k_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "total_bits": 132913152, "v_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9945628133259321, "k_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "total_bits": 132980224, "v_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 64, "4": 64 }, "scale_bits": 4 } }, { "accuracy": 0.996883143719874, "k_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "total_bits": 169613312, "v_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9970096026204134, "k_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "total_bits": 169745920, "v_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 64 }, "scale_bits": 4 } }, { "accuracy": 0.99734486325791, "k_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 64 }, "scale_bits": 4 }, "total_bits": 171195392, "v_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9974712286340562, "k_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 }, "total_bits": 173563904, "v_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9973644486775524, "k_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 128, "5": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 128, "5": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 128, "5": 128 }, "scale_bits": 4 }, "total_bits": 174923264, "v_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9975786891422773, "k_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "total_bits": 175750144, "v_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9980155841300362, "k_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "total_bits": 179253248, "v_proj": { "bits": [ 5 ], "bits_prop": [ 1 ], "group_size": { "5": 64 }, "scale_bits": 4 } }, { "accuracy": 0.998178350886232, "k_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 }, "o_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 }, "q_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 }, "total_bits": 181592064, "v_proj": { "bits": [ 5 ], "bits_prop": [ 1 ], "group_size": { "5": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9988944959875784, "k_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 128, "6": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 128, "6": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 128, "6": 128 }, "scale_bits": 4 }, "total_bits": 220469248, "v_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9990634850569462, "k_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 32, "6": 32 }, "scale_bits": 4 }, "o_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 32, "6": 32 }, "scale_bits": 4 }, "q_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 32, "6": 32 }, "scale_bits": 4 }, "total_bits": 223535104, "v_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9992008841057357, "k_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 }, "total_bits": 253499392, "v_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9995169374895724, "k_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 32 }, "scale_bits": 4 }, "o_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 32 }, "scale_bits": 4 }, "q_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 32 }, "scale_bits": 4 }, "total_bits": 265838592, "v_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 32 }, "scale_bits": 4 } }, { "accuracy": 0.999720014019036, "k_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "total_bits": 337385472, "v_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 } } ], "model.layers.26.mlp": [ { "accuracy": 0.9874094991307509, "down_proj": { "bits": [ 6, 3, 2 ], "bits_prop": [ 0.05, 0.2, 0.75 ], "group_size": { "2": 64, "3": 64, "6": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 395461696, "up_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9876729430336701, "down_proj": { "bits": [ 6, 3, 2 ], "bits_prop": [ 0.05, 0.2, 0.75 ], "group_size": { "2": 64, "3": 64, "6": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 409224256, "up_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9892878414768922, "down_proj": { "bits": [ 5, 3 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "3": 32, "5": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 457272320, "up_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.3, 0.7 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.989801434309859, "down_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 512977920, "up_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.3, 0.7 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9935056555428003, "down_proj": { "bits": [ 8, 4, 3 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "3": 128, "4": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "total_bits": 578397280, "up_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9940243567291059, "down_proj": { "bits": [ 8, 4, 3 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "3": 32, "4": 32, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 32, "4": 32 }, "scale_bits": 4 }, "total_bits": 592872448, "up_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "3": 32, "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9947637190159998, "down_proj": { "bits": [ 8, 4 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "4": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 32, "4": 32 }, "scale_bits": 4 }, "total_bits": 637454432, "up_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "3": 32, "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.996604647291334, "down_proj": { "bits": [ 8, 4 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "4": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "total_bits": 728741472, "up_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9969235856674219, "down_proj": { "bits": [ 8, 4 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "4": 32, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 }, "total_bits": 739476480, "up_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.996662786132411, "down_proj": { "bits": [ 8, 5, 4 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "4": 128, "5": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 128, "5": 128 }, "scale_bits": 4 }, "total_bits": 751543392, "up_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "4": 128, "5": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9970723688602448, "down_proj": { "bits": [ 8, 5, 4 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "4": 32, "5": 32, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 }, "total_bits": 766018560, "up_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9982679388240764, "down_proj": { "bits": [ 8, 6, 5 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "5": 128, "6": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 128, "6": 128 }, "scale_bits": 4 }, "total_bits": 924689504, "up_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "5": 128, "6": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9985119797485439, "down_proj": { "bits": [ 8, 6, 5 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "5": 32, "6": 32, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 32, "6": 32 }, "scale_bits": 4 }, "total_bits": 939164672, "up_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "5": 32, "6": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9990383122900599, "down_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "6": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 }, "total_bits": 1069524064, "up_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9990857369021365, "down_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.15, 0.85 ], "group_size": { "6": 128, "8": 128 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "6": 128, "8": 128 }, "scale_bits": 4 }, "total_bits": 1110384896, "up_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "6": 128, "8": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9992244748496696, "down_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "6": 128, "8": 128 }, "scale_bits": 4 }, "total_bits": 1209999616, "up_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "6": 128, "8": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9996854557508701, "down_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "total_bits": 1415520512, "up_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 } } ], "model.layers.26.self_attn": [ { "accuracy": 0.9893747975951747, "k_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 89665536, "v_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9897651044945968, "k_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 92221440, "v_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9919730417038265, "k_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 95758848, "v_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9936749150878504, "k_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 112272384, "v_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9946892414438097, "k_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "total_bits": 132913152, "v_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9948024565452024, "k_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "total_bits": 132980224, "v_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 64, "4": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9971732505057987, "k_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "total_bits": 169613312, "v_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9973052781271307, "k_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "total_bits": 169745920, "v_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9974946809050284, "k_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 64 }, "scale_bits": 4 }, "total_bits": 171195392, "v_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9975950008160189, "k_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 }, "total_bits": 173563904, "v_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9974322250406993, "k_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 128, "5": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 128, "5": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 128, "5": 128 }, "scale_bits": 4 }, "total_bits": 174923264, "v_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9976400099694729, "k_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "total_bits": 175750144, "v_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9981008197524046, "k_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "total_bits": 179253248, "v_proj": { "bits": [ 5 ], "bits_prop": [ 1 ], "group_size": { "5": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9982342931785082, "k_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 }, "o_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 }, "q_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 }, "total_bits": 181592064, "v_proj": { "bits": [ 5 ], "bits_prop": [ 1 ], "group_size": { "5": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9989371346799951, "k_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 128, "6": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 128, "6": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 128, "6": 128 }, "scale_bits": 4 }, "total_bits": 220469248, "v_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9990891254457989, "k_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 32, "6": 32 }, "scale_bits": 4 }, "o_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 32, "6": 32 }, "scale_bits": 4 }, "q_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 32, "6": 32 }, "scale_bits": 4 }, "total_bits": 223535104, "v_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9992474572438943, "k_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 }, "total_bits": 253499392, "v_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 } }, { "accuracy": 0.999532123488423, "k_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 32 }, "scale_bits": 4 }, "o_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 32 }, "scale_bits": 4 }, "q_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 32 }, "scale_bits": 4 }, "total_bits": 265838592, "v_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9997385522399685, "k_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "total_bits": 337385472, "v_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 } } ], "model.layers.27.mlp": [ { "accuracy": 0.9867934286594391, "down_proj": { "bits": [ 6, 3, 2 ], "bits_prop": [ 0.05, 0.2, 0.75 ], "group_size": { "2": 64, "3": 64, "6": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 395461696, "up_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9870269008372959, "down_proj": { "bits": [ 6, 3, 2 ], "bits_prop": [ 0.05, 0.2, 0.75 ], "group_size": { "2": 64, "3": 64, "6": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 409224256, "up_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9888405909663752, "down_proj": { "bits": [ 5, 3 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "3": 32, "5": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 457272320, "up_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.3, 0.7 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9894501355133558, "down_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 512977920, "up_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.3, 0.7 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9931435020346391, "down_proj": { "bits": [ 8, 4, 3 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "3": 128, "4": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "total_bits": 578397280, "up_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9937108723740828, "down_proj": { "bits": [ 8, 4, 3 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "3": 32, "4": 32, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 32, "4": 32 }, "scale_bits": 4 }, "total_bits": 592872448, "up_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "3": 32, "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9945699384337977, "down_proj": { "bits": [ 8, 4 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "4": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 32, "4": 32 }, "scale_bits": 4 }, "total_bits": 637454432, "up_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "3": 32, "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9963803259949935, "down_proj": { "bits": [ 8, 4 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "4": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "total_bits": 728741472, "up_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9967450097595391, "down_proj": { "bits": [ 8, 4 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "4": 32, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 }, "total_bits": 739476480, "up_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9964600232870955, "down_proj": { "bits": [ 8, 5, 4 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "4": 128, "5": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 128, "5": 128 }, "scale_bits": 4 }, "total_bits": 751543392, "up_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "4": 128, "5": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9969066275577796, "down_proj": { "bits": [ 8, 5, 4 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "4": 32, "5": 32, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 }, "total_bits": 766018560, "up_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9981600971598374, "down_proj": { "bits": [ 8, 6, 5 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "5": 128, "6": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 128, "6": 128 }, "scale_bits": 4 }, "total_bits": 924689504, "up_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "5": 128, "6": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9984266959915036, "down_proj": { "bits": [ 8, 6, 5 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "5": 32, "6": 32, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 32, "6": 32 }, "scale_bits": 4 }, "total_bits": 939164672, "up_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "5": 32, "6": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9989679992002877, "down_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "6": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 }, "total_bits": 1069524064, "up_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9990223592245265, "down_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.15, 0.85 ], "group_size": { "6": 128, "8": 128 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "6": 128, "8": 128 }, "scale_bits": 4 }, "total_bits": 1110384896, "up_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "6": 128, "8": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9991831183433533, "down_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "6": 128, "8": 128 }, "scale_bits": 4 }, "total_bits": 1209999616, "up_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "6": 128, "8": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9996603666804731, "down_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "total_bits": 1415520512, "up_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 } } ], "model.layers.27.self_attn": [ { "accuracy": 0.9891316302512821, "k_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 89665536, "v_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9895264804363251, "k_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 92221440, "v_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9915416381861034, "k_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 95758848, "v_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9934334786314714, "k_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 112272384, "v_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9945509527858934, "k_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "total_bits": 132913152, "v_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9946090261402883, "k_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "total_bits": 132980224, "v_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 64, "4": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9969463301332373, "k_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "total_bits": 169613312, "v_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9970701387838313, "k_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "total_bits": 169745920, "v_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9972767286786908, "k_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 64 }, "scale_bits": 4 }, "total_bits": 171195392, "v_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9974570301802534, "k_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 }, "total_bits": 173563904, "v_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9973444105371049, "k_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 128, "5": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 128, "5": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 128, "5": 128 }, "scale_bits": 4 }, "total_bits": 174923264, "v_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9975327996439055, "k_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "total_bits": 175750144, "v_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9979307784845954, "k_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "total_bits": 179253248, "v_proj": { "bits": [ 5 ], "bits_prop": [ 1 ], "group_size": { "5": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9981030317905702, "k_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 }, "o_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 }, "q_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 }, "total_bits": 181592064, "v_proj": { "bits": [ 5 ], "bits_prop": [ 1 ], "group_size": { "5": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9988635364723834, "k_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 128, "6": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 128, "6": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 128, "6": 128 }, "scale_bits": 4 }, "total_bits": 220469248, "v_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9990314663828987, "k_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 32, "6": 32 }, "scale_bits": 4 }, "o_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 32, "6": 32 }, "scale_bits": 4 }, "q_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 32, "6": 32 }, "scale_bits": 4 }, "total_bits": 223535104, "v_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9991998994036725, "k_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 }, "total_bits": 253499392, "v_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9994899867788741, "k_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 32 }, "scale_bits": 4 }, "o_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 32 }, "scale_bits": 4 }, "q_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 32 }, "scale_bits": 4 }, "total_bits": 265838592, "v_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9997191210522464, "k_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "total_bits": 337385472, "v_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 } } ], "model.layers.28.mlp": [ { "accuracy": 0.986006802634189, "down_proj": { "bits": [ 6, 3, 2 ], "bits_prop": [ 0.05, 0.2, 0.75 ], "group_size": { "2": 64, "3": 64, "6": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 395461696, "up_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9863024181441257, "down_proj": { "bits": [ 6, 3, 2 ], "bits_prop": [ 0.05, 0.2, 0.75 ], "group_size": { "2": 64, "3": 64, "6": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 409224256, "up_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9881081094867304, "down_proj": { "bits": [ 5, 3 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "3": 32, "5": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 457272320, "up_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.3, 0.7 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9886849350050876, "down_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 512977920, "up_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.3, 0.7 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9928124554847416, "down_proj": { "bits": [ 8, 4, 3 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "3": 128, "4": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "total_bits": 578397280, "up_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9933893868797704, "down_proj": { "bits": [ 8, 4, 3 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "3": 32, "4": 32, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 32, "4": 32 }, "scale_bits": 4 }, "total_bits": 592872448, "up_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "3": 32, "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.994210516151629, "down_proj": { "bits": [ 8, 4 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "4": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 32, "4": 32 }, "scale_bits": 4 }, "total_bits": 637454432, "up_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "3": 32, "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9962253437230462, "down_proj": { "bits": [ 8, 4 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "4": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "total_bits": 728741472, "up_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9965993977690998, "down_proj": { "bits": [ 8, 4 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "4": 32, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 }, "total_bits": 739476480, "up_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9962935737873378, "down_proj": { "bits": [ 8, 5, 4 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "4": 128, "5": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 128, "5": 128 }, "scale_bits": 4 }, "total_bits": 751543392, "up_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "4": 128, "5": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9967654788572538, "down_proj": { "bits": [ 8, 5, 4 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "4": 32, "5": 32, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 }, "total_bits": 766018560, "up_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9980591763007013, "down_proj": { "bits": [ 8, 6, 5 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "5": 128, "6": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 128, "6": 128 }, "scale_bits": 4 }, "total_bits": 924689504, "up_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "5": 128, "6": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9983599318289443, "down_proj": { "bits": [ 8, 6, 5 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "5": 32, "6": 32, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 32, "6": 32 }, "scale_bits": 4 }, "total_bits": 939164672, "up_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "5": 32, "6": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9989282479999881, "down_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "6": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 }, "total_bits": 1069524064, "up_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9989789512596632, "down_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.15, 0.85 ], "group_size": { "6": 128, "8": 128 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "6": 128, "8": 128 }, "scale_bits": 4 }, "total_bits": 1110384896, "up_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "6": 128, "8": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9991323418523136, "down_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "6": 128, "8": 128 }, "scale_bits": 4 }, "total_bits": 1209999616, "up_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "6": 128, "8": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9996578142193979, "down_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "total_bits": 1415520512, "up_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 } } ], "model.layers.28.self_attn": [ { "accuracy": 0.9892925486752862, "k_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 89665536, "v_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9896226619419298, "k_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 92221440, "v_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9915374078248677, "k_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 95758848, "v_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9934218851359267, "k_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 112272384, "v_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9948028976980009, "k_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "total_bits": 132913152, "v_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9948883288000759, "k_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "total_bits": 132980224, "v_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 64, "4": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9972958941208688, "k_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "total_bits": 169613312, "v_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 } }, { "accuracy": 0.997386172413826, "k_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "total_bits": 169745920, "v_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9975303068364921, "k_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 64 }, "scale_bits": 4 }, "total_bits": 171195392, "v_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9976820406552992, "k_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 }, "total_bits": 173563904, "v_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9975386146259936, "k_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 128, "5": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 128, "5": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 128, "5": 128 }, "scale_bits": 4 }, "total_bits": 174923264, "v_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9977079141688975, "k_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "total_bits": 175750144, "v_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9980582171364835, "k_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "total_bits": 179253248, "v_proj": { "bits": [ 5 ], "bits_prop": [ 1 ], "group_size": { "5": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9981827653552356, "k_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 }, "o_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 }, "q_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 }, "total_bits": 181592064, "v_proj": { "bits": [ 5 ], "bits_prop": [ 1 ], "group_size": { "5": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9989151631138826, "k_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 128, "6": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 128, "6": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 128, "6": 128 }, "scale_bits": 4 }, "total_bits": 220469248, "v_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9990728112231744, "k_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 32, "6": 32 }, "scale_bits": 4 }, "o_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 32, "6": 32 }, "scale_bits": 4 }, "q_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 32, "6": 32 }, "scale_bits": 4 }, "total_bits": 223535104, "v_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9992702332276263, "k_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 }, "total_bits": 253499392, "v_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 } }, { "accuracy": 0.999509840321384, "k_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 32 }, "scale_bits": 4 }, "o_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 32 }, "scale_bits": 4 }, "q_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 32 }, "scale_bits": 4 }, "total_bits": 265838592, "v_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9997434601628858, "k_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "total_bits": 337385472, "v_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 } } ], "model.layers.29.mlp": [ { "accuracy": 0.984859973192215, "down_proj": { "bits": [ 6, 3, 2 ], "bits_prop": [ 0.05, 0.2, 0.75 ], "group_size": { "2": 64, "3": 64, "6": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 395461696, "up_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9851583022820322, "down_proj": { "bits": [ 6, 3, 2 ], "bits_prop": [ 0.05, 0.2, 0.75 ], "group_size": { "2": 64, "3": 64, "6": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 409224256, "up_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.98733772494291, "down_proj": { "bits": [ 5, 3 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "3": 32, "5": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 457272320, "up_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.3, 0.7 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9880524324743372, "down_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 512977920, "up_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.3, 0.7 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9922217734550175, "down_proj": { "bits": [ 8, 4, 3 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "3": 128, "4": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "total_bits": 578397280, "up_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9928152851368252, "down_proj": { "bits": [ 8, 4, 3 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "3": 32, "4": 32, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 32, "4": 32 }, "scale_bits": 4 }, "total_bits": 592872448, "up_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "3": 32, "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9938149679648248, "down_proj": { "bits": [ 8, 4 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "4": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 32, "4": 32 }, "scale_bits": 4 }, "total_bits": 637454432, "up_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "3": 32, "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9959180394285604, "down_proj": { "bits": [ 8, 4 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "4": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "total_bits": 728741472, "up_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9963001318668064, "down_proj": { "bits": [ 8, 4 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "4": 32, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 }, "total_bits": 739476480, "up_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9960009828209877, "down_proj": { "bits": [ 8, 5, 4 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "4": 128, "5": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 128, "5": 128 }, "scale_bits": 4 }, "total_bits": 751543392, "up_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "4": 128, "5": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9964871826140504, "down_proj": { "bits": [ 8, 5, 4 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "4": 32, "5": 32, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 }, "total_bits": 766018560, "up_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9979332958004976, "down_proj": { "bits": [ 8, 6, 5 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "5": 128, "6": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 128, "6": 128 }, "scale_bits": 4 }, "total_bits": 924689504, "up_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "5": 128, "6": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9982176774034375, "down_proj": { "bits": [ 8, 6, 5 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "5": 32, "6": 32, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 32, "6": 32 }, "scale_bits": 4 }, "total_bits": 939164672, "up_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "5": 32, "6": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9988469638322529, "down_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "6": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 }, "total_bits": 1069524064, "up_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9989121228848633, "down_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.15, 0.85 ], "group_size": { "6": 128, "8": 128 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "6": 128, "8": 128 }, "scale_bits": 4 }, "total_bits": 1110384896, "up_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "6": 128, "8": 128 }, "scale_bits": 4 } }, { "accuracy": 0.999104205322893, "down_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "6": 128, "8": 128 }, "scale_bits": 4 }, "total_bits": 1209999616, "up_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "6": 128, "8": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9996283762156963, "down_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "total_bits": 1415520512, "up_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 } } ], "model.layers.29.self_attn": [ { "accuracy": 0.990615156136061, "k_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 89665536, "v_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9910636638340197, "k_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 92221440, "v_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9928124907769655, "k_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 95758848, "v_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9942561423307971, "k_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 112272384, "v_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9952715917637474, "k_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "total_bits": 132913152, "v_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9954988878024252, "k_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "total_bits": 132980224, "v_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 64, "4": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9976028494144741, "k_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "total_bits": 169613312, "v_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9977262563219196, "k_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "total_bits": 169745920, "v_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9978799080770266, "k_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 64 }, "scale_bits": 4 }, "total_bits": 171195392, "v_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.99796301793111, "k_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 }, "total_bits": 173563904, "v_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9978484229037636, "k_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 128, "5": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 128, "5": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 128, "5": 128 }, "scale_bits": 4 }, "total_bits": 174923264, "v_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9980133528772154, "k_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "total_bits": 175750144, "v_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 } }, { "accuracy": 0.998335707148439, "k_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "total_bits": 179253248, "v_proj": { "bits": [ 5 ], "bits_prop": [ 1 ], "group_size": { "5": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9984769432952529, "k_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 }, "o_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 }, "q_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 }, "total_bits": 181592064, "v_proj": { "bits": [ 5 ], "bits_prop": [ 1 ], "group_size": { "5": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9990790280464449, "k_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 128, "6": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 128, "6": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 128, "6": 128 }, "scale_bits": 4 }, "total_bits": 220469248, "v_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9992035727849916, "k_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 32, "6": 32 }, "scale_bits": 4 }, "o_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 32, "6": 32 }, "scale_bits": 4 }, "q_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 32, "6": 32 }, "scale_bits": 4 }, "total_bits": 223535104, "v_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9993591597303748, "k_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 }, "total_bits": 253499392, "v_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9995744312182069, "k_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 32 }, "scale_bits": 4 }, "o_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 32 }, "scale_bits": 4 }, "q_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 32 }, "scale_bits": 4 }, "total_bits": 265838592, "v_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 32 }, "scale_bits": 4 } }, { "accuracy": 0.999765266958428, "k_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "total_bits": 337385472, "v_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 } } ], "model.layers.3.mlp": [ { "accuracy": 0.9660069879732633, "down_proj": { "bits": [ 6, 3, 2 ], "bits_prop": [ 0.05, 0.2, 0.75 ], "group_size": { "2": 64, "3": 64, "6": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 395461696, "up_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9667053850073564, "down_proj": { "bits": [ 6, 3, 2 ], "bits_prop": [ 0.05, 0.2, 0.75 ], "group_size": { "2": 64, "3": 64, "6": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 409224256, "up_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9721953712011638, "down_proj": { "bits": [ 5, 3 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "3": 32, "5": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 457272320, "up_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.3, 0.7 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9738085269927979, "down_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 512977920, "up_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.3, 0.7 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9826900457081041, "down_proj": { "bits": [ 8, 4, 3 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "3": 128, "4": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "total_bits": 578397280, "up_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9841014585996929, "down_proj": { "bits": [ 8, 4, 3 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "3": 32, "4": 32, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 32, "4": 32 }, "scale_bits": 4 }, "total_bits": 592872448, "up_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "3": 32, "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9864911656630667, "down_proj": { "bits": [ 8, 4 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "4": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 32, "4": 32 }, "scale_bits": 4 }, "total_bits": 637454432, "up_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "3": 32, "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9910356888645574, "down_proj": { "bits": [ 8, 4 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "4": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "total_bits": 728741472, "up_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9918867035915977, "down_proj": { "bits": [ 8, 4 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "4": 32, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 }, "total_bits": 739476480, "up_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9911350152994457, "down_proj": { "bits": [ 8, 5, 4 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "4": 128, "5": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 128, "5": 128 }, "scale_bits": 4 }, "total_bits": 751543392, "up_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "4": 128, "5": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9922410100698471, "down_proj": { "bits": [ 8, 5, 4 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "4": 32, "5": 32, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 }, "total_bits": 766018560, "up_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9954543235270601, "down_proj": { "bits": [ 8, 6, 5 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "5": 128, "6": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 128, "6": 128 }, "scale_bits": 4 }, "total_bits": 924689504, "up_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "5": 128, "6": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9961194980301356, "down_proj": { "bits": [ 8, 6, 5 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "5": 32, "6": 32, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 32, "6": 32 }, "scale_bits": 4 }, "total_bits": 939164672, "up_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "5": 32, "6": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9975606614821836, "down_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "6": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 }, "total_bits": 1069524064, "up_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9976695856373561, "down_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.15, 0.85 ], "group_size": { "6": 128, "8": 128 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "6": 128, "8": 128 }, "scale_bits": 4 }, "total_bits": 1110384896, "up_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "6": 128, "8": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9981595095443098, "down_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "6": 128, "8": 128 }, "scale_bits": 4 }, "total_bits": 1209999616, "up_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "6": 128, "8": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9993202167710191, "down_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "total_bits": 1415520512, "up_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 } } ], "model.layers.3.self_attn": [ { "accuracy": 0.9411274947618183, "k_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 89665536, "v_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9435727470799496, "k_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 92221440, "v_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9544082001635903, "k_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 95758848, "v_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9700790518208554, "k_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 112272384, "v_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 } }, { "accuracy": 0.970873584872798, "k_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "total_bits": 132913152, "v_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9712647387855932, "k_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "total_bits": 132980224, "v_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 64, "4": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9842720000367415, "k_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "total_bits": 169613312, "v_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9847273167810942, "k_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "total_bits": 169745920, "v_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9856875460398825, "k_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 64 }, "scale_bits": 4 }, "total_bits": 171195392, "v_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9862778108370932, "k_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 }, "total_bits": 173563904, "v_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9853531043780478, "k_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 128, "5": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 128, "5": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 128, "5": 128 }, "scale_bits": 4 }, "total_bits": 174923264, "v_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9862835328829916, "k_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "total_bits": 175750144, "v_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 } }, { "accuracy": 0.988594095173635, "k_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "total_bits": 179253248, "v_proj": { "bits": [ 5 ], "bits_prop": [ 1 ], "group_size": { "5": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9894368083853471, "k_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 }, "o_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 }, "q_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 }, "total_bits": 181592064, "v_proj": { "bits": [ 5 ], "bits_prop": [ 1 ], "group_size": { "5": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9937564126755062, "k_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 128, "6": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 128, "6": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 128, "6": 128 }, "scale_bits": 4 }, "total_bits": 220469248, "v_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9946811391334784, "k_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 32, "6": 32 }, "scale_bits": 4 }, "o_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 32, "6": 32 }, "scale_bits": 4 }, "q_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 32, "6": 32 }, "scale_bits": 4 }, "total_bits": 223535104, "v_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9958789595647862, "k_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 }, "total_bits": 253499392, "v_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9973987884035236, "k_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 32 }, "scale_bits": 4 }, "o_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 32 }, "scale_bits": 4 }, "q_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 32 }, "scale_bits": 4 }, "total_bits": 265838592, "v_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 32 }, "scale_bits": 4 } }, { "accuracy": 0.998889689088652, "k_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "total_bits": 337385472, "v_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 } } ], "model.layers.30.mlp": [ { "accuracy": 0.9832747217855955, "down_proj": { "bits": [ 6, 3, 2 ], "bits_prop": [ 0.05, 0.2, 0.75 ], "group_size": { "2": 64, "3": 64, "6": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 395461696, "up_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9836342413174478, "down_proj": { "bits": [ 6, 3, 2 ], "bits_prop": [ 0.05, 0.2, 0.75 ], "group_size": { "2": 64, "3": 64, "6": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 409224256, "up_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9859806534491087, "down_proj": { "bits": [ 5, 3 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "3": 32, "5": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 457272320, "up_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.3, 0.7 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9866924521170164, "down_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 512977920, "up_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.3, 0.7 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9915279628414857, "down_proj": { "bits": [ 8, 4, 3 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "3": 128, "4": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "total_bits": 578397280, "up_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9921830633753225, "down_proj": { "bits": [ 8, 4, 3 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "3": 32, "4": 32, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 32, "4": 32 }, "scale_bits": 4 }, "total_bits": 592872448, "up_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "3": 32, "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9932098796493128, "down_proj": { "bits": [ 8, 4 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "4": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 32, "4": 32 }, "scale_bits": 4 }, "total_bits": 637454432, "up_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "3": 32, "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9955972786012449, "down_proj": { "bits": [ 8, 4 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "4": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "total_bits": 728741472, "up_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9959974806559714, "down_proj": { "bits": [ 8, 4 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "4": 32, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 }, "total_bits": 739476480, "up_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9956557138970024, "down_proj": { "bits": [ 8, 5, 4 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "4": 128, "5": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 128, "5": 128 }, "scale_bits": 4 }, "total_bits": 751543392, "up_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "4": 128, "5": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9961921360931898, "down_proj": { "bits": [ 8, 5, 4 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "4": 32, "5": 32, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 }, "total_bits": 766018560, "up_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9977695594884848, "down_proj": { "bits": [ 8, 6, 5 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "5": 128, "6": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 128, "6": 128 }, "scale_bits": 4 }, "total_bits": 924689504, "up_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "5": 128, "6": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9980781121473563, "down_proj": { "bits": [ 8, 6, 5 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "5": 32, "6": 32, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 32, "6": 32 }, "scale_bits": 4 }, "total_bits": 939164672, "up_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "5": 32, "6": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9987699712969755, "down_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "6": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 }, "total_bits": 1069524064, "up_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9988364016539172, "down_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.15, 0.85 ], "group_size": { "6": 128, "8": 128 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "6": 128, "8": 128 }, "scale_bits": 4 }, "total_bits": 1110384896, "up_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "6": 128, "8": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9990390708768054, "down_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "6": 128, "8": 128 }, "scale_bits": 4 }, "total_bits": 1209999616, "up_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "6": 128, "8": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9996149393631831, "down_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "total_bits": 1415520512, "up_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 } } ], "model.layers.30.self_attn": [ { "accuracy": 0.9911998353506389, "k_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 89665536, "v_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9923534503108576, "k_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 92221440, "v_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9937469147537884, "k_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 95758848, "v_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9950852480373884, "k_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 112272384, "v_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9962765974433798, "k_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "total_bits": 132913152, "v_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9963656989367384, "k_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "total_bits": 132980224, "v_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 64, "4": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9979183564060613, "k_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "total_bits": 169613312, "v_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9980221114268428, "k_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "total_bits": 169745920, "v_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9982179550355986, "k_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 64 }, "scale_bits": 4 }, "total_bits": 171195392, "v_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9983034761328446, "k_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 }, "total_bits": 173563904, "v_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9982158973028785, "k_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 128, "5": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 128, "5": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 128, "5": 128 }, "scale_bits": 4 }, "total_bits": 174923264, "v_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9983462867768187, "k_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "total_bits": 175750144, "v_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9985441990980977, "k_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "total_bits": 179253248, "v_proj": { "bits": [ 5 ], "bits_prop": [ 1 ], "group_size": { "5": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9986601197405865, "k_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 }, "o_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 }, "q_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 }, "total_bits": 181592064, "v_proj": { "bits": [ 5 ], "bits_prop": [ 1 ], "group_size": { "5": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9991831005011734, "k_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 128, "6": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 128, "6": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 128, "6": 128 }, "scale_bits": 4 }, "total_bits": 220469248, "v_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 } }, { "accuracy": 0.999299626160217, "k_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 32, "6": 32 }, "scale_bits": 4 }, "o_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 32, "6": 32 }, "scale_bits": 4 }, "q_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 32, "6": 32 }, "scale_bits": 4 }, "total_bits": 223535104, "v_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9994402296939179, "k_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 }, "total_bits": 253499392, "v_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9995934578443044, "k_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 32 }, "scale_bits": 4 }, "o_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 32 }, "scale_bits": 4 }, "q_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 32 }, "scale_bits": 4 }, "total_bits": 265838592, "v_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9997787127075227, "k_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "total_bits": 337385472, "v_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 } } ], "model.layers.31.mlp": [ { "accuracy": 0.9779956654498452, "down_proj": { "bits": [ 6, 3, 2 ], "bits_prop": [ 0.05, 0.2, 0.75 ], "group_size": { "2": 64, "3": 64, "6": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 395461696, "up_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9785450351865668, "down_proj": { "bits": [ 6, 3, 2 ], "bits_prop": [ 0.05, 0.2, 0.75 ], "group_size": { "2": 64, "3": 64, "6": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 409224256, "up_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.982160315701836, "down_proj": { "bits": [ 5, 3 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "3": 32, "5": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 457272320, "up_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.3, 0.7 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9831615419764268, "down_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 512977920, "up_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.3, 0.7 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9899066419977891, "down_proj": { "bits": [ 8, 4, 3 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "3": 128, "4": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "total_bits": 578397280, "up_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9906808671198393, "down_proj": { "bits": [ 8, 4, 3 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "3": 32, "4": 32, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 32, "4": 32 }, "scale_bits": 4 }, "total_bits": 592872448, "up_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "3": 32, "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9920512265280673, "down_proj": { "bits": [ 8, 4 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "4": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 32, "4": 32 }, "scale_bits": 4 }, "total_bits": 637454432, "up_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "3": 32, "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9947460309455269, "down_proj": { "bits": [ 8, 4 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "4": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "total_bits": 728741472, "up_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9952400346335611, "down_proj": { "bits": [ 8, 4 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "4": 32, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 }, "total_bits": 739476480, "up_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9948624584235644, "down_proj": { "bits": [ 8, 5, 4 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "4": 128, "5": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 128, "5": 128 }, "scale_bits": 4 }, "total_bits": 751543392, "up_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "4": 128, "5": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9954920371896342, "down_proj": { "bits": [ 8, 5, 4 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "4": 32, "5": 32, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 }, "total_bits": 766018560, "up_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9973171398435768, "down_proj": { "bits": [ 8, 6, 5 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "5": 128, "6": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 128, "6": 128 }, "scale_bits": 4 }, "total_bits": 924689504, "up_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "5": 128, "6": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9976873091961208, "down_proj": { "bits": [ 8, 6, 5 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "5": 32, "6": 32, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 32, "6": 32 }, "scale_bits": 4 }, "total_bits": 939164672, "up_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "5": 32, "6": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9984779265758238, "down_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "6": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 }, "total_bits": 1069524064, "up_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9985725890452924, "down_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.15, 0.85 ], "group_size": { "6": 128, "8": 128 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "6": 128, "8": 128 }, "scale_bits": 4 }, "total_bits": 1110384896, "up_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "6": 128, "8": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9988628324905509, "down_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "6": 128, "8": 128 }, "scale_bits": 4 }, "total_bits": 1209999616, "up_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "6": 128, "8": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9994804777303025, "down_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "total_bits": 1415520512, "up_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 } } ], "model.layers.31.self_attn": [ { "accuracy": 0.9924349549569582, "k_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 89665536, "v_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9930255852247539, "k_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 92221440, "v_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9942911514326146, "k_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 95758848, "v_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9958426215146717, "k_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 112272384, "v_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 } }, { "accuracy": 0.996810062543342, "k_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "total_bits": 132913152, "v_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9968479936452288, "k_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "total_bits": 132980224, "v_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 64, "4": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9982235857138508, "k_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "total_bits": 169613312, "v_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9982640182501391, "k_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "total_bits": 169745920, "v_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9984072103704277, "k_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 64 }, "scale_bits": 4 }, "total_bits": 171195392, "v_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9985015047223944, "k_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 }, "total_bits": 173563904, "v_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9984170064134034, "k_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 128, "5": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 128, "5": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 128, "5": 128 }, "scale_bits": 4 }, "total_bits": 174923264, "v_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 } }, { "accuracy": 0.998510306995166, "k_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "total_bits": 175750144, "v_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9986458109985841, "k_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "total_bits": 179253248, "v_proj": { "bits": [ 5 ], "bits_prop": [ 1 ], "group_size": { "5": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9987489728159026, "k_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 }, "o_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 }, "q_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 }, "total_bits": 181592064, "v_proj": { "bits": [ 5 ], "bits_prop": [ 1 ], "group_size": { "5": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9992272595041677, "k_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 128, "6": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 128, "6": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 128, "6": 128 }, "scale_bits": 4 }, "total_bits": 220469248, "v_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9993336785976824, "k_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 32, "6": 32 }, "scale_bits": 4 }, "o_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 32, "6": 32 }, "scale_bits": 4 }, "q_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 32, "6": 32 }, "scale_bits": 4 }, "total_bits": 223535104, "v_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9994841281226591, "k_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 }, "total_bits": 253499392, "v_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9996056911339494, "k_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 32 }, "scale_bits": 4 }, "o_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 32 }, "scale_bits": 4 }, "q_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 32 }, "scale_bits": 4 }, "total_bits": 265838592, "v_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9997641041041597, "k_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "total_bits": 337385472, "v_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 } } ], "model.layers.4.mlp": [ { "accuracy": 0.9692652350977847, "down_proj": { "bits": [ 6, 3, 2 ], "bits_prop": [ 0.05, 0.2, 0.75 ], "group_size": { "2": 64, "3": 64, "6": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 395461696, "up_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9698807754014668, "down_proj": { "bits": [ 6, 3, 2 ], "bits_prop": [ 0.05, 0.2, 0.75 ], "group_size": { "2": 64, "3": 64, "6": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 409224256, "up_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9747832605713292, "down_proj": { "bits": [ 5, 3 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "3": 32, "5": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 457272320, "up_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.3, 0.7 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.976217845552846, "down_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 512977920, "up_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.3, 0.7 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9842962434417323, "down_proj": { "bits": [ 8, 4, 3 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "3": 128, "4": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "total_bits": 578397280, "up_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9856173992156982, "down_proj": { "bits": [ 8, 4, 3 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "3": 32, "4": 32, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 32, "4": 32 }, "scale_bits": 4 }, "total_bits": 592872448, "up_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "3": 32, "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9877318410496962, "down_proj": { "bits": [ 8, 4 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "4": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 32, "4": 32 }, "scale_bits": 4 }, "total_bits": 637454432, "up_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "3": 32, "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9918475362815355, "down_proj": { "bits": [ 8, 4 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "4": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "total_bits": 728741472, "up_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9926309295390782, "down_proj": { "bits": [ 8, 4 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "4": 32, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 }, "total_bits": 739476480, "up_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9919330171848598, "down_proj": { "bits": [ 8, 5, 4 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "4": 128, "5": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 128, "5": 128 }, "scale_bits": 4 }, "total_bits": 751543392, "up_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "4": 128, "5": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9929509358970743, "down_proj": { "bits": [ 8, 5, 4 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "4": 32, "5": 32, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 }, "total_bits": 766018560, "up_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9958493478204075, "down_proj": { "bits": [ 8, 6, 5 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "5": 128, "6": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 128, "6": 128 }, "scale_bits": 4 }, "total_bits": 924689504, "up_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "5": 128, "6": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9964668484110581, "down_proj": { "bits": [ 8, 6, 5 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "5": 32, "6": 32, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 32, "6": 32 }, "scale_bits": 4 }, "total_bits": 939164672, "up_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "5": 32, "6": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9977654916675467, "down_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "6": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 }, "total_bits": 1069524064, "up_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9978675258002783, "down_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.15, 0.85 ], "group_size": { "6": 128, "8": 128 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "6": 128, "8": 128 }, "scale_bits": 4 }, "total_bits": 1110384896, "up_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "6": 128, "8": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9983184712105676, "down_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "6": 128, "8": 128 }, "scale_bits": 4 }, "total_bits": 1209999616, "up_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "6": 128, "8": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9993670496011251, "down_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "total_bits": 1415520512, "up_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 } } ], "model.layers.4.self_attn": [ { "accuracy": 0.9596399947216636, "k_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 89665536, "v_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9609555633444535, "k_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 92221440, "v_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.968053516588713, "k_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 95758848, "v_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9795166081503818, "k_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 112272384, "v_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9799944664302626, "k_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "total_bits": 132913152, "v_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 } }, { "accuracy": 0.980242332345561, "k_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "total_bits": 132980224, "v_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 64, "4": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9892967625668174, "k_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "total_bits": 169613312, "v_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9895691942227515, "k_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "total_bits": 169745920, "v_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 64 }, "scale_bits": 4 } }, { "accuracy": 0.990243441180179, "k_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 64 }, "scale_bits": 4 }, "total_bits": 171195392, "v_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9906637331372813, "k_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 }, "total_bits": 173563904, "v_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9899495400880512, "k_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 128, "5": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 128, "5": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 128, "5": 128 }, "scale_bits": 4 }, "total_bits": 174923264, "v_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9905810905130286, "k_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "total_bits": 175750144, "v_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9920102679415753, "k_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "total_bits": 179253248, "v_proj": { "bits": [ 5 ], "bits_prop": [ 1 ], "group_size": { "5": 64 }, "scale_bits": 4 } }, { "accuracy": 0.992618380408538, "k_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 }, "o_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 }, "q_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 }, "total_bits": 181592064, "v_proj": { "bits": [ 5 ], "bits_prop": [ 1 ], "group_size": { "5": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9956378968138444, "k_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 128, "6": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 128, "6": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 128, "6": 128 }, "scale_bits": 4 }, "total_bits": 220469248, "v_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9962783722501052, "k_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 32, "6": 32 }, "scale_bits": 4 }, "o_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 32, "6": 32 }, "scale_bits": 4 }, "q_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 32, "6": 32 }, "scale_bits": 4 }, "total_bits": 223535104, "v_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9971909634768963, "k_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 }, "total_bits": 253499392, "v_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9981797184599074, "k_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 32 }, "scale_bits": 4 }, "o_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 32 }, "scale_bits": 4 }, "q_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 32 }, "scale_bits": 4 }, "total_bits": 265838592, "v_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9992189338234695, "k_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "total_bits": 337385472, "v_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 } } ], "model.layers.5.mlp": [ { "accuracy": 0.97052600509242, "down_proj": { "bits": [ 6, 3, 2 ], "bits_prop": [ 0.05, 0.2, 0.75 ], "group_size": { "2": 64, "3": 64, "6": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 395461696, "up_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9711648664976421, "down_proj": { "bits": [ 6, 3, 2 ], "bits_prop": [ 0.05, 0.2, 0.75 ], "group_size": { "2": 64, "3": 64, "6": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 409224256, "up_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.97576295231518, "down_proj": { "bits": [ 5, 3 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "3": 32, "5": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 457272320, "up_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.3, 0.7 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9770827858071578, "down_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 512977920, "up_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.3, 0.7 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9850433908010784, "down_proj": { "bits": [ 8, 4, 3 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "3": 128, "4": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "total_bits": 578397280, "up_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9862332657763833, "down_proj": { "bits": [ 8, 4, 3 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "3": 32, "4": 32, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 32, "4": 32 }, "scale_bits": 4 }, "total_bits": 592872448, "up_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "3": 32, "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9881862527445743, "down_proj": { "bits": [ 8, 4 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "4": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 32, "4": 32 }, "scale_bits": 4 }, "total_bits": 637454432, "up_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "3": 32, "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9922158796536295, "down_proj": { "bits": [ 8, 4 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "4": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "total_bits": 728741472, "up_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.992936331190561, "down_proj": { "bits": [ 8, 4 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "4": 32, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 }, "total_bits": 739476480, "up_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9922990273488196, "down_proj": { "bits": [ 8, 5, 4 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "4": 128, "5": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 128, "5": 128 }, "scale_bits": 4 }, "total_bits": 751543392, "up_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "4": 128, "5": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9932518413192347, "down_proj": { "bits": [ 8, 5, 4 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "4": 32, "5": 32, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 }, "total_bits": 766018560, "up_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9960304220256052, "down_proj": { "bits": [ 8, 6, 5 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "5": 128, "6": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 128, "6": 128 }, "scale_bits": 4 }, "total_bits": 924689504, "up_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "5": 128, "6": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9966150573209712, "down_proj": { "bits": [ 8, 6, 5 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "5": 32, "6": 32, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 32, "6": 32 }, "scale_bits": 4 }, "total_bits": 939164672, "up_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "5": 32, "6": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9978609810534277, "down_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "6": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 }, "total_bits": 1069524064, "up_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 } }, { "accuracy": 0.997959379302828, "down_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.15, 0.85 ], "group_size": { "6": 128, "8": 128 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "6": 128, "8": 128 }, "scale_bits": 4 }, "total_bits": 1110384896, "up_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "6": 128, "8": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9983776286244392, "down_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "6": 128, "8": 128 }, "scale_bits": 4 }, "total_bits": 1209999616, "up_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "6": 128, "8": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9993935922454846, "down_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "total_bits": 1415520512, "up_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 } } ], "model.layers.5.self_attn": [ { "accuracy": 0.9655253949918245, "k_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 89665536, "v_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9666899128964073, "k_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 92221440, "v_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.973620803732621, "k_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 95758848, "v_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9824556441683518, "k_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 112272384, "v_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9829565929739099, "k_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "total_bits": 132913152, "v_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9832285375971543, "k_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "total_bits": 132980224, "v_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 64, "4": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9909247748161617, "k_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "total_bits": 169613312, "v_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9911921973291197, "k_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "total_bits": 169745920, "v_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9917657736100649, "k_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 64 }, "scale_bits": 4 }, "total_bits": 171195392, "v_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9920810233605536, "k_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 }, "total_bits": 173563904, "v_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9915041201993039, "k_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 128, "5": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 128, "5": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 128, "5": 128 }, "scale_bits": 4 }, "total_bits": 174923264, "v_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9920296755276228, "k_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "total_bits": 175750144, "v_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9934406962833906, "k_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "total_bits": 179253248, "v_proj": { "bits": [ 5 ], "bits_prop": [ 1 ], "group_size": { "5": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9939269988160384, "k_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 }, "o_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 }, "q_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 }, "total_bits": 181592064, "v_proj": { "bits": [ 5 ], "bits_prop": [ 1 ], "group_size": { "5": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9964218139648438, "k_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 128, "6": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 128, "6": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 128, "6": 128 }, "scale_bits": 4 }, "total_bits": 220469248, "v_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9969419354670926, "k_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 32, "6": 32 }, "scale_bits": 4 }, "o_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 32, "6": 32 }, "scale_bits": 4 }, "q_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 32, "6": 32 }, "scale_bits": 4 }, "total_bits": 223535104, "v_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9976245604063335, "k_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 }, "total_bits": 253499392, "v_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9985208352537531, "k_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 32 }, "scale_bits": 4 }, "o_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 32 }, "scale_bits": 4 }, "q_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 32 }, "scale_bits": 4 }, "total_bits": 265838592, "v_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9993283460406881, "k_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "total_bits": 337385472, "v_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 } } ], "model.layers.6.mlp": [ { "accuracy": 0.9751924103812167, "down_proj": { "bits": [ 6, 3, 2 ], "bits_prop": [ 0.05, 0.2, 0.75 ], "group_size": { "2": 64, "3": 64, "6": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 395461696, "up_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9757431635731145, "down_proj": { "bits": [ 6, 3, 2 ], "bits_prop": [ 0.05, 0.2, 0.75 ], "group_size": { "2": 64, "3": 64, "6": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 409224256, "up_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9796459517980877, "down_proj": { "bits": [ 5, 3 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "3": 32, "5": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 457272320, "up_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.3, 0.7 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9807553087410174, "down_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 512977920, "up_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.3, 0.7 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9874281891082463, "down_proj": { "bits": [ 8, 4, 3 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "3": 128, "4": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "total_bits": 578397280, "up_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9884397599257921, "down_proj": { "bits": [ 8, 4, 3 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "3": 32, "4": 32, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 32, "4": 32 }, "scale_bits": 4 }, "total_bits": 592872448, "up_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "3": 32, "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9901079190404791, "down_proj": { "bits": [ 8, 4 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "4": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 32, "4": 32 }, "scale_bits": 4 }, "total_bits": 637454432, "up_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "3": 32, "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9934718475530022, "down_proj": { "bits": [ 8, 4 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "4": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "total_bits": 728741472, "up_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9940516474215608, "down_proj": { "bits": [ 8, 4 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "4": 32, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 }, "total_bits": 739476480, "up_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.993530726746509, "down_proj": { "bits": [ 8, 5, 4 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "4": 128, "5": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 128, "5": 128 }, "scale_bits": 4 }, "total_bits": 751543392, "up_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "4": 128, "5": 128 }, "scale_bits": 4 } }, { "accuracy": 0.99432449238865, "down_proj": { "bits": [ 8, 5, 4 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "4": 32, "5": 32, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 }, "total_bits": 766018560, "up_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9966698045793333, "down_proj": { "bits": [ 8, 6, 5 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "5": 128, "6": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 128, "6": 128 }, "scale_bits": 4 }, "total_bits": 924689504, "up_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "5": 128, "6": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9971494643311751, "down_proj": { "bits": [ 8, 6, 5 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "5": 32, "6": 32, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 32, "6": 32 }, "scale_bits": 4 }, "total_bits": 939164672, "up_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "5": 32, "6": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9981964918735781, "down_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "6": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 }, "total_bits": 1069524064, "up_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9982801511099464, "down_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.15, 0.85 ], "group_size": { "6": 128, "8": 128 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "6": 128, "8": 128 }, "scale_bits": 4 }, "total_bits": 1110384896, "up_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "6": 128, "8": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9986357627142417, "down_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "6": 128, "8": 128 }, "scale_bits": 4 }, "total_bits": 1209999616, "up_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "6": 128, "8": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9994705211077082, "down_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "total_bits": 1415520512, "up_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 } } ], "model.layers.6.self_attn": [ { "accuracy": 0.9643647764858446, "k_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 89665536, "v_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.965514317939156, "k_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 92221440, "v_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9725214148822584, "k_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 95758848, "v_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9819346932988418, "k_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 112272384, "v_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9823814881475348, "k_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "total_bits": 132913152, "v_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 } }, { "accuracy": 0.982659754000212, "k_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "total_bits": 132980224, "v_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 64, "4": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9906184759579206, "k_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "total_bits": 169613312, "v_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9909015101821799, "k_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "total_bits": 169745920, "v_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9914885092722742, "k_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 64 }, "scale_bits": 4 }, "total_bits": 171195392, "v_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9918134871282076, "k_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 }, "total_bits": 173563904, "v_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9912222788522118, "k_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 128, "5": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 128, "5": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 128, "5": 128 }, "scale_bits": 4 }, "total_bits": 174923264, "v_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9917462052483308, "k_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "total_bits": 175750144, "v_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9931705923456895, "k_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "total_bits": 179253248, "v_proj": { "bits": [ 5 ], "bits_prop": [ 1 ], "group_size": { "5": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9936614856123924, "k_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 }, "o_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 }, "q_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 }, "total_bits": 181592064, "v_proj": { "bits": [ 5 ], "bits_prop": [ 1 ], "group_size": { "5": 32 }, "scale_bits": 4 } }, { "accuracy": 0.996264078115162, "k_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 128, "6": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 128, "6": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 128, "6": 128 }, "scale_bits": 4 }, "total_bits": 220469248, "v_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9968056788570002, "k_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 32, "6": 32 }, "scale_bits": 4 }, "o_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 32, "6": 32 }, "scale_bits": 4 }, "q_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 32, "6": 32 }, "scale_bits": 4 }, "total_bits": 223535104, "v_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9975424304996666, "k_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 }, "total_bits": 253499392, "v_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9984478455429014, "k_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 32 }, "scale_bits": 4 }, "o_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 32 }, "scale_bits": 4 }, "q_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 32 }, "scale_bits": 4 }, "total_bits": 265838592, "v_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9993040693531695, "k_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "total_bits": 337385472, "v_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 } } ], "model.layers.7.mlp": [ { "accuracy": 0.9826737814827969, "down_proj": { "bits": [ 6, 3, 2 ], "bits_prop": [ 0.05, 0.2, 0.75 ], "group_size": { "2": 64, "3": 64, "6": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 395461696, "up_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9831155993436512, "down_proj": { "bits": [ 6, 3, 2 ], "bits_prop": [ 0.05, 0.2, 0.75 ], "group_size": { "2": 64, "3": 64, "6": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 409224256, "up_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.985715389251709, "down_proj": { "bits": [ 5, 3 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "3": 32, "5": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 457272320, "up_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.3, 0.7 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9864209106093959, "down_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 512977920, "up_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.3, 0.7 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9912537179495159, "down_proj": { "bits": [ 8, 4, 3 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "3": 128, "4": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "total_bits": 578397280, "up_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9919771559928593, "down_proj": { "bits": [ 8, 4, 3 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "3": 32, "4": 32, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 32, "4": 32 }, "scale_bits": 4 }, "total_bits": 592872448, "up_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "3": 32, "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9930339706571478, "down_proj": { "bits": [ 8, 4 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "4": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 32, "4": 32 }, "scale_bits": 4 }, "total_bits": 637454432, "up_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "3": 32, "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9954842552542686, "down_proj": { "bits": [ 8, 4 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "4": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "total_bits": 728741472, "up_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.995880400663928, "down_proj": { "bits": [ 8, 4 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "4": 32, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 }, "total_bits": 739476480, "up_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9955058595851848, "down_proj": { "bits": [ 8, 5, 4 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "4": 128, "5": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 128, "5": 128 }, "scale_bits": 4 }, "total_bits": 751543392, "up_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "4": 128, "5": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9960718735268241, "down_proj": { "bits": [ 8, 5, 4 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "4": 32, "5": 32, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 }, "total_bits": 766018560, "up_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9976840479985664, "down_proj": { "bits": [ 8, 6, 5 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "5": 128, "6": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 128, "6": 128 }, "scale_bits": 4 }, "total_bits": 924689504, "up_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "5": 128, "6": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9980265833437443, "down_proj": { "bits": [ 8, 6, 5 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "5": 32, "6": 32, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 32, "6": 32 }, "scale_bits": 4 }, "total_bits": 939164672, "up_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "5": 32, "6": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9987417961421766, "down_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "6": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 }, "total_bits": 1069524064, "up_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9987953708164001, "down_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.15, 0.85 ], "group_size": { "6": 128, "8": 128 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "6": 128, "8": 128 }, "scale_bits": 4 }, "total_bits": 1110384896, "up_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "6": 128, "8": 128 }, "scale_bits": 4 } }, { "accuracy": 0.999017917992253, "down_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "6": 128, "8": 128 }, "scale_bits": 4 }, "total_bits": 1209999616, "up_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "6": 128, "8": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9996151844235627, "down_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "total_bits": 1415520512, "up_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 } } ], "model.layers.7.self_attn": [ { "accuracy": 0.9687355662647047, "k_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 89665536, "v_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9698032234844408, "k_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 92221440, "v_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9760464649451407, "k_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 95758848, "v_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9840364142468101, "k_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 112272384, "v_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9844947174975747, "k_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "total_bits": 132913152, "v_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9847554188025626, "k_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "total_bits": 132980224, "v_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 64, "4": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9917424187848443, "k_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "total_bits": 169613312, "v_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9919972129558262, "k_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "total_bits": 169745920, "v_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9924897473109396, "k_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 64 }, "scale_bits": 4 }, "total_bits": 171195392, "v_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9927802815249092, "k_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 }, "total_bits": 173563904, "v_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9922616066117036, "k_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 128, "5": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 128, "5": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 128, "5": 128 }, "scale_bits": 4 }, "total_bits": 174923264, "v_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9927253864313427, "k_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "total_bits": 175750144, "v_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9940077489928195, "k_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "total_bits": 179253248, "v_proj": { "bits": [ 5 ], "bits_prop": [ 1 ], "group_size": { "5": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9944389462471008, "k_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 }, "o_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 }, "q_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 }, "total_bits": 181592064, "v_proj": { "bits": [ 5 ], "bits_prop": [ 1 ], "group_size": { "5": 32 }, "scale_bits": 4 } }, { "accuracy": 0.996710689444291, "k_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 128, "6": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 128, "6": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 128, "6": 128 }, "scale_bits": 4 }, "total_bits": 220469248, "v_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9971844469638247, "k_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 32, "6": 32 }, "scale_bits": 4 }, "o_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 32, "6": 32 }, "scale_bits": 4 }, "q_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 32, "6": 32 }, "scale_bits": 4 }, "total_bits": 223535104, "v_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9978163358020155, "k_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 }, "total_bits": 253499392, "v_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9986242815656098, "k_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 32 }, "scale_bits": 4 }, "o_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 32 }, "scale_bits": 4 }, "q_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 32 }, "scale_bits": 4 }, "total_bits": 265838592, "v_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9993757262924, "k_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "total_bits": 337385472, "v_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 } } ], "model.layers.8.mlp": [ { "accuracy": 0.9819767977062025, "down_proj": { "bits": [ 6, 3, 2 ], "bits_prop": [ 0.05, 0.2, 0.75 ], "group_size": { "2": 64, "3": 64, "6": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 395461696, "up_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9824202468520716, "down_proj": { "bits": [ 6, 3, 2 ], "bits_prop": [ 0.05, 0.2, 0.75 ], "group_size": { "2": 64, "3": 64, "6": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 409224256, "up_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9849714903455031, "down_proj": { "bits": [ 5, 3 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "3": 32, "5": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 457272320, "up_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.3, 0.7 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9856669353811365, "down_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 512977920, "up_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.3, 0.7 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9908808179591831, "down_proj": { "bits": [ 8, 4, 3 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "3": 128, "4": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "total_bits": 578397280, "up_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9916211194113681, "down_proj": { "bits": [ 8, 4, 3 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "3": 32, "4": 32, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 32, "4": 32 }, "scale_bits": 4 }, "total_bits": 592872448, "up_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "3": 32, "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9926731508029135, "down_proj": { "bits": [ 8, 4 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "4": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 32, "4": 32 }, "scale_bits": 4 }, "total_bits": 637454432, "up_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "3": 32, "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9952804195253473, "down_proj": { "bits": [ 8, 4 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "4": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "total_bits": 728741472, "up_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9956920358695482, "down_proj": { "bits": [ 8, 4 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "4": 32, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 }, "total_bits": 739476480, "up_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9953121433132573, "down_proj": { "bits": [ 8, 5, 4 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "4": 128, "5": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 128, "5": 128 }, "scale_bits": 4 }, "total_bits": 751543392, "up_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "4": 128, "5": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9958923682570457, "down_proj": { "bits": [ 8, 5, 4 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "4": 32, "5": 32, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 }, "total_bits": 766018560, "up_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 } }, { "accuracy": 0.997583167137284, "down_proj": { "bits": [ 8, 6, 5 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "5": 128, "6": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 128, "6": 128 }, "scale_bits": 4 }, "total_bits": 924689504, "up_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "5": 128, "6": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9979324238864999, "down_proj": { "bits": [ 8, 6, 5 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "5": 32, "6": 32, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 32, "6": 32 }, "scale_bits": 4 }, "total_bits": 939164672, "up_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "5": 32, "6": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9986886217405921, "down_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "6": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 }, "total_bits": 1069524064, "up_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 } }, { "accuracy": 0.998746572552543, "down_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.15, 0.85 ], "group_size": { "6": 128, "8": 128 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "6": 128, "8": 128 }, "scale_bits": 4 }, "total_bits": 1110384896, "up_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "6": 128, "8": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9989662825276977, "down_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "6": 128, "8": 128 }, "scale_bits": 4 }, "total_bits": 1209999616, "up_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "6": 128, "8": 128 }, "scale_bits": 4 } }, { "accuracy": 0.999601389747113, "down_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "total_bits": 1415520512, "up_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 } } ], "model.layers.8.self_attn": [ { "accuracy": 0.973777069857246, "k_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 89665536, "v_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9746567512813368, "k_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 92221440, "v_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9804581717440957, "k_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 95758848, "v_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9866059516605578, "k_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 112272384, "v_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9869305460076583, "k_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "total_bits": 132913152, "v_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9872038113443475, "k_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "total_bits": 132980224, "v_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 64, "4": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9930051996519691, "k_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "total_bits": 169613312, "v_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9932662076071689, "k_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "total_bits": 169745920, "v_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9937352479288453, "k_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 64 }, "scale_bits": 4 }, "total_bits": 171195392, "v_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9939620357594992, "k_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 }, "total_bits": 173563904, "v_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.993521631940415, "k_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 128, "5": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 128, "5": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 128, "5": 128 }, "scale_bits": 4 }, "total_bits": 174923264, "v_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9939341901948577, "k_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "total_bits": 175750144, "v_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9951368201720087, "k_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "total_bits": 179253248, "v_proj": { "bits": [ 5 ], "bits_prop": [ 1 ], "group_size": { "5": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9955149598811802, "k_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 }, "o_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 }, "q_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 }, "total_bits": 181592064, "v_proj": { "bits": [ 5 ], "bits_prop": [ 1 ], "group_size": { "5": 32 }, "scale_bits": 4 } }, { "accuracy": 0.997320073411653, "k_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 128, "6": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 128, "6": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 128, "6": 128 }, "scale_bits": 4 }, "total_bits": 220469248, "v_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9977280013263226, "k_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 32, "6": 32 }, "scale_bits": 4 }, "o_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 32, "6": 32 }, "scale_bits": 4 }, "q_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 32, "6": 32 }, "scale_bits": 4 }, "total_bits": 223535104, "v_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9981567438103651, "k_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 }, "total_bits": 253499392, "v_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9989011114169108, "k_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 32 }, "scale_bits": 4 }, "o_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 32 }, "scale_bits": 4 }, "q_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 32 }, "scale_bits": 4 }, "total_bits": 265838592, "v_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 32 }, "scale_bits": 4 } }, { "accuracy": 0.999464362908743, "k_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "total_bits": 337385472, "v_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 } } ], "model.layers.9.mlp": [ { "accuracy": 0.9840545732724039, "down_proj": { "bits": [ 6, 3, 2 ], "bits_prop": [ 0.05, 0.2, 0.75 ], "group_size": { "2": 64, "3": 64, "6": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 395461696, "up_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9844386467808172, "down_proj": { "bits": [ 6, 3, 2 ], "bits_prop": [ 0.05, 0.2, 0.75 ], "group_size": { "2": 64, "3": 64, "6": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 409224256, "up_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9867129231754103, "down_proj": { "bits": [ 5, 3 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "3": 32, "5": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 457272320, "up_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.3, 0.7 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9873271827635012, "down_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 512977920, "up_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.3, 0.7 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9919467787993582, "down_proj": { "bits": [ 8, 4, 3 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "3": 128, "4": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "total_bits": 578397280, "up_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9926072280657919, "down_proj": { "bits": [ 8, 4, 3 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "3": 32, "4": 32, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 32, "4": 32 }, "scale_bits": 4 }, "total_bits": 592872448, "up_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "3": 32, "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9935292880001821, "down_proj": { "bits": [ 8, 4 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "4": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 32, "4": 32 }, "scale_bits": 4 }, "total_bits": 637454432, "up_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "3": 32, "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9958454809690777, "down_proj": { "bits": [ 8, 4 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "4": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "total_bits": 728741472, "up_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9962043860240987, "down_proj": { "bits": [ 8, 4 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "4": 32, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 }, "total_bits": 739476480, "up_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9958592355251312, "down_proj": { "bits": [ 8, 5, 4 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "4": 128, "5": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 128, "5": 128 }, "scale_bits": 4 }, "total_bits": 751543392, "up_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "4": 128, "5": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9963758772141055, "down_proj": { "bits": [ 8, 5, 4 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "4": 32, "5": 32, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 }, "total_bits": 766018560, "up_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9978638134504619, "down_proj": { "bits": [ 8, 6, 5 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "5": 128, "6": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 128, "6": 128 }, "scale_bits": 4 }, "total_bits": 924689504, "up_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "5": 128, "6": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9981752653655253, "down_proj": { "bits": [ 8, 6, 5 ], "bits_prop": [ 0.05, 0.1, 0.85 ], "group_size": { "5": 32, "6": 32, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 32, "6": 32 }, "scale_bits": 4 }, "total_bits": 939164672, "up_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "5": 32, "6": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9988399940101724, "down_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "6": 128, "8": 32 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 }, "total_bits": 1069524064, "up_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9988887686478464, "down_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.15, 0.85 ], "group_size": { "6": 128, "8": 128 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "6": 128, "8": 128 }, "scale_bits": 4 }, "total_bits": 1110384896, "up_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "6": 128, "8": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9990804851251213, "down_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "6": 128, "8": 128 }, "scale_bits": 4 }, "total_bits": 1209999616, "up_proj": { "bits": [ 8, 6 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "6": 128, "8": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9996420119055792, "down_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "gate_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "total_bits": 1415520512, "up_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 } } ], "model.layers.9.self_attn": [ { "accuracy": 0.9755286182227888, "k_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 89665536, "v_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.05, 0.95 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9763404287789997, "k_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 92221440, "v_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.25, 0.75 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9821753768544448, "k_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 95758848, "v_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9875498359140596, "k_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 3, 2 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "2": 64, "3": 64 }, "scale_bits": 4 }, "total_bits": 112272384, "v_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9877584811888243, "k_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "total_bits": 132913152, "v_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9879977044306303, "k_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 128, "4": 128 }, "scale_bits": 4 }, "total_bits": 132980224, "v_proj": { "bits": [ 4, 3 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "3": 64, "4": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9934298349054236, "k_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "total_bits": 169613312, "v_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9936664688744044, "k_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 128 }, "scale_bits": 4 }, "total_bits": 169745920, "v_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9941494119794745, "k_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 64 }, "scale_bits": 4 }, "total_bits": 171195392, "v_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.994344557978605, "k_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 }, "o_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 }, "q_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 }, "total_bits": 173563904, "v_proj": { "bits": [ 4 ], "bits_prop": [ 1 ], "group_size": { "4": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9939281250301161, "k_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 128, "5": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 128, "5": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 128, "5": 128 }, "scale_bits": 4 }, "total_bits": 174923264, "v_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9943419177281229, "k_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "total_bits": 175750144, "v_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9955371512394202, "k_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "o_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "q_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 64, "5": 64 }, "scale_bits": 4 }, "total_bits": 179253248, "v_proj": { "bits": [ 5 ], "bits_prop": [ 1 ], "group_size": { "5": 64 }, "scale_bits": 4 } }, { "accuracy": 0.9958875492999428, "k_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 }, "o_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 }, "q_proj": { "bits": [ 5, 4 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "4": 32, "5": 32 }, "scale_bits": 4 }, "total_bits": 181592064, "v_proj": { "bits": [ 5 ], "bits_prop": [ 1 ], "group_size": { "5": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9975580231923806, "k_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 128, "6": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 128, "6": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 128, "6": 128 }, "scale_bits": 4 }, "total_bits": 220469248, "v_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9979260101130134, "k_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 32, "6": 32 }, "scale_bits": 4 }, "o_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 32, "6": 32 }, "scale_bits": 4 }, "q_proj": { "bits": [ 6, 5 ], "bits_prop": [ 0.1, 0.9 ], "group_size": { "5": 32, "6": 32 }, "scale_bits": 4 }, "total_bits": 223535104, "v_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9982790823437666, "k_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 }, "total_bits": 253499392, "v_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 128 }, "scale_bits": 4 } }, { "accuracy": 0.9990160990702478, "k_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 32 }, "scale_bits": 4 }, "o_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 32 }, "scale_bits": 4 }, "q_proj": { "bits": [ 6 ], "bits_prop": [ 1 ], "group_size": { "6": 32 }, "scale_bits": 4 }, "total_bits": 265838592, "v_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 32 }, "scale_bits": 4 } }, { "accuracy": 0.9994997503235936, "k_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "o_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "q_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 }, "total_bits": 337385472, "v_proj": { "bits": [ 8 ], "bits_prop": [ 1 ], "group_size": { "8": 128 }, "scale_bits": 4 } } ], "model.norm.norm": null } }