{ "bits": 4, "dynamic": { ".*\\.1\\..*q_proj.*": { "bits": 8, "group_size": 32 }, ".*\\.1\\..*k_proj.*": { "bits": 8, "group_size": 32 }, ".*\\.1\\..*v_proj.*": { "bits": 8, "group_size": 32 }, "lm_head": { "bits": 8, "group_size": 32, "sym": true, "desc_act": false, "mse": 2.4 } }, "group_size": 128, "desc_act": true, "sym": false, "lm_head": true, "quant_method": "gptq", "checkpoint_format": "gptq", "pack_dtype": "int32", "meta": { "quantizer": [ "gptqmodel:2.0.0-dev" ], "uri": "https://github.com/modelcloud/gptqmodel", "damp_percent": 0.01, "damp_auto_increment": 0.0025, "static_groups": false, "true_sequential": true, "mse": 0.0 } }