{
  "bits": 4,
  "group_size": 128,
  "sym": true,
  "data_type": "int",
  "seqlen": 1024,
  "batch_size": 80,
  "iters": 1000,
  "nsamples": 560,
  "autoround_version": "0.9.2",
  "block_name_to_quantize": "vlm.model.language_model.layers",
  "quant_method": "auto-round",
  "packing_format": "auto_round:auto_gptq"
}