{ "bits": 4, "group_size": 128, "desc_act": false, "lm_head": false, "method": "gptq", "quant_method": "gptq", "format": "gptq", "checkpoint_format": "gptq", "pack_dtype": "int32", "meta": { "quantizer": [ "gptqmodel:6.1.0-dev" ], "uri": "https://github.com/modelcloud/gptqmodel", "damp_percent": 0.05, "damp_auto_increment": 0.01, "static_groups": false, "true_sequential": true, "mse": 2.0, "gptaq": null, "foem": { "alpha": 0.25, "beta": 0.2, "device": "auto" }, "act_group_aware": true, "fallback": { "strategy": "rtn", "threshold": "0.5%", "smooth": { "type": "mse", "group_size_threshold": 128, "steps": 32, "maxshrink": 0.9 } }, "offload_to_disk": true, "offload_to_disk_path": "/home/op/outputs/qwen36-27b/disk_offload_foem", "pack_impl": "cpu", "gc_mode": "interval", "wait_for_submodule_finalizers": true, "auto_forward_data_parallel": false, "dense_vram_strategy": "balanced", "dense_vram_strategy_devices": [ "cuda:0", "cuda:1", "cuda:2" ], "moe_vram_strategy": "exclusive", "moe_vram_strategy_devices": null, "activation_weighted_mse": true, "mock_quantization": false, "hessian": { "chunk_size": null, "chunk_bytes": null, "staging_dtype": "float32" } }, "sym": true }