{
  "batcher": null,
  "cacher": null,
  "compiler": null,
  "factorizer": null,
  "pruner": null,
  "quantizer": "hqq",
  "hqq_backend": "torchao_int4",
  "hqq_compute_dtype": "torch.float16",
  "hqq_group_size": 64,
  "hqq_weight_bits": 4,
  "batch_size": 1,
  "device": "cuda",
  "save_fns": [
    "hqq"
  ],
  "load_fns": [
    "hqq"
  ],
  "reapply_after_load": {
    "factorizer": null,
    "pruner": null,
    "quantizer": null,
    "cacher": null,
    "compiler": null,
    "batcher": null
  },
  "api_key": null
}