Llama-3.1-8B-Instruct-quip-sharp-4bit / quantization_config.json
kharinaev's picture
Upload folder using huggingface_hub
81fb2dd verified
{
"quant_method": "QUiP",
"rescale_WH": false,
"use_rand": true,
"codebook": "E8P12RVQ4B",
"codesz": 8,
"idx_dtype": "torch.int32",
"merge_suv": false,
"per_channel": false,
"opt_resid_scale": -1,
"modules_to_not_convert": null
}