{
  "bits": 4,
  "group_size": 32,
  "sym": true,
  "data_type": "int",
  "enable_quanted_input": true,
  "enable_minmax_tuning": true,
  "seqlen": 2048,
  "batch_size": 8,
  "scale_dtype": "torch.float16",
  "lr": 0.005,
  "minmax_lr": 0.005,
  "gradient_accumulate_steps": 1,
  "iters": 200,
  "amp": true,
  "nsamples": 128,
  "low_gpu_mem_usage": false,
  "to_quant_block_names": "language.model.layers",
  "enable_norm_bias_tuning": false,
  "dataset": "NeelNanda/pile-10k",
  "autoround_version": "0.4.5",
  "quant_method": "awq",
  "zero_point": false,
  "version": "gemm",
  "modules_to_not_convert": [
    "vision.blocks",
    "projector.layers",
    "vision.attn_pool.q",
    "vision.attn_pool.kv",
    "vision.attn_pool.proj",
    "vision.attn_pool.mlp.fc1",
    "vision.attn_pool.mlp.fc2",
    "language.lm_head"
  ]
}