nm-testing
/

llama-2-7b-sparse2of4

compressed-tensors

Model card Files Files and versions Community

llama-2-7b-sparse2of4 / recipe.yaml

dsikka's picture

Upload folder using huggingface_hub

0658009 verified about 1 month ago

history blame contribute delete

563 Bytes

	# Two-stage recipe: a sparsity stage followed by a finetuning stage.
	# NOTE(review): nesting below was reconstructed from a flattened listing in
	# which every key sat at the same level (leaving the stage/modifier keys empty
	# and `run_type` duplicated). Placement of `start` and `run_type` is inferred
	# from key order — confirm against the original recipe.
	# NOTE(review): the `!!python/object/apply` tags invoke a Python constructor
	# at load time and are rejected by safe loaders; only load this file from a
	# trusted source.
	sparsity_stage:
	  sparsity_modifiers:
	    SparseGPTModifier:
	      sparsity: 0.5
	      # Quoted so the value stays a string (digits-and-colon scalars can be
	      # retyped by YAML 1.1 parsers).
	      mask_structure: '2:4'
	      sequential_update: false
	  run_type: !!python/object/apply:llmcompressor.recipe.stage.StageRunType [oneshot]
	finetuning_stage:
	  finetuning_modifiers:
	    ConstantPruningModifier:
	      # NOTE(review): the listing showed only the last pattern with a leading
	      # '.*'; the first six read 're:.q_proj.weight' etc. The '.*' is restored
	      # here so all seven patterns agree — presumably the asterisks were lost
	      # in rendering; verify.
	      targets:
	        - 're:.*q_proj.weight'
	        - 're:.*k_proj.weight'
	        - 're:.*v_proj.weight'
	        - 're:.*o_proj.weight'
	        - 're:.*gate_proj.weight'
	        - 're:.*up_proj.weight'
	        - 're:.*down_proj.weight'
	      start: 0
	  run_type: !!python/object/apply:llmcompressor.recipe.stage.StageRunType [train]