xiaozheyao
/

llama_moe_perf_experiments_5_experts

Upload folder using huggingface_hub

3b43619 verified 16 days ago

638 Bytes

	base_model: meta-llama/Llama-3.1-8B-Instruct
	architecture: LLAMA
	gate_model: random
	dtype: float16
	experts_per_token: 2
	attention_merge: mean
	experts:
	- source_model: meta-llama/Llama-3.1-8B-Instruct
	positive_prompts: ["Llama-3.1-8B-Instruct"]
	- source_model: arcee-ai/Llama-3.1-SuperNova-Lite
	positive_prompts: ["SuperNova-Lite"]
	- source_model: vicgalle/Configurable-Llama-3.1-8B-Instruct
	positive_prompts: ["Vicgalle/configurable"]
	- source_model: Vikhrmodels/Vikhr-Llama3.1-8B-Instruct-R-21-09-24
	positive_prompts: ["Vikhrmodels/Instuct"]
	- source_model: arcee-ai/Llama-Spark
	positive_prompts: ["Spark"]