# Mixture-of-experts merge recipe: combines five Llama-3.1-8B fine-tunes
# (listed under `experts`) on top of the base model below.
base_model: meta-llama/Llama-3.1-8B-Instruct
architecture: LLAMA
# NOTE(review): this key was previously spelled `gate_model`; mergekit-moe
# documents the option as `gate_mode` (hidden | cheap_embed | random).
# Confirm against the merge tool version actually used.
gate_mode: random
dtype: float16
experts_per_token: 2
# NOTE(review): `attention_merge` is not in the upstream mergekit-moe docs
# that I know of — presumably a fork-specific option; verify it is honored.
attention_merge: mean
experts:
  # Each entry pairs a donor checkpoint with its routing prompts.
  # NOTE(review): with random gate initialisation the prompt text is
  # presumably unused; the strings are kept exactly as originally written.
  - source_model: meta-llama/Llama-3.1-8B-Instruct
    positive_prompts: ["Llama-3.1-8B-Instruct"]
  - source_model: arcee-ai/Llama-3.1-SuperNova-Lite
    positive_prompts: ["SuperNova-Lite"]
  - source_model: vicgalle/Configurable-Llama-3.1-8B-Instruct
    positive_prompts: ["Vicgalle/configurable"]
  - source_model: Vikhrmodels/Vikhr-Llama3.1-8B-Instruct-R-21-09-24
    positive_prompts: ["Vikhrmodels/Instuct"]
  - source_model: arcee-ai/Llama-Spark
    positive_prompts: ["Spark"]