Update README.md
Browse files
README.md
CHANGED
@@ -2,7 +2,9 @@
|
|
2 |
base_model:
|
3 |
- deepseek-ai/DeepSeek-R1-Distill-Llama-8B
|
4 |
- mobiuslabsgmbh/DeepSeek-R1-ReDistill-Llama3-8B-v1.1
|
5 |
-
- avemio-digital/
|
|
|
|
|
6 |
library_name: transformers
|
7 |
tags:
|
8 |
- mergekit
|
@@ -22,7 +24,7 @@ This model was merged using the [DARE TIES](https://arxiv.org/abs/2311.03099) me
|
|
22 |
|
23 |
The following models were included in the merge:
|
24 |
* [mobiuslabsgmbh/DeepSeek-R1-ReDistill-Llama3-8B-v1.1](https://huggingface.co/mobiuslabsgmbh/DeepSeek-R1-ReDistill-Llama3-8B-v1.1)
|
25 |
-
* [avemio-digital/
|
26 |
|
27 |
### Configuration
|
28 |
|
@@ -32,7 +34,7 @@ The following YAML configuration was used to produce this model:
|
|
32 |
models:
|
33 |
- model: deepseek-ai/DeepSeek-R1-Distill-Llama-8B
|
34 |
#no parameters necessary for base model
|
35 |
-
- model: avemio-digital/
|
36 |
parameters:
|
37 |
density: 0.5
|
38 |
weight: 0.5
|
|
|
2 |
base_model:
|
3 |
- deepseek-ai/DeepSeek-R1-Distill-Llama-8B
|
4 |
- mobiuslabsgmbh/DeepSeek-R1-ReDistill-Llama3-8B-v1.1
|
5 |
+
- avemio-digital/German-RAG-Mobius-DeepSeek-R1-ReDistill-LLAMA-8B-v1.1-SFT-DE
|
6 |
+
datasets:
|
7 |
+
- avemio/German-RAG-HARD-REASONING-DE-THINKING
|
8 |
library_name: transformers
|
9 |
tags:
|
10 |
- mergekit
|
|
|
24 |
|
25 |
The following models were included in the merge:
|
26 |
* [mobiuslabsgmbh/DeepSeek-R1-ReDistill-Llama3-8B-v1.1](https://huggingface.co/mobiuslabsgmbh/DeepSeek-R1-ReDistill-Llama3-8B-v1.1)
|
27 |
+
* [avemio-digital/German-RAG-Mobius-DeepSeek-R1-ReDistill-LLAMA-8B-v1.1-SFT-DE](https://huggingface.co/avemio-digital/German-RAG-Mobius-DeepSeek-R1-ReDistill-LLAMA-8B-v1.1-SFT-DE)
|
28 |
|
29 |
### Configuration
|
30 |
|
|
|
34 |
models:
|
35 |
- model: deepseek-ai/DeepSeek-R1-Distill-Llama-8B
|
36 |
#no parameters necessary for base model
|
37 |
+
- model: avemio-digital/German-RAG-Mobius-DeepSeek-R1-ReDistill-LLAMA-8B-v1.1-SFT-DE
|
38 |
parameters:
|
39 |
density: 0.5
|
40 |
weight: 0.5
|