FuseAI/FuseChat-Llama-3.1-8B-Instruct

Safetensors

llama

Eval Results

Model card | Files and versions | Community

AALF committed 3 days ago

Commit

007f2da

verified ·

1 Parent(s): 2cc7f69

Update README.md

Browse files

Files changed (1) hide show

README.md +15 -8

README.md CHANGED Viewed

@@ -16,7 +16,8 @@ model-index:
       value: 72.05
       name: averaged accuracy
     source:
-      url: https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard#/?search=FuseAI%2FFuseChat-Llama-3.1-8B-Instruct
       name: Open LLM Leaderboard
   - task:
       type: text-generation
@@ -32,7 +33,8 @@ model-index:
       value: 30.85
       name: normalized accuracy
     source:
-      url: https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard#/?search=FuseAI%2FFuseChat-Llama-3.1-8B-Instruct
       name: Open LLM Leaderboard
   - task:
       type: text-generation
@@ -48,7 +50,8 @@ model-index:
       value: 7.02
       name: exact match
     source:
-      url: https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard#/?search=FuseAI%2FFuseChat-Llama-3.1-8B-Instruct
       name: Open LLM Leaderboard
   - task:
       type: text-generation
@@ -64,7 +67,8 @@ model-index:
       value: 7.38
       name: acc_norm
     source:
-      url: https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard#/?search=FuseAI%2FFuseChat-Llama-3.1-8B-Instruct
       name: Open LLM Leaderboard
   - task:
       type: text-generation
@@ -79,7 +83,8 @@ model-index:
       value: 6.15
       name: acc_norm
     source:
-      url: https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard#/?search=FuseAI%2FFuseChat-Llama-3.1-8B-Instruct
       name: Open LLM Leaderboard
   - task:
       type: text-generation
@@ -96,8 +101,11 @@ model-index:
       value: 30.37
       name: accuracy
     source:
-      url: https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard#/?search=FuseAI%2FFuseChat-Llama-3.1-8B-Instruct
       name: Open LLM Leaderboard
 ---
 <p align="center" width="100%">
 </p>
@@ -526,5 +534,4 @@ Summarized results can be found [here](https://huggingface.co/datasets/open-llm-
 |MATH Lvl 5 (4-Shot)|     7.02|
 |GPQA (0-shot)      |     7.38|
 |MuSR (0-shot)      |     6.15|
-|MMLU-PRO (5-shot)  |    30.37|

       value: 72.05
       name: averaged accuracy
     source:
+      url: >-
+        https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard#/?search=FuseAI%2FFuseChat-Llama-3.1-8B-Instruct
       name: Open LLM Leaderboard
   - task:
       type: text-generation
       value: 30.85
       name: normalized accuracy
     source:
+      url: >-
+        https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard#/?search=FuseAI%2FFuseChat-Llama-3.1-8B-Instruct
       name: Open LLM Leaderboard
   - task:
       type: text-generation
       value: 7.02
       name: exact match
     source:
+      url: >-
+        https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard#/?search=FuseAI%2FFuseChat-Llama-3.1-8B-Instruct
       name: Open LLM Leaderboard
   - task:
       type: text-generation
       value: 7.38
       name: acc_norm
     source:
+      url: >-
+        https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard#/?search=FuseAI%2FFuseChat-Llama-3.1-8B-Instruct
       name: Open LLM Leaderboard
   - task:
       type: text-generation
       value: 6.15
       name: acc_norm
     source:
+      url: >-
+        https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard#/?search=FuseAI%2FFuseChat-Llama-3.1-8B-Instruct
       name: Open LLM Leaderboard
   - task:
       type: text-generation
       value: 30.37
       name: accuracy
     source:
+      url: >-
+        https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard#/?search=FuseAI%2FFuseChat-Llama-3.1-8B-Instruct
       name: Open LLM Leaderboard
+datasets:
+- FuseAI/FuseChat-3.0-DPO-Data
 ---
 <p align="center" width="100%">
 </p>
 |MATH Lvl 5 (4-Shot)|     7.02|
 |GPQA (0-shot)      |     7.38|
 |MuSR (0-shot)      |     6.15|
+|MMLU-PRO (5-shot)  |    30.37|