from dataclasses import dataclass
from enum import Enum
import json
@dataclass
class Task:
    """A single leaderboard entry descriptor built by ``create_task_list``."""

    # Task key in the json file.
    benchmark: str
    # Metric key in the json file.
    metric: str
    # Name to display in the leaderboard.
    col_name: str
# Tasks are not hard-coded here: they are built from the entries of src/datasets.json.
def create_task_list(path: str = "src/datasets.json"):
    """Build the per-dataset and per-group ``Task`` lists from a JSON file.

    Args:
        path: Location of the JSON file. It must contain an iterable of
            objects that each provide a ``name`` and a ``group`` key.
            Defaults to ``src/datasets.json``, resolved against the current
            working directory.

    Returns:
        A ``(tasks, grouped_tasks)`` tuple. ``tasks`` holds one ``Task`` per
        entry, in file order. ``grouped_tasks`` holds one ``Task`` per
        distinct group, in the order each group first appears in the file.

    Raises:
        OSError: If the file cannot be opened.
        json.JSONDecodeError: If the file is not valid JSON.
        KeyError: If an entry lacks the ``name`` or ``group`` key.
    """
    # Decode explicitly as UTF-8 instead of the platform's locale encoding,
    # so non-ASCII dataset names load the same way on every machine.
    with open(path, encoding="utf-8") as f:
        entries = json.load(f)

    names = [entry["name"] for entry in entries]
    # dict.fromkeys drops duplicates while keeping first-seen order; a set
    # would give an order that can change from one run to the next.
    groups = list(dict.fromkeys(entry["group"] for entry in entries))

    # Task(task_key in the json file, metric_key in the json file,
    #      name to display in the leaderboard)
    tasks = [Task(name, "metric_name", name) for name in names]
    grouped_tasks = [Task(group, "metric_name", group) for group in groups]
    return tasks, grouped_tasks
# Leaderboard name; the leading and trailing newlines are part of the value.
TITLE = "\nAzerbaijani LLM Leaderboard\n"
# Introductory Markdown: what the leaderboard is for, its contributors and
# its partners. Assembled line by line; the empty first and last items
# produce the newline that opens and closes the text.
INTRODUCTION_TEXT = "\n".join(
    [
        "",
        "## Azerbaijani Open LLM sponsored by Kapital Bank",
        "The Azerbaijani Open LLM Leaderboard is sponsored by Kapital Bank to support and develop Azerbaijani language NLP. This leaderboard offers a clear and fair ranking of open-source Azerbaijani LLMs, helping researchers, developers, and the AI community work together to improve the quality and use of Azerbaijani language models.",
        "Through this platform, we hope to bring useful AI technology to the Azerbaijani language and encourage models that are both locally relevant and internationally competitive.",
        "Contributors: Special thanks to Bugra Sen, Emir Rahimov, Kavsar Huseynova, Mirakram Aghalarov, Firangiz Aslanova, Rashad Valiyev, Tabriz Gozalov, Gultac Muradova, Arzuman Abbasov and Qismat Salimov for their valuable contributions.",
        "## Partners",
        "This leaderboard is supported by Kapital Bank, LocalDocs, PRODATA LLC, and the AI R&D Center of Baku Higher Oil School.",
        "",
    ]
)
# Markdown describing the leaderboard's purpose and its partners.
# This is a plain string rather than an f-string: it has no replacement
# fields, and an f prefix would make any literal brace added later a bug.
# The "Partners" heading sits on its own line so that it renders as a heading
# instead of being fused into the preceding sentence.
LLM_BENCHMARKS_TEXT = """
## Azerbaijani Open LLM sponsored by Kapital Bank
The Azerbaijani Open LLM Leaderboard is sponsored by Kapital Bank to support and develop Azerbaijani language NLP. This leaderboard offers a clear and fair ranking of open-source Azerbaijani LLMs, helping researchers, developers, and the AI community work together to improve the quality and use of Azerbaijani language models.
Through this platform, we hope to bring useful AI technology to the Azerbaijani language and encourage models that are both locally relevant and internationally competitive.
## Partners
This leaderboard is supported by Kapital Bank, LocalDocs, PRODATA LLC, and the R&D Center of Baku Higher Oil School.
"""
# Markdown listing the evaluation datasets, one "## Name:" heading per
# dataset followed by a one-line description.
# This is a plain string rather than an f-string: it has no replacement
# fields, and an f prefix would make any literal brace added later a bug.
# The "Banking QA" entry keeps its entry count in the description line, like
# the other sections, instead of inside the heading.
LLM_DATASET_TEXT = """
## Banking Call Classification MC:
192 entries; multiple-choice classification for bank-client requests.
## Banking Exam MCQ:
200–300 multiple-choice questions based on university banking exam materials.
## Banking QA:
97 entries; question-answer pairs on Azerbaijani banking topics.
## Wiki CQA:
97 entries from Azerbaijani Wikipedia, with context, questions, and answers.
## GSM8K:
44 grade-school math problems to test multi-step reasoning.
## ARC:
Elementary science questions in Azerbaijani, testing knowledge and reasoning.
## Subject-Specific MCQs:
Questions across topics like informatics, history, physics, and more, each with 100 multiple-choice questions for specific subject knowledge.
"""
# Markdown with submission guidance and what to do when a model run fails.
# Assembled line by line; the empty first and last items produce the newline
# that opens and closes the text.
EVALUATION_QUEUE_TEXT = "\n".join(
    [
        "",
        "## Some good practices before submitting a model",
        "### 1) Make sure your model exists on hub.",
        "### 2) Make sure your model is public.",
        "## In case of model failure",
        "If your model is displayed in the `FAILED` category, its execution stopped.",
        "Make sure you have followed the above steps first.",
        "Please contact us if you are facing any trouble!",
        "",
    ]
)