from dataclasses import dataclass
from enum import Enum
@dataclass
class Task:
    """Describe a single benchmark entry of the leaderboard.

    Instances are built positionally as ``Task(benchmark, metric, col_name)``
    or with the equivalent keyword arguments.
    """

    # Task key as it appears in the results json file.
    benchmark: str
    # Metric key as it appears in the results json file.
    metric: str
    # Name to display for this task in the leaderboard.
    col_name: str
# Init: update the entries below with your own task and metric keys
class Tasks(Enum):
    """Enumerate the benchmark tasks listed on the leaderboard.

    Every member's value is a ``Task`` holding the task key and metric key
    used in the json file, plus the name to display in the leaderboard.
    """

    # NOTE(review): "metric_name" and "task_1".."task_4" look like template
    # placeholders -- confirm the real keys against the results json files.
    task0 = Task(benchmark="MMLU", metric="metric_name", col_name="MMLU")
    task1 = Task(benchmark="task_1", metric="metric_name", col_name="task_1")
    task2 = Task(benchmark="task_2", metric="metric_name", col_name="task_2")
    task3 = Task(benchmark="task_3", metric="metric_name", col_name="task_3")
    task4 = Task(benchmark="task_4", metric="metric_name", col_name="task_4")
# Name of the leaderboard.
# NOTE(review): presumably rendered as the page title by the UI code -- confirm
# against the app module that imports this constant.
TITLE = """
Azerbaijani LLM Leaderboard
"""
# Introductory text: states what the leaderboard evaluates (finance, banking and
# general-knowledge benchmarks) and invites submissions of fine-tuned models.
INTRODUCTION_TEXT = """
Welcome to Kapital Bank's Azerbaijani LLM Leaderboard. We use benchmarks in finance, banking, and general knowledge for accurate evaluations.
🚀 Submit Your Model 🚀
If you have a fine-tuned Azerbaijani LLM, submit it for evaluation!
"""
# Guidance for submitters: a pre-submission checklist (model exists on the hub,
# model is public) and what to do when a model ends up in the `FAILED` category.
# The text uses Markdown heading syntax (`##`, `###`).
# NOTE(review): presumably rendered as Markdown next to the submission queue --
# confirm against the UI code.
EVALUATION_QUEUE_TEXT = """
## Some good practices before submitting a model
### 1) Make sure your model exists on hub.
### 2) Make sure your model is public.
## In case of model failure
If your model is displayed in the `FAILED` category, its execution stopped.
Make sure you have followed the above steps first.
Please contact us if you are facing any trouble!
"""