File size: 1,344 Bytes
c08abba af0f401 c08abba afb233a c08abba af0f401 c08abba af0f401 c08abba af0f401 c08abba af0f401 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 |
from dataclasses import dataclass
from enum import Enum
@dataclass
class Task:
    """Describe a single benchmark entry of the leaderboard.

    All three fields are plain strings and are required, in this order, when
    constructing an instance.
    """

    # Task key as it appears in the results JSON file.
    benchmark: str
    # Metric key as it appears in the results JSON file.
    metric: str
    # Name to display for this task in the leaderboard.
    col_name: str
# Init: update the entries below with your specific keys.
class Tasks(Enum):
    """Enumerate the benchmark tasks known to the leaderboard.

    Each member's value is a ``Task`` built from, in order: the task key in
    the JSON file, the metric key in the JSON file, and the name to display
    in the leaderboard.
    """

    # NOTE(review): "metric_name" and the "task_N" entries look like template
    # placeholders - confirm they match the keys in the real results files.
    task0 = Task(benchmark="MMLU", metric="metric_name", col_name="MMLU")
    task1 = Task(benchmark="task_1", metric="metric_name", col_name="task_1")
    task2 = Task(benchmark="task_2", metric="metric_name", col_name="task_2")
    task3 = Task(benchmark="task_3", metric="metric_name", col_name="task_3")
    task4 = Task(benchmark="task_4", metric="metric_name", col_name="task_4")
# Leaderboard name, as an HTML heading.
TITLE = '<h1 align="center" id="space-title"> Azerbaijani LLM Leaderboard</h1>'
# Introductory text: what the leaderboard evaluates and how to take part.
INTRODUCTION_TEXT = (
    "\n"
    "Welcome to Kapital Bank's Azerbaijani LLM Leaderboard. "
    "We use benchmarks in finance, banking, and general knowledge "
    "for accurate evaluations.\n"
    # NOTE(review): the "π" characters look like a mis-decoded emoji -
    # confirm the intended glyph against the original file.
    "π Submit Your Model π\n"
    "If you have a fine-tuned Azerbaijani LLM, submit it for evaluation!\n"
)
# Markdown text with submission guidance and what to do when a model fails.
# The empty first and last items give the text its leading and trailing
# newline once the lines are joined.
EVALUATION_QUEUE_TEXT = "\n".join(
    (
        "",
        "## Some good practices before submitting a model",
        "### 1) Make sure your model exists on hub.",
        "### 2) Make sure your model is public.",
        "## In case of model failure",
        "If your model is displayed in the `FAILED` category, its execution stopped.",
        "Make sure you have followed the above steps first.",
        "Please contact us if you are facing any trouble!",
        "",
    )
)