File size: 1,344 Bytes
c08abba
 
 
 
 
 
 
 
 
 
 
 
 
 
af0f401
 
 
 
c08abba
 
 
afb233a
c08abba
 
 
af0f401
c08abba
 
 
af0f401
c08abba
 
 
 
 
 
 
af0f401
 
c08abba
 
 
 
 
af0f401
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
from dataclasses import dataclass
from enum import Enum

@dataclass
class Task:
    """Describe one benchmark entry of the leaderboard.

    Holds the two keys used to look a score up in the results JSON file and
    the label under which that score is displayed.
    """

    # Task key in the results JSON file.
    benchmark: str
    # Metric key in the results JSON file.
    metric: str
    # Name to display in the leaderboard.
    col_name: str


# Init: to update with your specific keys
class Tasks(Enum):
    """Enumerate the benchmark tasks of the leaderboard.

    Each member's value is a ``Task(benchmark, metric, col_name)`` instance.
    """

    # task_key in the json file, metric_key in the json file, name to display in the leaderboard
    task0 = Task("MMLU", "metric_name", "MMLU")
    # NOTE(review): "task_1".."task_4" and every "metric_name" look like
    # template placeholders -- confirm against the keys of the real results JSON.
    task1 = Task("task_1", "metric_name", "task_1")
    task2 = Task("task_2", "metric_name", "task_2")
    task3 = Task("task_3", "metric_name", "task_3")
    task4 = Task("task_4", "metric_name", "task_4")
    

# Leaderboard name, as HTML <h1> heading markup.
TITLE = '<h1 align="center" id="space-title"> Azerbaijani LLM Leaderboard</h1>'

# What does your leaderboard evaluate?
# The rocket emoji (U+1F680) is spelled as a \N{ROCKET} escape rather than a
# raw character: the raw form had been corrupted into mojibake by a wrong
# encoding round-trip, and the escape keeps this source line pure ASCII.
INTRODUCTION_TEXT = """
Welcome to Kapital Bank's Azerbaijani LLM Leaderboard. We use benchmarks in finance, banking, and general knowledge for accurate evaluations.

\N{ROCKET} Submit Your Model \N{ROCKET}

If you have a fine-tuned Azerbaijani LLM, submit it for evaluation!

"""


# Markdown shown to submitters: checks to make before submitting a model and
# what to do when a model lands in the FAILED category.
# Built from one literal per Markdown line; adjacent literals are concatenated.
EVALUATION_QUEUE_TEXT = (
    "\n"
    "## Some good practices before submitting a model\n"
    "\n"
    "### 1) Make sure your model exists on hub.\n"
    "### 2) Make sure your model is public.\n"
    "\n"
    "\n"
    "## In case of model failure\n"
    "If your model is displayed in the `FAILED` category, its execution stopped.\n"
    "Make sure you have followed the above steps first.\n"
    "Please contact us if you are facing any trouble!\n"
)