File size: 27,128 Bytes
f0ad9ed
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
f81e105
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
f0ad9ed
 
 
 
 
f81e105
 
 
 
 
57f153a
f0ad9ed
57f153a
 
f81e105
f0ad9ed
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
import pandas as pd
import numpy as np
import gradio as gr
from urllib.parse import quote

def style_dataframe(df):
    if len(df) == 0:
        return df

    highlight_cols = ["Average", "IFEval", "BBHI", "MATH", "GPQA", "MUJB", "MMLU-PRO"]
    styled = df.style

    def highlight_green(val):
        try:
            val_float = float(str(val).replace('%', '').replace(' kg', ''))
            return f'background: linear-gradient(90deg, rgba(46, 125, 50, 0.5) {val_float}%, rgba(46, 125, 50, 0.1) {val_float}%); color: white;'
        except:
            return 'background-color: #121212; color: white;'

    for col in highlight_cols:
        styled = styled.applymap(highlight_green, subset=[col])

    styled = styled.set_properties(
        subset=["Model"],
        **{'color': '#4da6ff'}
    )

    return styled

def create_leaderboard_data():
    """Build the placeholder leaderboard table and return it styled.

    Scores are not real benchmark results: they are drawn uniformly from
    fixed per-column ranges using a generator seeded with 42, so every call
    returns the same table. Rows are ordered by "Average" (highest first)
    and ranked 1..N in that order.

    Returns:
        The result of ``style_dataframe`` applied to a DataFrame with the
        columns Rank, Type, Model, Average, IFEval, BBHI, MATH, GPQA, MUJB,
        MMLU-PRO and CO_Cost. Rank is an int; Model is a Markdown link; the
        score columns are strings; CO_Cost is a string ending in " kg".
    """
    columns = ["Rank", "Type", "Model", "Average", "IFEval", "BBHI", "MATH", "GPQA", "MUJB", "MMLU-PRO", "CO_Cost"]

    # (low, high) sampling bounds for the seven score columns, in the same
    # order as columns[3:10]. Draw order matters for reproducibility.
    score_bounds = [
        (40, 90),  # Average
        (30, 90),  # IFEval
        (40, 85),  # BBHI
        (20, 80),  # MATH
        (10, 70),  # GPQA
        (10, 70),  # MUJB
        (40, 85),  # MMLU-PRO
    ]

    models = [
        {"model_name": "meta-llama/llama-3-70b-instruct", "type": "open"},
        {"model_name": "mistralai/Mistral-7B-Instruct-v0.3", "type": "open"},
        {"model_name": "google/gemma-7b-it", "type": "open"},
        {"model_name": "Qwen/Qwen2-7B-Instruct", "type": "open"},
        {"model_name": "anthropic/claude-3-opus", "type": "closed"},
        {"model_name": "OpenAI/gpt-4o", "type": "closed"},
        {"model_name": "01-ai/Yi-1.5-34B-Chat", "type": "open"},
        {"model_name": "google/gemma-2b", "type": "open"},
        {"model_name": "microsoft/phi-3-mini-4k-instruct", "type": "open"},
        {"model_name": "microsoft/phi-3-mini-128k-instruct", "type": "open"},
        {"model_name": "stabilityai/stable-beluga-7b", "type": "open"},
        {"model_name": "togethercomputer/RedPajama-INCITE-7B-Instruct", "type": "open"},
        {"model_name": "databricks/dbrx-instruct", "type": "closed"},
        {"model_name": "mosaicml/mpt-7b-instruct", "type": "open"},
        {"model_name": "01-ai/Yi-1.5-9B-Chat", "type": "open"}
    ]

    # A private legacy generator yields the same stream as
    # np.random.seed(42) followed by np.random.uniform(...), but does not
    # reseed the process-wide NumPy RNG as a side effect of building a table.
    rng = np.random.RandomState(42)

    entries = []
    for model in models:
        model_name = model["model_name"]
        model_type = model["type"]

        emoji = "🟢" if model_type.lower() == "open" else "🔴"
        type_with_emoji = f"{emoji} {model_type.upper()}"

        # "org/name" identifiers link to the repo page; bare names fall back
        # to a Hub search.
        if "/" in model_name:
            model_link = f"[{model_name}](https://huggingface.co/{quote(model_name)})"
        else:
            model_link = f"[{model_name}](https://huggingface.co/models?search={quote(model_name)})"

        scores = [round(rng.uniform(low, high), 2) for low, high in score_bounds]
        co2_cost = round(rng.uniform(1, 100), 2)

        entries.append((scores[0], type_with_emoji, model_link, scores, co2_cost))

    # Sort on the numeric average directly (stable, highest first) rather
    # than parsing it back out of its formatted string.
    entries.sort(key=lambda entry: entry[0], reverse=True)

    rows = [
        [
            rank,
            type_with_emoji,
            model_link,
            *(f"{score}" for score in scores),
            f"{co2_cost} kg",
        ]
        for rank, (_, type_with_emoji, model_link, scores, co2_cost) in enumerate(entries, 1)
    ]

    df = pd.DataFrame(rows, columns=columns)
    return style_dataframe(df)

def get_filter_data():
    """Return the quick-filter names mapped to their displayed counts.

    The values are hard-coded. A new dict is built on every call, with the
    keys in the order listed below.
    """
    quick_filters = (
        ("For Edge Devices", 5),
        ("For Consumers", 4),
        ("Mid-range", 4),
        ("For the GPU-rich", 3),
        ("Only Official Providers", 8),
    )
    return dict(quick_filters)

# Custom stylesheet handed to gr.Blocks(css=...) when the UI is built below.
# It centres the HTML/header containers and sets spacing, font sizes and
# colours for the leaderboard title, subtitle, filters and table wrappers.
# NOTE(review): the header markup in this file only uses the
# header-container, leaderboard-title and leaderboard-subtitle classes;
# confirm whether the remaining selectors (e.g. .hf-logo) are still needed.
css = """
.html-container {
    text-align: center;
    display: flex;
    justify-content: center;
    width: 100%;
}

.dataframe-container {
    margin-top: 0.5rem;
    margin-bottom: 0.5rem;
}

.leaderboard-title {
    font-size: 1.5rem;
    font-weight: bold;
    margin-bottom: 0.25rem;
    color: #f0f0f0;
}

.leaderboard-subtitle {
    font-size: 0.9rem;
    margin-bottom: 1rem;
    color: #a0a0a0;
}

.filters-container {
    margin-bottom: 0.5rem;
}

.hf-logo {
    height: 1.5rem;
    margin-right: 0.5rem;
}

.header-container {
    display: flex;
    align-items: center;
    justify-content: center;
    margin-bottom: 10px;
}

.header-container svg {
    margin-right: 0.5rem;
    flex-shrink: 0;
}
"""

# Checkbox labels for the quick filters, formatted as "<name> · <count>".
filter_data = get_filter_data()
filter_choices = [
    f"{label} · {count}"
    for label, count in filter_data.items()
]

# Hugging Face logo as inline SVG markup; it is interpolated directly into the header HTML below.
hf_logo_svg = """
<svg xmlns="http://www.w3.org/2000/svg" width="60" height="60" version="1.1" viewBox="0 0 236 220">
<g fill="none" stroke="none" stroke-width="1"><path d="M235.188 161.726a21.794 21.794 0 0 0-2.962-6.55 25.09 25.09 0 0 0 .654-3.21c.953-6.877-1.43-13.172-5.924-18.043-2.434-2.66-5.042-4.417-7.805-5.495a104.244 104.244 0 0 0 2.74-23.667c.006-3.638-.199-7.203-.545-10.715a125.62 125.62 0 0 0-.652-5.248 104.85 104.85 0 0 0-3.512-15.2 105.286 105.286 0 0 0-3.513-9.635 105.803 105.803 0 0 0-6.951-13.524 93.949 93.949 0 0 0-5.648-8.355 79.37 79.37 0 0 0-3.113-3.965 104 104 0 0 0-10.394-10.916 79.529 79.529 0 0 0-3.814-3.292 94.49 94.49 0 0 0-3.94-3.112 110.693 110.693 0 0 0-8.358-5.646C155.582 5.522 136.986 0 117.111 0 59.239 0 12.334 46.902 12.334 104.766a104.258 104.258 0 0 0 2.786 23.96c-2.486 1.08-4.87 2.76-7.077 5.194-4.493 4.868-6.877 11.142-5.923 18.017.144 1.093.362 2.174.652 3.238a21.868 21.868 0 0 0-2.962 6.55c-1.38 5.249-.926 9.98.83 14.127-1.908 5.42-1.43 11.193 1.053 16.21 1.807 3.665 4.392 6.5 7.58 9.034 3.788 3.01 8.531 5.57 14.254 8.026 6.826 2.91 15.157 5.646 18.947 6.65 9.788 2.534 19.173 4.14 28.686 4.217 13.55.127 25.222-3.06 33.578-11.215 4.105.503 8.236.755 12.372.754 4.37-.01 8.734-.286 13.07-.824 8.336 8.206 20.051 11.422 33.653 11.292 9.51-.075 18.896-1.68 28.659-4.22 3.814-1.002 12.143-3.738 18.973-6.647 5.723-2.47 10.465-5.029 14.28-8.03 3.163-2.54 5.746-5.37 7.554-9.04 2.51-5.019 2.962-10.79 1.08-16.21 1.727-4.146 2.178-8.889.798-14.133Zm-9.71 13.776c1.922 3.648 2.045 7.77.348 11.61-2.573 5.82-8.964 10.403-21.377 15.325-7.718 3.061-14.787 5.017-14.85 5.036-10.22 2.647-19.453 3.991-27.446 3.991-13.234 0-23.082-3.65-29.33-10.863a98.39 98.39 0 0 1-31.93.18c-6.251 7.093-16.045 10.683-29.17 10.683-7.993 0-17.225-1.344-27.435-3.99-.063-.02-7.127-1.976-14.85-5.037-12.41-4.922-18.803-9.502-21.375-15.325-1.697-3.84-1.574-7.962.35-11.61.177-.339.367-.67.57-.989A14.734 14.734 0 0 1 7 162.613c.766-2.902 2.344-5.316 4.487-7.05a14.685 14.685 0 0 1-1.99-5.548c-.618-4.273.8-8.54 3.992-12.02 2.485-2.707 5.998-4.197 9.89-4.197h.102a97.174 97.174 0 0 
1-4.41-29.036c0-53.702 43.54-97.24 97.252-97.24 53.714 0 97.253 43.535 97.253 97.24a97.176 97.176 0 0 1-4.44 29.11c.468-.046.929-.07 1.38-.07 3.89 0 7.404 1.489 9.888 4.196 3.19 3.476 4.61 7.747 3.993 12.02a14.685 14.685 0 0 1-1.99 5.549c2.142 1.733 3.72 4.147 4.485 7.05a14.749 14.749 0 0 1-1.99 11.9c.206.315.398.646.574.985Z" fill="#FFF" fill-rule="nonzero"/><path d="M225.53 174.038a14.752 14.752 0 0 0 1.99-11.903c-.765-2.903-2.345-5.318-4.489-7.052a14.7 14.7 0 0 0 1.992-5.55c.617-4.274-.801-8.543-3.996-12.023-2.486-2.708-6.002-4.198-9.894-4.198-.453 0-.912.023-1.382.07a97.193 97.193 0 0 0 4.435-29.116C214.186 50.55 170.616 7 116.873 7s-97.317 43.546-97.317 97.266a97.164 97.164 0 0 0 4.413 29.044h-.103c-3.892 0-7.408 1.49-9.894 4.198-3.192 3.477-4.613 7.748-3.996 12.023.282 1.966.96 3.853 1.992 5.55-2.144 1.734-3.724 4.15-4.487 7.053a14.734 14.734 0 0 0 1.992 11.904c-.206.318-.395.65-.572.988-1.923 3.65-2.048 7.774-.35 11.614 2.574 5.82 8.971 10.407 21.392 15.33 7.723 3.061 14.797 5.018 14.86 5.036C55.017 209.656 64.256 211 72.254 211c13.134 0 22.933-3.59 29.192-10.686a98.495 98.495 0 0 0 31.951-.181c6.25 7.214 16.105 10.867 29.35 10.867 7.998 0 17.238-1.345 27.454-3.994.062-.018 7.132-1.975 14.859-5.037 12.42-4.922 18.818-9.508 21.391-15.33 1.699-3.84 1.575-7.963-.349-11.613a11.9 11.9 0 0 0-.573-.988Zm-128.562 15.17a39.223 39.223 0 0 1-1.73 2.756c-1.618 2.367-3.746 4.175-6.215 5.52-4.722 2.573-10.697 3.473-16.77 3.473-9.59 0-19.42-2.243-24.931-3.673-.27-.07-33.778-9.53-29.536-17.58.714-1.355 1.89-1.896 3.368-1.896 5.973 0 16.849 8.89 21.524 8.89 1.043 0 1.78-.445 2.08-1.528 1.992-7.142-30.276-10.144-27.558-20.484.48-1.83 1.78-2.572 3.61-2.572 7.895 0 25.62 13.88 29.326 13.88.284 0 .488-.084.599-.259l.048-.08c1.739-2.87.742-4.958-11.18-12.255l-1.143-.697c-13.116-7.935-22.323-12.71-17.086-18.407.602-.658 1.455-.95 2.493-.95 1.23 0 2.72.413 4.36 1.102 6.927 2.92 16.528 10.884 20.539 14.357 1.182 1.03 1.879 1.657 1.879 1.657s5.078 5.28 8.15 5.28c.706 0 1.305-.278 
1.71-.967 2.18-3.67-20.222-20.636-21.486-27.636-.866-4.745.59-7.147 3.286-7.147 1.279 0 2.844.545 4.569 1.64 5.355 3.397 15.693 21.153 19.478 28.06 1.268 2.316 3.434 3.294 5.386 3.294 3.872 0 6.9-3.847.354-8.737-9.837-7.357-6.385-19.382-1.69-20.122.2-.032.403-.048.604-.049 4.27 0 6.154 7.355 6.154 7.355s5.52 13.855 15.003 23.325c8.605 8.596 9.806 15.651 4.793 24.45Zm30.664 1.622-.492.059-.84.096c-.44.045-.881.089-1.325.13l-.433.04-.394.033-.56.045c-.206.015-.413.03-.62.043l-.616.042-.136.008-.486.029-.206.01-.576.029-.67.027-.607.02-.404.013h-.205c-.127 0-.252.007-.38.008h-.2c-.127 0-.252 0-.38.007l-.514.005h-.72c-.566 0-1.13-.005-1.692-.016l-.456-.01c-.13 0-.26-.007-.388-.01l-.482-.015-.6-.023-.54-.023-.141-.006-.515-.028c-.143-.008-.286-.015-.427-.024l-.333-.02a91.779 91.779 0 0 1-1.254-.088l-.438-.035-.552-.047-.646-.06a57.45 57.45 0 0 1-1.082-.11h-.017c5.263-11.734 2.6-22.692-8.033-33.313-6.973-6.96-11.614-17.242-12.575-19.5-1.95-6.68-7.106-14.107-15.67-14.107a14.01 14.01 0 0 0-2.161.171c-3.753.59-7.032 2.75-9.372 5.997-2.528-3.144-4.986-5.642-7.21-7.055-3.35-2.122-6.692-3.2-9.951-3.2-4.065 0-7.7 1.67-10.233 4.697l-.064.077-.142-.6-.006-.025a85.253 85.253 0 0 1-1.214-6.23c0-.014 0-.028-.007-.042l-.071-.473c-.04-.255-.076-.512-.113-.767-.03-.213-.06-.426-.088-.638-.027-.212-.057-.425-.082-.638a64.55 64.55 0 0 1-.15-1.247l-.006-.052a89.658 89.658 0 0 1-.267-2.807l-.04-.542a27.47 27.47 0 0 1-.031-.45l-.017-.101-.037-.601a47.596 47.596 0 0 1-.037-.653 58.953 58.953 0 0 1-.032-.652l-.023-.57-.008-.173-.017-.527-.013-.446c0-.18-.008-.358-.012-.537l-.01-.563c-.001-.187 0-.374-.003-.561-.006-.18 0-.37 0-.56 0-48.17 39.07-87.22 87.268-87.22 48.197 0 87.268 39.05 87.268 87.225v1.127c0 .188-.005.377-.01.563 0 .157-.005.31-.01.466-.001.14-.007.279-.013.413 0 .176-.01.35-.016.527v.015c-.016.383-.031.765-.048 1.147l-.007.126-.03.57-.027.455a90.924 90.924 0 0 1-.251 3.212v.014l-.06.602-.155 
1.398-.058.469-.073.55c-.025.2-.053.4-.082.603-.03.225-.064.448-.097.67l-.08.529-.095.598c-.032.2-.064.397-.102.596-.04.198-.07.396-.104.595a60.2 60.2 0 0 1-.217 1.186 104.22 104.22 0 0 1-.612 2.935c-2.457-2.386-5.71-3.685-9.297-3.685-3.255 0-6.602 1.076-9.951 3.2-2.225 1.41-4.681 3.91-7.211 7.054-2.343-3.25-5.623-5.408-9.37-5.998a14.168 14.168 0 0 0-2.163-.17c-8.566 0-13.72 7.428-15.67 14.109-.967 2.257-5.607 12.537-12.59 19.51-10.626 10.586-13.31 21.495-8.127 33.18Zm90.093-23.488-.035.102a5.71 5.71 0 0 1-.074.196 6.04 6.04 0 0 1-.51.95c-.192.286-.402.56-.632.817-.053.06-.103.12-.163.178a4.67 4.67 0 0 1-.25.26c-1.55 1.537-3.91 2.883-6.58 4.12-.301.136-.61.273-.92.41l-.31.137c-.203.09-.41.182-.625.27-.21.09-.424.179-.635.266l-.643.266c-1.503.618-3.042 1.206-4.545 1.789l-.64.248-.638.249c-.42.164-.838.329-1.25.494l-.61.246-.6.246-.296.123c-.195.083-.389.164-.58.247-4.418 1.894-7.597 3.822-6.93 6.215.02.068.04.132.064.194.06.177.14.345.242.502.06.094.13.183.207.264.785.814 2.214.686 4.016.039.147-.053.297-.11.448-.17.103-.039.206-.08.31-.121l.155-.066a33.9 33.9 0 0 0 1.295-.582c.113-.052.226-.103.339-.163 2.203-1.076 4.7-2.527 7.178-3.847.38-.206.76-.403 1.14-.6.62-.32 1.246-.63 1.877-.925 2.347-1.103 4.552-1.886 6.326-1.886.832 0 1.568.17 2.18.562l.1.068c.31.22.58.487.8.795.05.073.104.148.149.225.049.08.095.16.138.244.877 1.662.143 3.385-1.573 5.073-1.647 1.62-4.21 3.21-7.125 4.682-.215.11-.433.219-.652.325-8.672 4.256-20.026 7.46-20.184 7.5-3.027.785-7.354 1.815-12.228 2.585l-.722.112-.118.017a94.839 94.839 0 0 1-3.325.439l-.104.01c-2.02.23-4.091.397-6.167.467h-.031c-.747.028-1.492.04-2.238.04h-.86a54.33 54.33 0 0 1-3.407-.154c-.027 0-.054 0-.082-.005a43.83 43.83 0 0 1-3.298-.39c-.27-.043-.557-.09-.835-.14a19.884 19.884 0 0 1-.377-.07l-.03-.006c-.4-.076-.797-.16-1.193-.25-.23-.053-.46-.104-.687-.165l-.135-.036a14.137 14.137 0 0 1-.334-.088l-.061-.016-.356-.102c-.131-.037-.258-.075-.387-.113l-.046-.014-.336-.102-.378-.12c-.103-.035-.206-.071-.31-.105l-.226-.08a22.09 
22.09 0 0 1-.652-.24l-.207-.078-.17-.068a27.61 27.61 0 0 1-.971-.412l-.214-.102-.036-.016c-.076-.036-.151-.072-.227-.104a19.743 19.743 0 0 1-.442-.22l-.044-.022-.212-.111a17.218 17.218 0 0 1-1.108-.63l-.198-.12c-.1-.062-.192-.125-.29-.19l-.258-.17a9.118 9.118 0 0 1-.278-.19l-.167-.118a15.402 15.402 0 0 1-.515-.386c-.09-.07-.18-.14-.268-.206-.196-.157-.39-.32-.58-.487l-.007-.006c-.185-.16-.366-.326-.542-.495l-.01-.012a11.813 11.813 0 0 1-.271-.266c-.09-.098-.18-.188-.265-.28a12.109 12.109 0 0 1-.26-.28 10.55 10.55 0 0 1-.246-.274l-.028-.03a17.27 17.27 0 0 1-1.165-1.514l-.143-.21c-.094-.14-.188-.28-.28-.42l-.272-.419a34.93 34.93 0 0 1-.66-1.059c-.074-.127-.15-.252-.22-.376a8.379 8.379 0 0 1-.117-.205c-.038-.073-.083-.145-.123-.218l-.066-.115c-.02-.038-.028-.05-.04-.075a12.086 12.086 0 0 1-.228-.417 8.435 8.435 0 0 0-.102-.182l-.104-.198-.101-.197-.198-.4a33.357 33.357 0 0 1-.291-.617c-.026-.056-.053-.112-.076-.169a13.103 13.103 0 0 1-.254-.583c-.055-.13-.104-.26-.157-.388-.15-.38-.288-.763-.416-1.15-.038-.116-.076-.23-.11-.345a13.436 13.436 0 0 1-.224-.79 13.83 13.83 0 0 1-.216-.94 13.172 13.172 0 0 1-.181-1.113 14.8 14.8 0 0 1-.1-1.105c0-.06-.006-.123-.007-.184a9.707 9.707 0 0 1-.01-.366c-.065-4.917 2.425-9.646 7.749-14.964 9.48-9.47 15.002-23.325 15.002-23.325s.148-.58.458-1.417c.103-.277.212-.554.326-.826.13-.309.27-.614.42-.913l.044-.088c.192-.382.4-.753.627-1.116.052-.084.103-.168.163-.25.168-.252.346-.495.534-.73.145-.18.3-.356.462-.522.55-.566 1.179-1.029 1.889-1.276l.088-.029a3.025 3.025 0 0 1 .394-.104l.033-.007c.15-.03.302-.05.455-.06h.014c.08 0 .158-.01.24-.01.204.001.407.017.608.05.855.133 1.67.642 2.37 1.427l.093.11c.228.267.436.553.62.852.138.22.268.454.39.7.05.103.098.197.145.3.023.05.046.101.068.154a11.557 11.557 0 0 1 .69 2.216c.14.703.22 1.414.242 2.13.01.313.01.63 0 .953-.005.122-.011.245-.02.37a13.766 13.766 0 0 1-.885 3.995l-.155.384a14.23 14.23 0 0 1-.86 1.718 15.28 15.28 0 0 1-.6.94l-.13.186a15.584 15.584 0 0 1-1.695 1.99 17.893 17.893 0 0 
1-1.956 1.692 15.79 15.79 0 0 0-1.948 1.7c-1.73 1.815-2.133 3.416-1.744 4.63.046.137.1.272.163.402.14.282.33.54.55.766l.063.061c.064.061.13.12.198.176l.07.058c.168.13.345.246.53.346.053.028.103.057.164.085.254.126.52.228.794.305l.075.02.103.027.09.023.095.02.096.02.09.015c.07.013.138.023.206.032l.067.01.118.013.074.007.122.01h.07l.127.005h.4l.113-.006.132-.008.16-.015.15-.018c.03 0 .063-.01.1-.015a5.824 5.824 0 0 0 1.825-.585 6.043 6.043 0 0 0 1.335-.92l.162-.154c.026-.025.052-.049.076-.075.16-.16.31-.327.448-.503a6.87 6.87 0 0 0 .655-.99 264.026 264.026 0 0 1 7.083-12.099l.34-.542.341-.543c.171-.274.343-.546.515-.814l.173-.27.347-.54c.464-.72.931-1.43 1.4-2.135l.352-.525a123.949 123.949 0 0 1 2.103-3.023l.348-.477a63.365 63.365 0 0 1 2.364-3.063l.325-.389c.053-.065.103-.129.161-.192l.32-.368c.052-.06.103-.12.158-.18l.313-.349.154-.168c.15-.162.302-.322.456-.48.104-.103.2-.207.3-.302a12.036 12.036 0 0 1 1.921-1.597l.16-.102.163-.104a6.65 6.65 0 0 1 .313-.185c2.724-1.543 4.978-1.657 6.275-.36.786.786 1.22 2.087 1.197 3.898 0 .08 0 .16-.007.243v.09c0 .081-.007.165-.012.25 0 .102-.013.205-.023.308-.01.103-.015.182-.026.273 0 .031-.005.056-.009.084a6.98 6.98 0 0 1-.029.241c0 .025 0 .05-.01.075a5.115 5.115 0 0 1-.047.326c-.013.1-.03.2-.049.3-.008.058-.02.115-.028.172-.03.164-.07.326-.117.485a6.95 6.95 0 0 1-.324.871 12.3 12.3 0 0 1-.174.367c-.125.25-.265.506-.42.77-.077.13-.156.265-.24.4l-.13.204c-.13.207-.268.415-.41.625a30.251 30.251 0 0 1-1.136 1.528l-.18.228a61.886 61.886 0 0 1-1.56 1.864l-.423.478-.216.241c-.289.33-.585.652-.882.976l-.228.246c-.15.163-.309.33-.46.494-.154.167-.31.332-.467.498l-.474.5-.48.5-.486.503-.978 1.008c-4.67 4.787-9.59 9.558-11.255 12.532-.11.194-.21.393-.3.597-.237.54-.336 1.004-.27 1.378.023.123.067.241.131.348.094.163.208.312.34.446.06.06.123.116.193.167.342.244.756.37 1.176.356h.133l.134-.009.136-.018.112-.016a.307.307 0 0 0 .045-.008l.102-.02.028-.007.115-.024.04-.01.12-.03.145-.043a6.165 6.165 0 0 0 
.894-.35c.05-.025.103-.048.152-.074l.153-.076a14.039 14.039 0 0 0 1.078-.623l.154-.102a2.39 2.39 0 0 0 .153-.104l.154-.102.08-.056.22-.154c.207-.143.4-.289.595-.437l.018-.013.308-.238c.423-.333.825-.67 1.188-.986l.24-.213.024-.02.126-.112c.297-.266.562-.515.783-.72l.09-.088.217-.206.13-.13.045-.045.014-.012.22-.223.01-.007.04-.037.05-.044.017-.015.044-.04.234-.206.13-.118a5.41 5.41 0 0 0 .207-.187l.158-.138c.028-.023.055-.05.084-.074l.165-.144.243-.212.128-.112c.5-.436 1.11-.962 1.81-1.555l.286-.24.475-.395.483-.406c.634-.524 1.316-1.083 2.036-1.663l.474-.378 1.239-.977c.168-.132.34-.264.515-.396a132.43 132.43 0 0 1 4.333-3.208l.443-.308c.309-.214.618-.427.927-.635l.28-.19a72.059 72.059 0 0 1 1.675-1.094l.28-.177.278-.173c.278-.172.556-.342.83-.507l.275-.163.552-.32c.18-.107.36-.209.54-.31l.108-.06.428-.235c.178-.097.356-.19.532-.28l.265-.136.256-.13c.585-.293 1.18-.565 1.786-.814l.246-.104a8.13 8.13 0 0 1 .484-.184c.16-.053.318-.109.473-.164.142-.047.28-.09.412-.133l.045-.013a4.62 4.62 0 0 1 .214-.06l.02-.007c.146-.042.29-.08.438-.114h.01a9.31 9.31 0 0 1 .63-.13 7.52 7.52 0 0 1 .808-.097 5.27 5.27 0 0 1 .38-.012h.098a4.179 4.179 0 0 1 .545.042h.023c.055.005.11.015.165.026.055.012.11.02.164.032h.018c.053.012.103.027.158.042.44.118.844.342 1.18.65l.029.03.059.058.057.06a6.346 6.346 0 0 1 1.132 1.647l.045.103a3.788 3.788 0 0 1 .112 2.76 5.722 5.722 0 0 1-.36.832l-.094.17a9.51 9.51 0 0 1-1.265 1.672l-.104.11a14.43 14.43 0 0 1-.942.913l-.122.11c-.253.225-.513.444-.775.658a28.872 28.872 0 0 1-.706.563 49.385 49.385 0 0 1-2.062 1.492 81.87 81.87 0 0 1-1.277.855c-.82.537-1.646 1.063-2.48 1.58-.24.147-.482.298-.73.448-2.264 1.393-4.775 2.882-7.453 4.501l-.694.421c-.76.463-1.476.905-2.15 1.325l-.34.214-.641.412c-.256.161-.504.32-.744.477a33.2 33.2 0 0 0-.533.343l-.343.226a47.78 47.78 0 0 0-.5.33l-.16.101c-.17.113-.337.225-.498.335l-.266.18-.31.215-.286.2c-.45.317-.897.641-1.34.97l-.153.117a31.2 31.2 0 0 0-.505.39l-.21.17a23.3 23.3 0 0 
0-.973.823l-.14.131c-.082.075-.163.15-.24.224-.053.05-.102.102-.156.153l-.075.073c-.166.165-.326.334-.481.508l-.076.087a7.57 7.57 0 0 0-.447.567l-.058.083c-.15.218-.282.45-.395.69l-.04.084-.025.06-.02.05-.026.07c-.008.024-.024.067-.034.103a2.517 2.517 0 0 0-.104.423l-.012.077-.01.07-.005.068v.361c0 .03 0 .061.007.092a.899.899 0 0 0 .006.055c0 .03.008.06.01.09l.023.127v.006c.008.04.016.08.027.12.01.041.02.086.033.13a3.7 3.7 0 0 0 .135.383c0 .01.008.02.01.03.015.03.028.062.043.093a4.4 4.4 0 0 0 .189.385l.072.13.076.13.08.134a.47.47 0 0 0 .046.06l.027.03.029.024.03.024a.644.644 0 0 0 .066.04.872.872 0 0 0 .157.056c.664.151 2.03-.399 3.844-1.357l.328-.173.55-.299.27-.149c.193-.104.39-.219.589-.333l.365-.206c2.399-1.38 5.265-3.153 8.226-4.884.277-.163.555-.324.834-.485l.56-.357c.28-.162.558-.32.838-.477a91.851 91.851 0 0 1 3.617-1.95l.547-.277c.364-.18.724-.355 1.08-.525.69-.327 1.386-.637 2.09-.93l.386-.157.047-.016c2.043-.81 3.895-1.31 5.395-1.31a5.42 5.42 0 0 1 .968.08h.01c.103.018.196.04.29.063h.018c.138.033.274.076.405.13.105.038.206.083.304.136a2.89 2.89 0 0 1 1.137 1.038c.1.154.189.316.26.487.043.098.082.2.119.308.036.11.069.217.102.33.244.873.22 1.796-.07 2.655Z" fill="#FF9D00" fill-rule="nonzero"/><path d="M204.17 104.828v-.565C204.17 56.07 165.098 17 116.882 17c-48.214 0-87.3 39.071-87.3 87.263l-.002.19v.375c.006.187.008.375.007.563l.007.414.002.15.006.205c.002.11.005.22.005.33l.012.448.018.527.006.172.023.545v.025l.032.637v.016c.012.218.023.436.037.652.012.201.024.402.038.602l.004.036c.01.171.021.344.034.516l.004.045c.011.166.024.332.038.497l.002.032.023.288c.07.83.15 1.66.242 2.49l.006.05.07.608.08.64a78.863 78.863 0 0 0 .281 2.045l.005.03a84.93 84.93 0 0 0 1.288 6.717l.006.027.037.155c.034.148.07.295.106.444l.06-.078c2.53-3.028 6.17-4.698 10.231-4.698 3.26 0 6.605 1.077 9.956 3.201 2.224 1.412 4.682 3.913 7.211 7.058 2.341-3.25 5.622-5.41 9.375-6a14.05 14.05 0 0 1 2.163-.17c8.568 0 13.727 7.43 15.676 14.114.962 2.26 5.604 12.543 12.603 19.5 10.64 10.625 
13.3 21.59 8.037 33.33h.018c.36.04.72.08 1.081.11l.646.07.076.006c.158.015.317.028.476.04l.438.037c.417.032.835.06 1.256.088l.33.021.265.015.165.009.514.028.142.005.542.023.6.024.485.014.08.004c.102.003.206.008.309.008l.11.002c.679.016 1.357.024 2.037.024h.72l.517-.007c.127-.006.252-.006.379-.006h.196l.174-.004a6.09 6.09 0 0 1 .205-.004h.207l.404-.012.608-.02.67-.03c.192-.007.383-.016.575-.026l.207-.012.305-.017.18-.01.134-.008.618-.042c.206-.012.413-.03.62-.045l.56-.043.394-.034.433-.04c.443-.04.885-.086 1.326-.13.28-.03.56-.064.84-.098l.49-.059c-5.18-11.69-2.5-22.606 8.097-33.19 6.983-6.974 11.625-17.26 12.593-19.518 1.95-6.684 7.106-14.115 15.675-14.115.724.001 1.448.058 2.163.172 3.75.59 7.032 2.75 9.376 6 2.53-3.146 4.987-5.647 7.21-7.06 3.351-2.123 6.7-3.2 9.955-3.2 3.59 0 6.843 1.3 9.3 3.687.135-.6.265-1.204.39-1.807.076-.377.15-.754.224-1.133.09-.465.175-.933.254-1.4.02-.125.042-.252.066-.38.038-.198.072-.395.103-.595l.013-.077.08-.525.082-.528v-.006c.033-.22.067-.443.097-.666l.07-.505.013-.097.07-.55.06-.47c.036-.307.07-.616.104-.926.015-.123.027-.247.04-.372l.011-.1c.023-.206.043-.41.06-.617l.046-.479c.096-1.06.173-2.122.233-3.185v-.007l.03-.564.006-.126.023-.536c.01-.2.017-.405.024-.61v-.016l.006-.15a7.99 7.99 0 0 0 .01-.378l.003-.05c.004-.118.01-.24.01-.36l.002-.104c.004-.12.007-.24.007-.362l.003-.102c.003-.155.006-.308.006-.462v-.562ZM95.23 192.004c6.914-10.136 6.424-17.742-3.062-27.22-9.486-9.476-15.007-23.335-15.007-23.335s-2.061-8.052-6.76-7.311c-4.7.74-8.148 12.769 1.691 20.132 9.84 7.364-1.957 12.357-5.744 5.447-3.789-6.911-14.129-24.675-19.49-28.073-5.362-3.398-9.132-1.494-7.868 5.51.627 3.476 6.465 9.408 11.92 14.952 5.534 5.625 10.672 10.847 9.575 12.695-2.181 3.67-9.86-4.312-9.86-4.312s-24.048-21.875-29.284-16.174c-4.825 5.254 2.616 9.72 14.085 16.604.975.586 1.98 1.19 3.008 1.81 13.12 7.942 14.141 10.037 12.28 13.04-.688 1.11-5.08-1.525-10.483-4.767-9.198-5.528-21.343-12.815-23.057-6.292-1.485 5.646 7.451 9.105 15.552 12.243 6.75 2.613 12.925 
5.004 12.017 8.249-.94 3.363-6.044.558-11.62-2.51-6.26-3.443-13.12-7.217-15.366-2.96-4.243 8.05 29.271 17.526 29.547 17.595 10.828 2.807 38.326 8.756 47.938-5.323Zm44.539 0c-6.914-10.136-6.423-17.742 3.063-27.22 9.486-9.476 15.008-23.335 15.008-23.335s2.06-8.052 6.76-7.311c4.7.74 8.148 12.769-1.692 20.132-9.841 7.364 1.957 12.357 5.745 5.447 3.788-6.911 14.123-24.675 19.484-28.073 5.361-3.398 9.132-1.494 7.869 5.51-.628 3.476-6.466 9.41-11.921 14.953-5.533 5.624-10.672 10.846-9.574 12.694 2.18 3.67 9.866-4.317 9.866-4.317s24.046-21.875 29.282-16.174c4.82 5.254-2.62 9.722-14.09 16.607a712.74 712.74 0 0 0-3.01 1.81c-13.125 7.94-14.14 10.035-12.28 13.038.685 1.11 5.08-1.525 10.48-4.767 9.21-5.527 21.354-12.816 23.07-6.293 1.483 5.646-7.452 9.106-15.555 12.244-6.75 2.614-12.924 5.003-12.017 8.25.94 3.363 6.04.557 11.615-2.51 6.26-3.456 13.121-7.23 15.366-2.971 4.244 8.055-29.274 17.52-29.546 17.59-10.828 2.815-38.327 8.764-47.934-5.315Z" fill="#FFD21E"/><path d="M145.615 80.61c1.361.481 2.375 1.943 3.339 3.333 1.302 1.88 2.515 3.63 4.376 2.644a12.54 12.54 0 0 0 5.173-5.13 12.488 12.488 0 0 0-.277-12.346 12.556 12.556 0 0 0-8.925-5.962 12.615 12.615 0 0 0-5.496.392 12.58 12.58 0 0 0-6.077 4.028 12.515 12.515 0 0 0-2.809 6.71 12.493 12.493 0 0 0 1.408 7.137c.862 1.616 2.776.855 4.796.05 1.584-.631 3.233-1.288 4.492-.846Zm-59.232.002c-1.362.48-2.376 1.943-3.34 3.333-1.303 1.879-2.516 3.629-4.376 2.643a12.558 12.558 0 0 1-4.177-3.577 12.505 12.505 0 0 1-2.12-10.5 12.538 12.538 0 0 1 2.464-4.909 12.576 12.576 0 0 1 4.336-3.385 12.617 12.617 0 0 1 10.75-.023 12.573 12.573 0 0 1 4.351 3.366 12.484 12.484 0 0 1 1.4 13.848c-.864 1.616-2.778.854-4.797.048-1.583-.63-3.232-1.287-4.49-.844Zm50.068 53.706c9.39-7.37 12.837-19.402 12.837-26.814 0-5.858-3.957-4.014-10.29-.89l-.356.176c-5.814 2.868-13.552 6.687-22.047 6.687-8.496 0-16.234-3.82-22.046-6.688-6.538-3.227-10.639-5.251-10.639.717 0 7.645 3.67 20.2 13.74 27.494a21.775 21.775 0 0 1 5.494-7.009 21.863 21.863 0 0 1 
7.85-4.233c1.004-.298 2.04 1.426 3.1 3.19 1.023 1.704 2.067 3.445 3.132 3.445 1.132 0 2.245-1.716 3.333-3.392 1.135-1.75 2.242-3.458 3.313-3.116a21.845 21.845 0 0 1 12.58 10.433Z" fill="#32343D"/><path d="M136 134.59c-4.915 3.837-11.447 6.41-19.954 6.41-7.993 0-14.245-2.271-19.046-5.729a21.81 21.81 0 0 1 5.524-7.003 22.042 22.042 0 0 1 7.889-4.234c1.985-.587 4.087 6.632 6.264 6.632 2.33 0 4.575-7.173 6.682-6.506a21.939 21.939 0 0 1 12.63 10.43Z" fill="#FF323D" fill-rule="nonzero"/><path d="M63.71 90.637a8.248 8.248 0 0 1-2.943 1.206 8.326 8.326 0 0 1-3.19.006 8.266 8.266 0 0 1-2.946-1.193 8.082 8.082 0 0 1-2.256-2.21 7.917 7.917 0 0 1-1.22-2.89 7.856 7.856 0 0 1 .004-3.129 7.927 7.927 0 0 1 1.226-2.887 8.084 8.084 0 0 1 2.26-2.205 8.286 8.286 0 0 1 6.114-1.179 8.165 8.165 0 0 1 5.178 3.399 7.876 7.876 0 0 1 1.22 5.992 7.995 7.995 0 0 1-3.448 5.09Zm116.687 0c-.89.588-1.89.998-2.942 1.206a8.325 8.325 0 0 1-3.188.006 8.269 8.269 0 0 1-2.948-1.193 8.075 8.075 0 0 1-2.255-2.21 7.869 7.869 0 0 1 .01-8.905 8.086 8.086 0 0 1 2.26-2.206 8.287 8.287 0 0 1 6.113-1.179 8.167 8.167 0 0 1 5.178 3.399 7.876 7.876 0 0 1 1.22 5.992 7.995 7.995 0 0 1-3.448 5.09Z" fill="#FFAD03"/></g></svg>
"""

# Build the Gradio UI. Components are created top to bottom inside the Blocks
# context: header, quick-filter checkboxes, "last updated" note, leaderboard
# table, and a refresh button.
with gr.Blocks(css=css) as demo:
    # Page header: inline SVG logo, title and subtitle.
    gr.HTML(f"""
        <div class="header-container">
            <div>{hf_logo_svg}</div><br />
            <div class="leaderboard-title">Open LLM Leaderboard</div>
        </div>
        <div class="leaderboard-subtitle">Comparing Large Language Models in an open and reproducible way</div>
    """)

    with gr.Row():
        # NOTE(review): `filters` is not connected to any event handler in
        # the visible code, so ticking a filter does not change the table.
        filters = gr.CheckboxGroup(
            label="Quick Filters",
            choices=filter_choices,
        )

    with gr.Row():
        # The timestamp is a hard-coded string, not derived from the data.
        status_text = gr.HTML("<div style='text-align: right; color: #888; font-size: 0.8rem;'>Last updated: June 25, 2024 at 10:30 AM</div>")

    # Initial table contents are computed once, while the UI is being built.
    leaderboard_df = create_leaderboard_data()
    # headers, datatype and column_widths each list 11 entries, one per
    # column of the DataFrame built by create_leaderboard_data(). "Model" is
    # typed "markdown", presumably so its [name](url) cells render as links
    # (confirm against the Gradio Dataframe docs).
    leaderboard_table = gr.Dataframe(
        value=leaderboard_df,
        headers=["Rank", "Type", "Model", "Average", "IFEval", "BBHI", "MATH", "GPQA", "MUJB", "MMLU-PRO", "CO_Cost"],
        datatype=["number", "str", "markdown", "str", "str", "str", "str", "str", "str", "str", "str"],
        elem_id="leaderboard-table",
        interactive=False,
        max_height=600,
        show_search="search",
        show_copy_button=True,
        show_fullscreen_button=True,
        pinned_columns=2,
        column_widths=["5%", "7%", "35%", "7%", "7%", "7%", "7%", "7%", "7%", "7%", "6%"]
    )

    # Refresh re-runs create_leaderboard_data() and writes the result into the
    # table. That function uses a fixed random seed (42), so the refreshed
    # table is identical to the initial one.
    refresh_btn = gr.Button("Refresh Data")
    refresh_btn.click(fn=lambda: create_leaderboard_data(), outputs=leaderboard_table)

# Start the Gradio server only when this file is run as a script.
if __name__ == "__main__":
    demo.launch()