Fix new schema
Browse files
app.py
CHANGED
@@ -43,7 +43,7 @@ def get_leaderboard_df(merge_values: bool = False):
|
|
43 |
value = data["results"][first_result_key]["prompt_level_loose_acc"]
|
44 |
# MMLU has several metrics but we report just the average one
|
45 |
elif task.lower() == "mmlu":
|
46 |
-
value = data["results"]
|
47 |
# HellaSwag and ARC report acc_norm
|
48 |
elif task.lower() in ["hellaswag", "arc"]:
|
49 |
value = data["results"][first_result_key]["acc_norm"]
|
@@ -102,6 +102,7 @@ with demo:
|
|
102 |
with gr.Row():
|
103 |
search_bar = gr.Textbox(placeholder="Search for your model...", show_label=False)
|
104 |
merge_values = gr.Checkbox(
|
|
|
105 |
label="Merge evals",
|
106 |
info="Merge evals for the same model. If there are duplicates, we display the largest one.",
|
107 |
)
|
|
|
43 |
value = data["results"][first_result_key]["prompt_level_loose_acc"]
|
44 |
# MMLU has several metrics but we report just the average one
|
45 |
elif task.lower() == "mmlu":
|
46 |
+
value = [v["acc"] for k, v in data["results"].items() if "_average" in k.lower()][0]
|
47 |
# HellaSwag and ARC report acc_norm
|
48 |
elif task.lower() in ["hellaswag", "arc"]:
|
49 |
value = data["results"][first_result_key]["acc_norm"]
|
|
|
102 |
with gr.Row():
|
103 |
search_bar = gr.Textbox(placeholder="Search for your model...", show_label=False)
|
104 |
merge_values = gr.Checkbox(
|
105 |
+
value=True,
|
106 |
label="Merge evals",
|
107 |
info="Merge evals for the same model. If there are duplicates, we display the largest one.",
|
108 |
)
|