lewtun HF Staff committed on
Commit
9d1c3ff
·
1 Parent(s): 40f3905

Fix new schema

Browse files
Files changed (1) hide show
  1. app.py +2 -1
app.py CHANGED
@@ -43,7 +43,7 @@ def get_leaderboard_df(merge_values: bool = False):
43
  value = data["results"][first_result_key]["prompt_level_loose_acc"]
44
  # MMLU has several metrics but we report just the average one
45
  elif task.lower() == "mmlu":
46
- value = data["results"]["lighteval|mmlu:_average|5"]["acc"]
47
  # HellaSwag and ARC reports acc_norm
48
  elif task.lower() in ["hellaswag", "arc"]:
49
  value = data["results"][first_result_key]["acc_norm"]
@@ -102,6 +102,7 @@ with demo:
102
  with gr.Row():
103
  search_bar = gr.Textbox(placeholder="Search for your model...", show_label=False)
104
  merge_values = gr.Checkbox(
 
105
  label="Merge evals",
106
  info="Merge evals for the same model. If there are duplicates, we display the largest one.",
107
  )
 
43
  value = data["results"][first_result_key]["prompt_level_loose_acc"]
44
  # MMLU has several metrics but we report just the average one
45
  elif task.lower() == "mmlu":
46
+ value = [v["acc"] for k, v in data["results"].items() if "_average" in k.lower()][0]
47
  # HellaSwag and ARC reports acc_norm
48
  elif task.lower() in ["hellaswag", "arc"]:
49
  value = data["results"][first_result_key]["acc_norm"]
 
102
  with gr.Row():
103
  search_bar = gr.Textbox(placeholder="Search for your model...", show_label=False)
104
  merge_values = gr.Checkbox(
105
+ value=True,
106
  label="Merge evals",
107
  info="Merge evals for the same model. If there are duplicates, we display the largest one.",
108
  )