xeon27 committed on
Commit
64ec699
·
1 Parent(s): 51b158d
Files changed (1) hide show
  1. src/populate.py +5 -1
src/populate.py CHANGED
@@ -9,6 +9,8 @@ from src.display.formatting import has_no_nan_values, make_clickable_model
9
  from src.display.utils import AutoEvalColumn, EvalQueueColumn
10
  from src.leaderboard.read_evals import get_raw_eval_results
11
 
 
 
12
 
13
  TASK_NAME_INVERSE_MAP = dict()
14
  for task in Tasks:
@@ -51,9 +53,11 @@ def get_leaderboard_df(results_path: str, requests_path: str, cols: list, benchm
51
 
52
  df = df.fillna(EMPTY_SYMBOL)
53
 
 
 
54
  # make values clickable and link to log files
55
  for col in benchmark_cols:
56
- df[col] = df[[AutoEvalColumn.model.name, col]].apply(lambda x: f"[{x[col]}]({get_inspect_log_url(model_name=x[AutoEvalColumn.model.name].split('>')[1].split('<')[0], benchmark_name=TASK_NAME_INVERSE_MAP[col]['name'])})" if x[col] != EMPTY_SYMBOL else x[col], axis=1)
57
 
58
  return df
59
 
 
9
  from src.display.utils import AutoEvalColumn, EvalQueueColumn
10
  from src.leaderboard.read_evals import get_raw_eval_results
11
 
12
+ from refactor_eval_results import MODEL_VERSION_MAP
13
+
14
 
15
  TASK_NAME_INVERSE_MAP = dict()
16
  for task in Tasks:
 
53
 
54
  df = df.fillna(EMPTY_SYMBOL)
55
 
56
+ inverse_model_version_map = {v: k for k, v in MODEL_VERSION_MAP.items()}
57
+
58
  # make values clickable and link to log files
59
  for col in benchmark_cols:
60
+ df[col] = df[[AutoEvalColumn.model.name, col]].apply(lambda x: f"[{x[col]}]({get_inspect_log_url(model_name=inverse_model_version_map[x[AutoEvalColumn.model.name].split('>')[1].split('<')[0]], benchmark_name=TASK_NAME_INVERSE_MAP[col]['name'])})" if x[col] != EMPTY_SYMBOL else x[col], axis=1)
61
 
62
  return df
63