xeon27
committed on
Commit
·
64ec699
1
Parent(s):
51b158d
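Fix bug: look up the displayed model name in the inverted MODEL_VERSION_MAP before building inspect-log URLs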
Browse files- src/populate.py +5 -1
src/populate.py
CHANGED
@@ -9,6 +9,8 @@ from src.display.formatting import has_no_nan_values, make_clickable_model
|
|
9 |
from src.display.utils import AutoEvalColumn, EvalQueueColumn
|
10 |
from src.leaderboard.read_evals import get_raw_eval_results
|
11 |
|
|
|
|
|
12 |
|
13 |
TASK_NAME_INVERSE_MAP = dict()
|
14 |
for task in Tasks:
|
@@ -51,9 +53,11 @@ def get_leaderboard_df(results_path: str, requests_path: str, cols: list, benchm
|
|
51 |
|
52 |
df = df.fillna(EMPTY_SYMBOL)
|
53 |
|
|
|
|
|
54 |
# make values clickable and link to log files
|
55 |
for col in benchmark_cols:
|
56 |
-
df[col] = df[[AutoEvalColumn.model.name, col]].apply(lambda x: f"[{x[col]}]({get_inspect_log_url(model_name=x[AutoEvalColumn.model.name].split('>')[1].split('<')[0], benchmark_name=TASK_NAME_INVERSE_MAP[col]['name'])})" if x[col] != EMPTY_SYMBOL else x[col], axis=1)
|
57 |
|
58 |
return df
|
59 |
|
|
|
9 |
from src.display.utils import AutoEvalColumn, EvalQueueColumn
|
10 |
from src.leaderboard.read_evals import get_raw_eval_results
|
11 |
|
12 |
+
from refactor_eval_results import MODEL_VERSION_MAP
|
13 |
+
|
14 |
|
15 |
TASK_NAME_INVERSE_MAP = dict()
|
16 |
for task in Tasks:
|
|
|
53 |
|
54 |
df = df.fillna(EMPTY_SYMBOL)
|
55 |
|
56 |
+
inverse_model_version_map = {v: k for k, v in MODEL_VERSION_MAP.items()}
|
57 |
+
|
58 |
# make values clickable and link to log files
|
59 |
for col in benchmark_cols:
|
60 |
+
df[col] = df[[AutoEvalColumn.model.name, col]].apply(lambda x: f"[{x[col]}]({get_inspect_log_url(model_name=inverse_model_version_map[x[AutoEvalColumn.model.name].split('>')[1].split('<')[0]], benchmark_name=TASK_NAME_INVERSE_MAP[col]['name'])})" if x[col] != EMPTY_SYMBOL else x[col], axis=1)
|
61 |
|
62 |
return df
|
63 |
|