xeon27
committed on
Commit
·
18638a9
1
Parent(s):
cd53742
Replace missing values by None
Browse files
- refactor_eval_results.py +1 -1
- src/populate.py +4 -0
refactor_eval_results.py
CHANGED
@@ -96,7 +96,7 @@ def main():
|
|
96 |
# TMP: Add dummy agentic benchmarks to the results
|
97 |
for metric in METRIC_NAME.items():
|
98 |
if metric[0] not in results["results"]:
|
99 |
-
results["results"].update({metric[0]: {metric[1]:
|
100 |
if os.path.isdir(os.path.join(agentic_bm_input_path, model_name)):
|
101 |
agentic_bm_results = combine_eval_results(agentic_bm_input_path, model_name)
|
102 |
results["results"].update(agentic_bm_results["results"])
|
|
|
96 |
# TMP: Add dummy agentic benchmarks to the results
|
97 |
for metric in METRIC_NAME.items():
|
98 |
if metric[0] not in results["results"]:
|
99 |
+
results["results"].update({metric[0]: {metric[1]: None}})
|
100 |
if os.path.isdir(os.path.join(agentic_bm_input_path, model_name)):
|
101 |
agentic_bm_results = combine_eval_results(agentic_bm_input_path, model_name)
|
102 |
results["results"].update(agentic_bm_results["results"])
|
src/populate.py
CHANGED
@@ -41,8 +41,12 @@ def get_leaderboard_df(results_path: str, requests_path: str, cols: list, benchm
|
|
41 |
df = df.sort_values(by=[AutoEvalColumn.average.name], ascending=False)
|
42 |
df = df[cols].round(decimals=2)
|
43 |
|
|
|
|
|
44 |
# filter out if any of the benchmarks have not been produced
|
45 |
df = df[has_no_nan_values(df, benchmark_cols)]
|
|
|
|
|
46 |
|
47 |
# make values clickable and link to log files
|
48 |
for col in benchmark_cols:
|
|
|
41 |
df = df.sort_values(by=[AutoEvalColumn.average.name], ascending=False)
|
42 |
df = df[cols].round(decimals=2)
|
43 |
|
44 |
+
# TMP: Debug
|
45 |
+
print(df.shape())
|
46 |
# filter out if any of the benchmarks have not been produced
|
47 |
df = df[has_no_nan_values(df, benchmark_cols)]
|
48 |
+
# TMP: Debug
|
49 |
+
print(df.shape())
|
50 |
|
51 |
# make values clickable and link to log files
|
52 |
for col in benchmark_cols:
|