xeon27 committed on
Commit
18638a9
·
1 Parent(s): cd53742

Replace missing values by None

Browse files
Files changed (2) hide show
  1. refactor_eval_results.py +1 -1
  2. src/populate.py +4 -0
refactor_eval_results.py CHANGED
@@ -96,7 +96,7 @@ def main():
96
  # TMP: Add dummy agentic benchmarks to the results
97
  for metric in METRIC_NAME.items():
98
  if metric[0] not in results["results"]:
99
- results["results"].update({metric[0]: {metric[1]: -1.0}})
100
  if os.path.isdir(os.path.join(agentic_bm_input_path, model_name)):
101
  agentic_bm_results = combine_eval_results(agentic_bm_input_path, model_name)
102
  results["results"].update(agentic_bm_results["results"])
 
96
  # TMP: Add dummy agentic benchmarks to the results
97
  for metric in METRIC_NAME.items():
98
  if metric[0] not in results["results"]:
99
+ results["results"].update({metric[0]: {metric[1]: None}})
100
  if os.path.isdir(os.path.join(agentic_bm_input_path, model_name)):
101
  agentic_bm_results = combine_eval_results(agentic_bm_input_path, model_name)
102
  results["results"].update(agentic_bm_results["results"])
src/populate.py CHANGED
@@ -41,8 +41,12 @@ def get_leaderboard_df(results_path: str, requests_path: str, cols: list, benchm
41
  df = df.sort_values(by=[AutoEvalColumn.average.name], ascending=False)
42
  df = df[cols].round(decimals=2)
43
 
 
 
44
  # filter out if any of the benchmarks have not been produced
45
  df = df[has_no_nan_values(df, benchmark_cols)]
 
 
46
 
47
  # make values clickable and link to log files
48
  for col in benchmark_cols:
 
41
  df = df.sort_values(by=[AutoEvalColumn.average.name], ascending=False)
42
  df = df[cols].round(decimals=2)
43
 
44
+ # TMP: Debug
45
+ print(df.shape())
46
  # filter out if any of the benchmarks have not been produced
47
  df = df[has_no_nan_values(df, benchmark_cols)]
48
+ # TMP: Debug
49
+ print(df.shape())
50
 
51
  # make values clickable and link to log files
52
  for col in benchmark_cols: