xeon27 committed on
Commit
e004342
·
1 Parent(s): 0dddab1

Add tmp code

Browse files
Files changed (1) hide show
  1. refactor_eval_results.py +4 -0
refactor_eval_results.py CHANGED
@@ -70,6 +70,10 @@ def main():
70
  for model_name in os.listdir(base_bm_input_path):
71
  if os.path.isdir(os.path.join(base_bm_input_path, model_name)):
72
  results = combine_eval_results(base_bm_input_path, model_name)
 
 
 
 
73
  if os.path.isdir(os.path.join(agentic_bm_input_path, model_name)):
74
  agentic_bm_results = combine_eval_results(agentic_bm_input_path, model_name)
75
  results["results"].update(agentic_bm_results["results"])
 
70
  for model_name in os.listdir(base_bm_input_path):
71
  if os.path.isdir(os.path.join(base_bm_input_path, model_name)):
72
  results = combine_eval_results(base_bm_input_path, model_name)
73
+ # TMP: Add dummy agentic benchmarks to the results
74
+ for metric in METRIC_NAME.items():
75
+ if metric[0] not in results["results"]:
76
+ results["results"].update({metric[0]: {metric[1]: -1.0}})
77
  if os.path.isdir(os.path.join(agentic_bm_input_path, model_name)):
78
  agentic_bm_results = combine_eval_results(agentic_bm_input_path, model_name)
79
  results["results"].update(agentic_bm_results["results"])