Spaces:
Sleeping
Sleeping
src/leaderboard/read_evals.py
CHANGED
@@ -178,6 +178,7 @@ def get_raw_eval_results(results_path: str, requests_path: str) -> list[EvalResu
|
|
178 |
version = results_path.split("/")[-1]
|
179 |
print(version)
|
180 |
tasks = N_Tasks if "n_" in version else Tasks
|
|
|
181 |
|
182 |
eval_results = {}
|
183 |
for model_result_filepath in model_result_filepaths:
|
@@ -192,7 +193,7 @@ def get_raw_eval_results(results_path: str, requests_path: str) -> list[EvalResu
|
|
192 |
eval_results[eval_name].results.update({k: v for k, v in eval_result.results.items() if v is not None})
|
193 |
else:
|
194 |
eval_results[eval_name] = eval_result
|
195 |
-
|
196 |
results = []
|
197 |
for v in eval_results.values():
|
198 |
try:
|
@@ -200,5 +201,4 @@ def get_raw_eval_results(results_path: str, requests_path: str) -> list[EvalResu
|
|
200 |
results.append(v)
|
201 |
except KeyError: # not all eval values present
|
202 |
continue
|
203 |
-
|
204 |
return results
|
|
|
178 |
version = results_path.split("/")[-1]
|
179 |
print(version)
|
180 |
tasks = N_Tasks if "n_" in version else Tasks
|
181 |
+
print(tasks)
|
182 |
|
183 |
eval_results = {}
|
184 |
for model_result_filepath in model_result_filepaths:
|
|
|
193 |
eval_results[eval_name].results.update({k: v for k, v in eval_result.results.items() if v is not None})
|
194 |
else:
|
195 |
eval_results[eval_name] = eval_result
|
196 |
+
print(eval_results)
|
197 |
results = []
|
198 |
for v in eval_results.values():
|
199 |
try:
|
|
|
201 |
results.append(v)
|
202 |
except KeyError: # not all eval values present
|
203 |
continue
|
|
|
204 |
return results
|