Spaces:
Running
on
CPU Upgrade
Running
on
CPU Upgrade
Update src/leaderboard/read_evals.py
Browse files
src/leaderboard/read_evals.py
CHANGED
@@ -67,28 +67,17 @@ class EvalResult:
|
|
67 |
architectures = getattr(model_config, "architectures", None)
|
68 |
if architectures:
|
69 |
architecture = ";".join(architectures)
|
70 |
-
|
71 |
-
# # Extract results available in this file (some results are split in several files)
|
72 |
-
# results = {}
|
73 |
-
# for task in Tasks:
|
74 |
-
# task = task.value
|
75 |
-
|
76 |
-
# # We average all scores of a given metric (not all metrics are present in all files)
|
77 |
-
# accs = np.array([v for k, v in data[task.benchmark].items() if task.metric == k])
|
78 |
-
# if accs.size == 0 or any([acc is None for acc in accs]):
|
79 |
-
# continue
|
80 |
-
|
81 |
-
# mean_acc = np.mean(accs) * 100.0
|
82 |
-
# results[task.benchmark] = mean_acc
|
83 |
if "scores" not in data:
|
84 |
raise KeyError(f"'scores' key not found in JSON file: {json_filepath}")
|
85 |
|
86 |
scores = data["scores"]
|
87 |
results = {}
|
88 |
for task in Tasks:
|
89 |
-
|
90 |
-
if
|
91 |
-
results[
|
|
|
92 |
|
93 |
return self(
|
94 |
eval_name=result_key,
|
|
|
67 |
architectures = getattr(model_config, "architectures", None)
|
68 |
if architectures:
|
69 |
architecture = ";".join(architectures)
|
70 |
+
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
71 |
if "scores" not in data:
|
72 |
raise KeyError(f"'scores' key not found in JSON file: {json_filepath}")
|
73 |
|
74 |
scores = data["scores"]
|
75 |
results = {}
|
76 |
for task in Tasks:
|
77 |
+
task_value = task.value
|
78 |
+
if task_value.metric in scores:
|
79 |
+
results[task_value.benchmark] = Decimal(scores[task_value.metric])
|
80 |
+
|
81 |
|
82 |
return self(
|
83 |
eval_name=result_key,
|