Spaces:
Sleeping
Sleeping
src/leaderboard/read_evals.py
CHANGED
@@ -118,7 +118,8 @@ class EvalResult:
|
|
118 |
|
119 |
def to_dict(self, tasks):
|
120 |
"""Converts the Eval Result to a dict compatible with our dataframe display"""
|
121 |
-
|
|
|
122 |
data_dict = {
|
123 |
"eval_name": self.eval_name, # not a column, just a save name,
|
124 |
AutoEvalColumn.architecture.name: self.architecture,
|
|
|
118 |
|
119 |
def to_dict(self, tasks):
|
120 |
"""Converts the Eval Result to a dict compatible with our dataframe display"""
|
121 |
+
avg_metrics = [v for k, v in self.results.items() if v is not None and " " not in k]
|
122 |
+
average = sum(avg_metrics) / len(avg_metrics)
|
123 |
data_dict = {
|
124 |
"eval_name": self.eval_name, # not a column, just a save name,
|
125 |
AutoEvalColumn.architecture.name: self.architecture,
|