xeon27
committed on
Commit
·
a2f2df3
1
Parent(s):
18638a9
Remove column for average
Browse files
- src/display/utils.py +1 -1
- src/leaderboard/read_evals.py +2 -2
- src/populate.py +1 -1
src/display/utils.py
CHANGED
@@ -26,7 +26,7 @@ auto_eval_column_dict = []
|
|
26 |
# auto_eval_column_dict.append(["model_type_symbol", ColumnContent, ColumnContent("T", "str", True, never_hidden=True)])
|
27 |
auto_eval_column_dict.append(["model", ColumnContent, ColumnContent("Model", "markdown", True, never_hidden=True)])
|
28 |
#Scores
|
29 |
-
auto_eval_column_dict.append(["average", ColumnContent, ColumnContent("Average ⬆️", "markdown", True)])
|
30 |
for task in Tasks:
|
31 |
auto_eval_column_dict.append([task.name, ColumnContent, ColumnContent(task.value.col_name, "markdown", True)])
|
32 |
# # Model information
|
|
|
26 |
# auto_eval_column_dict.append(["model_type_symbol", ColumnContent, ColumnContent("T", "str", True, never_hidden=True)])
|
27 |
auto_eval_column_dict.append(["model", ColumnContent, ColumnContent("Model", "markdown", True, never_hidden=True)])
|
28 |
#Scores
|
29 |
+
# auto_eval_column_dict.append(["average", ColumnContent, ColumnContent("Average ⬆️", "markdown", True)])
|
30 |
for task in Tasks:
|
31 |
auto_eval_column_dict.append([task.name, ColumnContent, ColumnContent(task.value.col_name, "markdown", True)])
|
32 |
# # Model information
|
src/leaderboard/read_evals.py
CHANGED
@@ -109,7 +109,7 @@ class EvalResult:
|
|
109 |
|
110 |
def to_dict(self):
|
111 |
"""Converts the Eval Result to a dict compatible with our dataframe display"""
|
112 |
-
average = sum([v for v in self.results.values() if v is not None]) / len(Tasks)
|
113 |
data_dict = {
|
114 |
"eval_name": self.eval_name, # not a column, just a save name,
|
115 |
# AutoEvalColumn.precision.name: self.precision.value.name,
|
@@ -119,7 +119,7 @@ class EvalResult:
|
|
119 |
# AutoEvalColumn.architecture.name: self.architecture,
|
120 |
AutoEvalColumn.model.name: make_clickable_model(self.full_model),
|
121 |
# AutoEvalColumn.revision.name: self.revision,
|
122 |
-
AutoEvalColumn.average.name: average,
|
123 |
AutoEvalColumn.license.name: self.license,
|
124 |
# AutoEvalColumn.likes.name: self.likes,
|
125 |
# AutoEvalColumn.params.name: self.num_params,
|
|
|
109 |
|
110 |
def to_dict(self):
|
111 |
"""Converts the Eval Result to a dict compatible with our dataframe display"""
|
112 |
+
# average = sum([v for v in self.results.values() if v is not None]) / len(Tasks)
|
113 |
data_dict = {
|
114 |
"eval_name": self.eval_name, # not a column, just a save name,
|
115 |
# AutoEvalColumn.precision.name: self.precision.value.name,
|
|
|
119 |
# AutoEvalColumn.architecture.name: self.architecture,
|
120 |
AutoEvalColumn.model.name: make_clickable_model(self.full_model),
|
121 |
# AutoEvalColumn.revision.name: self.revision,
|
122 |
+
# AutoEvalColumn.average.name: average,
|
123 |
AutoEvalColumn.license.name: self.license,
|
124 |
# AutoEvalColumn.likes.name: self.likes,
|
125 |
# AutoEvalColumn.params.name: self.num_params,
|
src/populate.py
CHANGED
@@ -38,7 +38,7 @@ def get_leaderboard_df(results_path: str, requests_path: str, cols: list, benchm
|
|
38 |
|
39 |
df = pd.DataFrame.from_records(all_data_json)
|
40 |
|
41 |
-
df = df.sort_values(by=[AutoEvalColumn.average.name], ascending=False)
|
42 |
df = df[cols].round(decimals=2)
|
43 |
|
44 |
# TMP: Debug
|
|
|
38 |
|
39 |
df = pd.DataFrame.from_records(all_data_json)
|
40 |
|
41 |
+
# df = df.sort_values(by=[AutoEvalColumn.average.name], ascending=False)
|
42 |
df = df[cols].round(decimals=2)
|
43 |
|
44 |
# TMP: Debug
|