Spaces:
Running
Running
Update app.py
Browse files
app.py
CHANGED
@@ -53,7 +53,7 @@ except Exception:
|
|
53 |
|
54 |
LEADERBOARD_DF = get_leaderboard_df(EVAL_RESULTS_PATH, EVAL_REQUESTS_PATH, COLS, BENCHMARK_COLS)
|
55 |
_test_data = pd.DataFrame({"Score": [54,46,53], "Name": ["MageBench", "MageBench", "MageBench"], "BaseModel": ["GPT-4o", "GPT-4o", "LLaMA"], "Env.": ["Sokoban", "Sokoban", "Football"],
|
56 |
-
"Target-research": ["Model-Eval-Global", "Model-Eval-Online", "Agent-Eval-Prompt"], "Link": ["xxx", "xxx", "xxx"]})
|
57 |
|
58 |
|
59 |
(
|
@@ -79,6 +79,7 @@ def init_leaderboard(dataframe):
|
|
79 |
ColumnFilter("Target-research", type="checkboxgroup", label="Comparison settings for target researches (Single Selection)"),
|
80 |
ColumnFilter("BaseModel", type="dropdown", label="Select The base lmm model that fultill the task."),
|
81 |
ColumnFilter("Env.", type="checkboxgroup", label="Environment (Single Selection)"),
|
|
|
82 |
# ColumnFilter(AutoEvalColumn.precision.name, type="checkboxgroup", label="Precision"),
|
83 |
# ColumnFilter(
|
84 |
# AutoEvalColumn.params.name,
|
|
|
53 |
|
54 |
LEADERBOARD_DF = get_leaderboard_df(EVAL_RESULTS_PATH, EVAL_REQUESTS_PATH, COLS, BENCHMARK_COLS)
|
55 |
_test_data = pd.DataFrame({"Score": [54,46,53], "Name": ["MageBench", "MageBench", "MageBench"], "BaseModel": ["GPT-4o", "GPT-4o", "LLaMA"], "Env.": ["Sokoban", "Sokoban", "Football"],
|
56 |
+
"Target-research": ["Model-Eval-Global", "Model-Eval-Online", "Agent-Eval-Prompt"], "Subset": ["mini", "all", "mini"], "Link": ["xxx", "xxx", "xxx"]})
|
57 |
|
58 |
|
59 |
(
|
|
|
79 |
ColumnFilter("Target-research", type="checkboxgroup", label="Comparison settings for target researches (Single Selection)"),
|
80 |
ColumnFilter("BaseModel", type="dropdown", label="Select The base lmm model that fultill the task."),
|
81 |
ColumnFilter("Env.", type="checkboxgroup", label="Environment (Single Selection)"),
|
82 |
+
ColumnFilter("Subset", type="checkboxgroup", label="Subset (Single Selection)"),
|
83 |
# ColumnFilter(AutoEvalColumn.precision.name, type="checkboxgroup", label="Precision"),
|
84 |
# ColumnFilter(
|
85 |
# AutoEvalColumn.params.name,
|