Spaces:
Running
Running
Update app.py
Browse files
app.py
CHANGED
@@ -175,7 +175,7 @@ def build_basic_stats_tab():
|
|
175 |
md4 = gr.Markdown(empty)
|
176 |
return [md0, plot_1, md1, md2, md3, md4]
|
177 |
|
178 |
-
def get_full_table(
|
179 |
values = []
|
180 |
for i in range(len(model_table_df)):
|
181 |
row = []
|
@@ -183,11 +183,7 @@ def get_full_table(arena_df, model_table_df):
|
|
183 |
model_name = model_table_df.iloc[i]["Model"]
|
184 |
# model display name
|
185 |
row.append(model_name)
|
186 |
-
|
187 |
-
idx = arena_df.index.get_loc(model_key)
|
188 |
-
row.append(round(arena_df.iloc[idx]["rating"]))
|
189 |
-
else:
|
190 |
-
row.append(np.nan)
|
191 |
row.append(model_table_df.iloc[i]["MT-bench (score)"])
|
192 |
row.append(model_table_df.iloc[i]["MMLU"])
|
193 |
# Organization
|
@@ -313,9 +309,49 @@ def build_leaderboard_tab(elo_results_file, leaderboard_table_file, show_plot=Fa
|
|
313 |
with gr.Tabs() as tabs:
|
314 |
# arena table
|
315 |
arena_table_vals = get_arena_table(arena_df, model_table_df)
|
316 |
-
with gr.Tab("Arena Elo", id=0):
|
317 |
-
|
318 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
319 |
with gr.Row():
|
320 |
with gr.Column(scale=2):
|
321 |
category_dropdown = gr.Dropdown(choices=list(arena_dfs.keys()), label="Category", value="Overall")
|
@@ -323,40 +359,7 @@ def build_leaderboard_tab(elo_results_file, leaderboard_table_file, show_plot=Fa
|
|
323 |
with gr.Column(scale=4, variant="panel"):
|
324 |
category_deets = gr.Markdown(default_category_details, elem_id="category_deets")
|
325 |
|
326 |
-
|
327 |
-
headers=[
|
328 |
-
"Rank",
|
329 |
-
"🤖 Model",
|
330 |
-
"⭐ Arena Elo",
|
331 |
-
"Organization",
|
332 |
-
"License",
|
333 |
-
],
|
334 |
-
datatype=[
|
335 |
-
"number",
|
336 |
-
"markdown",
|
337 |
-
"number",
|
338 |
-
"str",
|
339 |
-
"str",
|
340 |
-
],
|
341 |
-
value=arena_table_vals,
|
342 |
-
elem_id="arena_leaderboard_dataframe",
|
343 |
-
height=700,
|
344 |
-
column_widths=[70, 190, 110, 160, 150, 140],
|
345 |
-
wrap=True,
|
346 |
-
)
|
347 |
-
|
348 |
-
gr.Markdown(
|
349 |
-
f"""Note: .
|
350 |
-
""",
|
351 |
-
elem_id="leaderboard_markdown"
|
352 |
-
)
|
353 |
-
|
354 |
-
leader_component_values[:] = [default_md]
|
355 |
-
|
356 |
-
with gr.Tab("Full Leaderboard", id=1):
|
357 |
-
md = make_full_leaderboard_md(elo_results)
|
358 |
-
gr.Markdown(md, elem_id="leaderboard_markdown")
|
359 |
-
full_table_vals = get_full_table(arena_df, model_table_df)
|
360 |
gr.Dataframe(
|
361 |
headers=[
|
362 |
"🤖 Model",
|
@@ -375,7 +378,7 @@ def build_leaderboard_tab(elo_results_file, leaderboard_table_file, show_plot=Fa
|
|
375 |
)
|
376 |
if not show_plot:
|
377 |
gr.Markdown(
|
378 |
-
""" ##
|
379 |
""",
|
380 |
elem_id="leaderboard_markdown",
|
381 |
)
|
|
|
175 |
md4 = gr.Markdown(empty)
|
176 |
return [md0, plot_1, md1, md2, md3, md4]
|
177 |
|
178 |
+
def get_full_table(model_table_df):
|
179 |
values = []
|
180 |
for i in range(len(model_table_df)):
|
181 |
row = []
|
|
|
183 |
model_name = model_table_df.iloc[i]["Model"]
|
184 |
# model display name
|
185 |
row.append(model_name)
|
186 |
+
row.append(np.nan)
|
|
|
|
|
|
|
|
|
187 |
row.append(model_table_df.iloc[i]["MT-bench (score)"])
|
188 |
row.append(model_table_df.iloc[i]["MMLU"])
|
189 |
# Organization
|
|
|
309 |
with gr.Tabs() as tabs:
|
310 |
# arena table
|
311 |
arena_table_vals = get_arena_table(arena_df, model_table_df)
|
312 |
+
# with gr.Tab("Arena Elo", id=0):
|
313 |
+
# md = make_arena_leaderboard_md(arena_df)
|
314 |
+
# leaderboard_markdown = gr.Markdown(md, elem_id="leaderboard_markdown")
|
315 |
+
# with gr.Row():
|
316 |
+
# with gr.Column(scale=2):
|
317 |
+
# category_dropdown = gr.Dropdown(choices=list(arena_dfs.keys()), label="Category", value="Overall")
|
318 |
+
# default_category_details = make_category_arena_leaderboard_md(arena_df, arena_df, name="Overall")
|
319 |
+
# with gr.Column(scale=4, variant="panel"):
|
320 |
+
# category_deets = gr.Markdown(default_category_details, elem_id="category_deets")
|
321 |
+
|
322 |
+
# elo_display_df = gr.Dataframe(
|
323 |
+
# headers=[
|
324 |
+
# "Rank",
|
325 |
+
# "🤖 Model",
|
326 |
+
# "⭐ Arena Elo",
|
327 |
+
# "Organization",
|
328 |
+
# "License",
|
329 |
+
# ],
|
330 |
+
# datatype=[
|
331 |
+
# "number",
|
332 |
+
# "markdown",
|
333 |
+
# "number",
|
334 |
+
# "str",
|
335 |
+
# "str",
|
336 |
+
# ],
|
337 |
+
# value=arena_table_vals,
|
338 |
+
# elem_id="arena_leaderboard_dataframe",
|
339 |
+
# height=700,
|
340 |
+
# column_widths=[70, 190, 110, 160, 150, 140],
|
341 |
+
# wrap=True,
|
342 |
+
# )
|
343 |
+
|
344 |
+
# gr.Markdown(
|
345 |
+
# f"""Note: .
|
346 |
+
# """,
|
347 |
+
# elem_id="leaderboard_markdown"
|
348 |
+
# )
|
349 |
+
|
350 |
+
# leader_component_values[:] = [default_md]
|
351 |
+
|
352 |
+
with gr.Tab("Full Leaderboard", id=0):
|
353 |
+
md = make_full_leaderboard_md(elo_results)
|
354 |
+
gr.Markdown(md, elem_id="leaderboard_markdown")
|
355 |
with gr.Row():
|
356 |
with gr.Column(scale=2):
|
357 |
category_dropdown = gr.Dropdown(choices=list(arena_dfs.keys()), label="Category", value="Overall")
|
|
|
359 |
with gr.Column(scale=4, variant="panel"):
|
360 |
category_deets = gr.Markdown(default_category_details, elem_id="category_deets")
|
361 |
|
362 |
+
full_table_vals = get_full_table(model_table_df)
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
363 |
gr.Dataframe(
|
364 |
headers=[
|
365 |
"🤖 Model",
|
|
|
378 |
)
|
379 |
if not show_plot:
|
380 |
gr.Markdown(
|
381 |
+
""" ## Submit your model [here]().
|
382 |
""",
|
383 |
elem_id="leaderboard_markdown",
|
384 |
)
|