Spaces:
Sleeping
Sleeping
app.py
CHANGED
@@ -96,10 +96,10 @@ with demo:
|
|
96 |
gr.Markdown(INTRODUCTION_TEXT, elem_classes="markdown-text")
|
97 |
|
98 |
with gr.Tabs(elem_classes="tab-buttons") as tabs:
|
99 |
-
with gr.TabItem("π
|
100 |
leaderboard = init_leaderboard(LEADERBOARD_DF)
|
101 |
|
102 |
-
with gr.TabItem("π
|
103 |
leaderboard = init_leaderboard(LEADERBOARD_DF_N_CORRECT)
|
104 |
|
105 |
with gr.TabItem("📝 About", elem_id="llm-benchmark-tab-table-n-correct", id=2):
|
@@ -153,7 +153,7 @@ with demo:
|
|
153 |
revision_name_textbox = gr.Textbox(label="Revision commit", placeholder="main")
|
154 |
output_format = gr.Textbox(label="Output format", placeholder="Out-GEN")
|
155 |
version = gr.Dropdown(
|
156 |
-
["1_correct", "1_correct_var", "n_correct",], value=
|
157 |
)
|
158 |
|
159 |
with gr.Row():
|
|
|
96 |
gr.Markdown(INTRODUCTION_TEXT, elem_classes="markdown-text")
|
97 |
|
98 |
with gr.Tabs(elem_classes="tab-buttons") as tabs:
|
99 |
+
with gr.TabItem("🏅 1 Correct", elem_id="llm-benchmark-tab-table", id=0):
|
100 |
leaderboard = init_leaderboard(LEADERBOARD_DF)
|
101 |
|
102 |
+
with gr.TabItem("🏅 N Correct", elem_id="llm-benchmark-tab-table", id=1):
|
103 |
leaderboard = init_leaderboard(LEADERBOARD_DF_N_CORRECT)
|
104 |
|
105 |
with gr.TabItem("📝 About", elem_id="llm-benchmark-tab-table-n-correct", id=2):
|
|
|
153 |
revision_name_textbox = gr.Textbox(label="Revision commit", placeholder="main")
|
154 |
output_format = gr.Textbox(label="Output format", placeholder="Out-GEN")
|
155 |
version = gr.Dropdown(
|
156 |
+
["1_correct", "1_correct_var", "n_correct",], value="1_correct", multiselect=False, label="Task version",
|
157 |
)
|
158 |
|
159 |
with gr.Row():
|