Spaces:
Running
on
CPU Upgrade
Running
on
CPU Upgrade
Edits.
Browse files
- app.py +4 -0
- assets/{f1_performance.png → tier1_performance.png} +0 -0
- src/about.py +2 -2
app.py
CHANGED
@@ -302,6 +302,7 @@ with blocks:
|
|
302 |
gr.HTML(WHAT_IS_F1_HTML_EVAL_BEFORE_WARMUPFIG)
|
303 |
gr.Image(
|
304 |
"assets/warmup_performance.png",
|
|
|
305 |
show_label=False,
|
306 |
elem_classes=["f1-image"],
|
307 |
show_share_button=False,
|
@@ -316,6 +317,7 @@ with blocks:
|
|
316 |
# Tier 1 figure with corrected caption text
|
317 |
gr.Image(
|
318 |
"assets/tier1_performance.png",
|
|
|
319 |
show_label=False,
|
320 |
elem_classes=["f1-image"],
|
321 |
show_share_button=False,
|
@@ -351,6 +353,8 @@ with blocks:
|
|
351 |
with gr.Row():
|
352 |
gr.Markdown("# ✉️✨ Submit your solutions", elem_classes="markdown-text")
|
353 |
|
|
|
|
|
354 |
login_box = gr.Group(visible=True)
|
355 |
with login_box:
|
356 |
gr.Markdown("Please sign in with Hugging Face to submit")
|
|
|
302 |
gr.HTML(WHAT_IS_F1_HTML_EVAL_BEFORE_WARMUPFIG)
|
303 |
gr.Image(
|
304 |
"assets/warmup_performance.png",
|
305 |
+
width=600,
|
306 |
show_label=False,
|
307 |
elem_classes=["f1-image"],
|
308 |
show_share_button=False,
|
|
|
317 |
# Tier 1 figure with corrected caption text
|
318 |
gr.Image(
|
319 |
"assets/tier1_performance.png",
|
320 |
+
width=600,
|
321 |
show_label=False,
|
322 |
elem_classes=["f1-image"],
|
323 |
show_share_button=False,
|
|
|
353 |
with gr.Row():
|
354 |
gr.Markdown("# ✉️✨ Submit your solutions", elem_classes="markdown-text")
|
355 |
|
356 |
+
with gr.Row():
|
357 |
+
|
358 |
login_box = gr.Group(visible=True)
|
359 |
with login_box:
|
360 |
gr.Markdown("Please sign in with Hugging Face to submit")
|
assets/{f1_performance.png → tier1_performance.png}
RENAMED
File without changes
|
src/about.py
CHANGED
@@ -19,7 +19,7 @@ WHAT_IS_F1_HTML_TOP = f"""
|
|
19 |
<div class="f1-grid-table" role="table">
|
20 |
<div class="f1-grid-row f1-grid-head" role="row">
|
21 |
<div class="f1-grid-cell" role="columnheader">Category</div>
|
22 |
-
<div class="f1-grid-cell" role="columnheader">
|
23 |
<div class="f1-grid-cell" role="columnheader">Description</div>
|
24 |
</div>
|
25 |
<div class="f1-grid-row" role="row">
|
@@ -50,7 +50,7 @@ WHAT_IS_F1_HTML_BOTTOM_A = """
|
|
50 |
<div class="f1-container">
|
51 |
<section>
|
52 |
<p class="mb-4 f1-p">The latter category is incredibly demanding, requiring resolution of many points of uncertainty, and involving an array of reasoning steps, including topological and geometric insight, knowledge of mathematical domains such as extremal graph theory and logic, combinatorial considerations, precise implementation, and more.</p>
|
53 |
-
<p class="f1-p">Despite <a href="https://epoch.ai/frontiermath" target="_blank" rel="noopener noreferrer" class="f1-a">impressive</a> <a href="https://artificialanalysis.ai/evaluations/gpqa-diamond" target="_blank" rel="noopener noreferrer" class="f1-a">performance</a> on existing benchmarks, presently <strong>no model solves even a single
|
54 |
</section>
|
55 |
|
56 |
<section>
|
|
|
19 |
<div class="f1-grid-table" role="table">
|
20 |
<div class="f1-grid-row f1-grid-head" role="row">
|
21 |
<div class="f1-grid-cell" role="columnheader">Category</div>
|
22 |
+
<div class="f1-grid-cell" role="columnheader">Size</div>
|
23 |
<div class="f1-grid-cell" role="columnheader">Description</div>
|
24 |
</div>
|
25 |
<div class="f1-grid-row" role="row">
|
|
|
50 |
<div class="f1-container">
|
51 |
<section>
|
52 |
<p class="mb-4 f1-p">The latter category is incredibly demanding, requiring resolution of many points of uncertainty, and involving an array of reasoning steps, including topological and geometric insight, knowledge of mathematical domains such as extremal graph theory and logic, combinatorial considerations, precise implementation, and more.</p>
|
53 |
+
<p class="f1-p">Despite <a href="https://epoch.ai/frontiermath" target="_blank" rel="noopener noreferrer" class="f1-a">impressive</a> <a href="https://artificialanalysis.ai/evaluations/gpqa-diamond" target="_blank" rel="noopener noreferrer" class="f1-a">performance</a> on existing benchmarks, presently <strong>no model solves even a single Tier 2 problem</strong>.<sup><a href="#evaluation" class="f1-a">1</a></sup></p>
|
54 |
</section>
|
55 |
|
56 |
<section>
|