add captions to figures
Browse files
app.py
CHANGED
@@ -188,24 +188,28 @@ with demo:
|
|
188 |
with gr.TabItem("🏅 Hallucination Leaderboard", elem_id="llm-benchmark-tab-table", id=0):
|
189 |
# ---------- Chart ----------
|
190 |
with gr.Row():
|
191 |
-
gr.
|
192 |
-
|
193 |
-
|
194 |
-
|
195 |
-
|
196 |
-
|
197 |
-
|
198 |
-
|
199 |
-
|
200 |
-
|
201 |
-
|
202 |
-
|
203 |
-
|
204 |
-
|
205 |
-
|
206 |
-
|
207 |
-
|
208 |
-
|
|
|
|
|
|
|
|
|
209 |
|
210 |
# ---------- Leaderboard ----------
|
211 |
leaderboard = init_leaderboard(LEADERBOARD_DF)
|
|
|
188 |
with gr.TabItem("🏅 Hallucination Leaderboard", elem_id="llm-benchmark-tab-table", id=0):
|
189 |
# ---------- Chart ----------
|
190 |
with gr.Row():
|
191 |
+
with gr.Column():
|
192 |
+
gr.Plot(
|
193 |
+
make_leaderboard_plot(
|
194 |
+
LEADERBOARD_DF,
|
195 |
+
"RAG Hallucination Rate (%)",
|
196 |
+
"RAG Hallucination Rate (lower is better)",
|
197 |
+
bar_color="#4CAF50",
|
198 |
+
),
|
199 |
+
show_label=False,
|
200 |
+
)
|
201 |
+
gr.Markdown("*HaluEval-QA benchmark (RAG): The model receives a question plus supporting context. We report the % of answers that introduce facts not found in that context — lower is better. See the **Details** tab for more information.*", elem_classes="plot-caption")
|
202 |
+
with gr.Column():
|
203 |
+
gr.Plot(
|
204 |
+
make_leaderboard_plot(
|
205 |
+
LEADERBOARD_DF,
|
206 |
+
"Non-RAG Hallucination Rate (%)",
|
207 |
+
"Non-RAG Hallucination Rate (lower is better)",
|
208 |
+
bar_color="#FF7043",
|
209 |
+
),
|
210 |
+
show_label=False,
|
211 |
+
)
|
212 |
+
gr.Markdown("*UltraChat benchmark (~11 k prompts, non-RAG): Evaluates open-domain answers when only the question is given. Score is the % of hallucinated responses — lower is better. See the **Details** tab for more information.*", elem_classes="plot-caption")
|
213 |
|
214 |
# ---------- Leaderboard ----------
|
215 |
leaderboard = init_leaderboard(LEADERBOARD_DF)
|