rymc committed on
Commit
a9d1818
·
verified ·
1 Parent(s): 676fa45

add captions to figures

Browse files
Files changed (1) hide show
  1. app.py +22 -18
app.py CHANGED
@@ -188,24 +188,28 @@ with demo:
188
  with gr.TabItem("🏅 Hallucination Leaderboard", elem_id="llm-benchmark-tab-table", id=0):
189
  # ---------- Chart ----------
190
  with gr.Row():
191
- gr.Plot(
192
- make_leaderboard_plot(
193
- LEADERBOARD_DF,
194
- "RAG Hallucination Rate (%)",
195
- "RAG Hallucination Rate (lower is better)",
196
- bar_color="#4CAF50",
197
- ),
198
- show_label=False,
199
- )
200
- gr.Plot(
201
- make_leaderboard_plot(
202
- LEADERBOARD_DF,
203
- "Non-RAG Hallucination Rate (%)",
204
- "Non-RAG Hallucination Rate (lower is better)",
205
- bar_color="#FF7043",
206
- ),
207
- show_label=False,
208
- )
 
 
 
 
209
 
210
  # ---------- Leaderboard ----------
211
  leaderboard = init_leaderboard(LEADERBOARD_DF)
 
188
  with gr.TabItem("🏅 Hallucination Leaderboard", elem_id="llm-benchmark-tab-table", id=0):
189
  # ---------- Chart ----------
190
  with gr.Row():
191
+ with gr.Column():
192
+ gr.Plot(
193
+ make_leaderboard_plot(
194
+ LEADERBOARD_DF,
195
+ "RAG Hallucination Rate (%)",
196
+ "RAG Hallucination Rate (lower is better)",
197
+ bar_color="#4CAF50",
198
+ ),
199
+ show_label=False,
200
+ )
201
+ gr.Markdown("*HaluEval-QA benchmark (RAG): The model receives a question plus supporting context. We report the % of answers that introduce facts not found in that context — lower is better. See the **Details** tab for more information.*", elem_classes="plot-caption")
202
+ with gr.Column():
203
+ gr.Plot(
204
+ make_leaderboard_plot(
205
+ LEADERBOARD_DF,
206
+ "Non-RAG Hallucination Rate (%)",
207
+ "Non-RAG Hallucination Rate (lower is better)",
208
+ bar_color="#FF7043",
209
+ ),
210
+ show_label=False,
211
+ )
212
+ gr.Markdown("*UltraChat benchmark (~11 k prompts, non-RAG): Evaluates open-domain answers when only the question is given. Score is the % of hallucinated responses — lower is better. See the **Details** tab for more information.*", elem_classes="plot-caption")
213
 
214
  # ---------- Leaderboard ----------
215
  leaderboard = init_leaderboard(LEADERBOARD_DF)