farimafatahi commited on
Commit
347446d
·
verified ·
1 Parent(s): 2c11405

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +0 -21
app.py CHANGED
@@ -138,13 +138,6 @@ with tab1:
138
  <th>Rank</th>
139
  <th>Model</th>
140
  <th>Factuality Score</th>
141
- <th>Factual Recall</th>
142
- <th>Conceptual Understanding</th>
143
- <th>Procedural Execution</th>
144
- <th>Comparative Analysis</th>
145
- <th>Recommendations and Insights</th>
146
- <th>Domain-Specific Knowledge</th>
147
- <th>Temporal Context</th>
148
  <th>Hallucination Score</th>
149
  <th># Tokens</th>
150
  <th># Factual</th>
@@ -162,13 +155,6 @@ with tab1:
162
  <th>Rank</th>
163
  <th>Model</th>
164
  <th>Factuality Score</th>
165
- <th>Factual Recall</th>
166
- <th>Conceptual Understanding</th>
167
- <th>Procedural Execution</th>
168
- <th>Comparative Analysis</th>
169
- <th>Recommendations and Insights</th>
170
- <th>Domain-Specific Knowledge</th>
171
- <th>Temporal Context</th>
172
  <th>Hallucination Score</th>
173
  <th># Tokens</th>
174
  <th># Factual</th>
@@ -195,13 +181,6 @@ with tab1:
195
  <td>{row['rank']}</td>
196
  <td>{row['model']}</td>
197
  <td>{row['factuality_score']}</td>
198
- <td>{row['prompt_categories.Factual Recall']}</td>
199
- <td>{row['prompt_categories.Conceptual Understanding']}</td>
200
- <td>{row['prompt_categories.Procedural Execution']}</td>
201
- <td>{row['prompt_categories.Comparative Analysis']}</td>
202
- <td>{row['prompt_categories.Recommendations and Insights']}</td>
203
- <td>{row['prompt_categories.Domain-Specific Knowledge']}</td>
204
- <td>{row['prompt_categories.Temporal Context']}</td>
205
  <td>{row['hallucination_score']}</td>
206
  <td>{row['avg_tokens']}</td>
207
  <td>{row['avg_factual_units']}</td>
 
138
  <th>Rank</th>
139
  <th>Model</th>
140
  <th>Factuality Score</th>
 
 
 
 
 
 
 
141
  <th>Hallucination Score</th>
142
  <th># Tokens</th>
143
  <th># Factual</th>
 
155
  <th>Rank</th>
156
  <th>Model</th>
157
  <th>Factuality Score</th>
 
 
 
 
 
 
 
158
  <th>Hallucination Score</th>
159
  <th># Tokens</th>
160
  <th># Factual</th>
 
181
  <td>{row['rank']}</td>
182
  <td>{row['model']}</td>
183
  <td>{row['factuality_score']}</td>
 
 
 
 
 
 
 
184
  <td>{row['hallucination_score']}</td>
185
  <td>{row['avg_tokens']}</td>
186
  <td>{row['avg_factual_units']}</td>