Spaces:
Sleeping
Sleeping
Update app.py
Browse files
app.py
CHANGED
@@ -1800,8 +1800,10 @@ with gr.Blocks(theme='shivi/calm_seafoam', css_paths='style.css', js=js_func) as
|
|
1800 |
df = calculate_average_metrics(df, selected_metrics)
|
1801 |
|
1802 |
if flag_TQA:
|
1803 |
-
df["target_answer"] = df["target_answer"]
|
1804 |
-
|
|
|
|
|
1805 |
worst_cases_df = df.groupby(['model', 'tbl_name', 'test_category', 'question', 'target_answer', 'predicted_answer', 'answer', 'sql_tag'])['avg_metric'].mean().reset_index()
|
1806 |
else:
|
1807 |
worst_cases_df = df.groupby(['model', 'tbl_name', 'test_category', 'question', 'query', 'predicted_sql', 'answer', 'sql_tag'])['avg_metric'].mean().reset_index()
|
|
|
1800 |
df = calculate_average_metrics(df, selected_metrics)
|
1801 |
|
1802 |
if flag_TQA:
|
1803 |
+
df["target_answer"] = df["target_answer"].apply(
|
1804 |
+
lambda x: "[" + ", ".join(map(str, x)) + "]" if isinstance(x, (list, tuple))
|
1805 |
+
else ("[]" if pd.isna(x) else str(x))
|
1806 |
+
)
|
1807 |
worst_cases_df = df.groupby(['model', 'tbl_name', 'test_category', 'question', 'target_answer', 'predicted_answer', 'answer', 'sql_tag'])['avg_metric'].mean().reset_index()
|
1808 |
else:
|
1809 |
worst_cases_df = df.groupby(['model', 'tbl_name', 'test_category', 'question', 'query', 'predicted_sql', 'answer', 'sql_tag'])['avg_metric'].mean().reset_index()
|