Spaces:

Siyunb323
/

Two-phase_Fine-tuned_LLMs-CreativityAutoEvaluation

Sleeping

App Files Files Community

Siyunb323 committed on Dec 14, 2024

Commit

1d021ff

1 Parent(s): 2af82d9

change

Browse files

Files changed (1) hide show

app.py +83 -12

app.py CHANGED Viewed

@@ -1,5 +1,16 @@
 import gradio as gr
 import pandas as pd
 with open("./description.md", "r", encoding="utf-8") as file:
     description_text = file.read()
@@ -8,18 +19,78 @@ with open("./input_demo.txt", "r", encoding="utf-8") as file:
     demo = file.read()
 # Define the processing function
-def process_data(task_name, model_name, pooling_method, input_text, file=None):
-    if file:
-        df = pd.read_csv(file.name)
-        output = f"Processed {len(df)} rows from uploaded file using task: {task_name}, model: {model_name}, pooling: {pooling_method}."
-        dataframe_output = df  # Return the data frame for display
-        file_output = df  # The output file box shows the same data
-    else:
-        lines = input_text.split("\n")
-        output = f"Processed {len(lines)} rows of text using task: {task_name}, model: {model_name}, pooling: {pooling_method}."
-        dataframe_output = pd.DataFrame({"Error": ["No file uploaded. DataFrame preview unavailable."]})  # Error message
-        file_output = pd.DataFrame()
     return output, dataframe_output, file_output
 ## Input components

+import os
 import gradio as gr
 import pandas as pd
+import tempfile
def save_dataframe_to_file(dataframe, file_format="csv"):
    """Write *dataframe* to a fresh temporary file and return its path.

    Args:
        dataframe: The pandas DataFrame to export (written without its index).
        file_format: Output format, either "csv" (default) or "xlsx".

    Returns:
        Path of the written file, named ``output.<file_format>`` inside a
        newly created temporary directory.

    Raises:
        ValueError: If *file_format* is neither "csv" nor "xlsx".
    """
    if file_format not in ("csv", "xlsx"):
        # Fail loudly instead of returning a path to a file that was never written.
        raise ValueError(f"Unsupported file format: {file_format!r}")

    # A private directory per call keeps concurrent requests from overwriting
    # each other's export while preserving the "output.<ext>" file name.
    temp_dir = tempfile.mkdtemp()
    file_path = os.path.join(temp_dir, f"output.{file_format}")
    if file_format == "csv":
        dataframe.to_csv(file_path, index=False)
    else:
        dataframe.to_excel(file_path, index=False)
    return file_path
 with open("./description.md", "r", encoding="utf-8") as file:
     description_text = file.read()
     demo = file.read()
 # Define the processing function
+import pandas as pd
def process_data(task_name, model_name, pooling_method, input_text=None, file=None):
    """Turn an uploaded file or pasted text into a prompt/response table.

    An uploaded file takes priority over pasted text. Text counts as provided
    only when it contains non-whitespace characters, so an empty text box next
    to an uploaded file is treated as a file-only request.

    Args:
        task_name: Task label, echoed in the status message.
        model_name: Model label, echoed in the status message.
        pooling_method: Pooling label, echoed in the status message.
        input_text: Optional text with one ``prompt,response`` pair per line;
            each line is split on its first comma and lines without a comma
            are ignored. A leading ``prompt,response`` header line is dropped.
        file: Optional uploaded ``.csv``/``.xlsx`` file. Its ``name``
            attribute is used to detect the format.

    Returns:
        A tuple ``(output, dataframe_output, file_output)``: the status
        message, the parsed table with columns ``prompt`` and ``response``,
        and the path of the exported CSV. When nothing could be processed the
        last two items are empty DataFrames.
    """
    no_input_msg = (
        "No valid input detected. Please check your input and ensure it "
        "follows the expected format."
    )
    columns = ["prompt", "response"]
    dataframe_output = pd.DataFrame()
    file_output = pd.DataFrame()

    has_text = input_text is not None and input_text.strip() != ""

    if file is None and not has_text:
        return no_input_msg, dataframe_output, file_output

    if file is not None:
        # Only announce the conflict when the user really supplied both inputs.
        prefix = (
            "Detected both text and file input. Prioritizing file input. "
            if has_text
            else ""
        )
        file_name = str(getattr(file, "name", file)).lower()
        if not file_name.endswith((".csv", ".xlsx")):
            return prefix + "File format must be xlsx or csv.", dataframe_output, file_output

        df = pd.read_csv(file) if file_name.endswith(".csv") else pd.read_excel(file)
        if list(df.columns) != columns:
            if df.shape[1] != 2:
                return (
                    prefix + "File must contain exactly two columns: prompt and response.",
                    dataframe_output,
                    file_output,
                )
            # No header row: pandas consumed the first data row as column
            # names, so put it back as the first record.
            df = pd.DataFrame([list(df.columns)] + df.values.tolist(), columns=columns)

        dataframe_output = df
        file_output = save_dataframe_to_file(dataframe_output, file_format="csv")
        output = prefix + (
            f"Processed {len(dataframe_output)} rows from uploaded file using "
            f"task: {task_name}, model: {model_name}, pooling: {pooling_method}."
        )
        return output, dataframe_output, file_output

    # Text-only input: keep the lines that split into exactly two fields.
    rows = []
    for line in input_text.strip().split("\n"):
        parts = line.split(",", maxsplit=1)
        if len(parts) == 2:
            rows.append(parts)

    if not rows:
        # No line contained a comma, so there is nothing to tabulate.
        return no_input_msg, dataframe_output, file_output

    if rows[0] == columns:
        rows = rows[1:]
    dataframe_output = pd.DataFrame(rows, columns=columns)
    file_output = save_dataframe_to_file(dataframe_output, file_format="csv")
    output = (
        f"Processed {len(dataframe_output)} rows of text using "
        f"task: {task_name}, model: {model_name}, pooling: {pooling_method}."
    )
    return output, dataframe_output, file_output
 ## Input components