SearchGPT

Running

Shreyas094 committed on Jul 4, 2024

Commit

25c59df

verified ·

1 Parent(s): 13f7689

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -1,4 +1,4 @@
-import io
 import os
 import json
 import gradio as gr
@@ -16,6 +16,9 @@ from langchain_core.runnables import RunnableParallel, RunnablePassthrough
 huggingface_token = os.environ.get("HUGGINGFACE_TOKEN")
 def load_and_split_document(file):
     """Loads and splits the document into pages."""
     loader = PyPDFLoader(file.name)
@@ -89,14 +92,12 @@ def extract_db_to_excel():
     data = [{"page_content": doc.page_content, "metadata": json.dumps(doc.metadata)} for doc in documents]
     df = pd.DataFrame(data)
-    # Save DataFrame to an in-memory Excel file
-    output = io.BytesIO()
-    with pd.ExcelWriter(output, engine='openpyxl') as writer:
-        df.to_excel(writer, index=False)
-    output.seek(0)
-    # Return the file data in a format Gradio can handle
-    return (output.getvalue(), "database_output.xlsx")
 # Modify the Gradio interface
 with gr.Blocks() as demo:

+import tempfile
 import os
 import json
 import gradio as gr
 huggingface_token = os.environ.get("HUGGINGFACE_TOKEN")
+# At the beginning of your script
+os.environ['TMPDIR'] = '/tmp'
 def load_and_split_document(file):
     """Loads and splits the document into pages."""
     loader = PyPDFLoader(file.name)
     data = [{"page_content": doc.page_content, "metadata": json.dumps(doc.metadata)} for doc in documents]
     df = pd.DataFrame(data)
+    # Create a temporary file
+    with tempfile.NamedTemporaryFile(delete=False, suffix='.xlsx') as tmp:
+        excel_path = tmp.name
+        df.to_excel(excel_path, index=False)
+    return excel_path
 # Modify the Gradio interface
 with gr.Blocks() as demo: