csv-generation-img

Sleeping

App Files Community

Nechba committed on Apr 11

Commit

4f8a713

verified ·

1 Parent(s): 26f42da

Update app.py

Browse files

Files changed (1) hide show

app.py +3 -22

app.py CHANGED Viewed

@@ -12,7 +12,8 @@ from utils import (
     extract_csv_from_response,
     pdf_to_images,
     analyze_single_document,
-process_local_pdf
 )
 import base64
 from datetime import datetime
@@ -62,27 +63,7 @@ st.markdown("""
 st.title("📄 PDF Document Analyzer")
 st.markdown("Upload multiple PDFs to analyze each document directly using Gemini's native PDF processing")
-# Load prompt
-PROMPT  ="""Please analyze the provided images of the real estate document set and perform the following actions:
-1.  *Identify Parties:* Determine and list Seller 1, Seller 2 (if applicable), Buyer 1, and Buyer 2.
-2.  *Identify Missing Items:* Locate and list all instances of missing signatures and missing initials for all parties across all documents.
-3.  *Identify Checked Boxes:* Locate and list all checkboxes that have been marked or checked.
-4.  *Generate Secondary Questions:* For checkboxes that indicate significant waivers (e.g., home warranty, inspection rights, lead paint assessment), specific conditions (e.g., cash sale, contingency status), potential conflicts, or reference other documents, formulate a relevant 'Secondary Question' designed to prompt confirmation or clarification from the user/parties involved.
-5.  *Check for Required Paperwork:* Based only on the checkboxes identified in step 3 that explicitly state or strongly imply a specific addendum or disclosure document should be attached (e.g., "Lead Based Paint Disclosure Addendum attached", "See Counter Offer Addendum", "Seller's Disclosure...Addendum attached", "Retainer Addendum attached", etc.), check if a document matching that description appears to be present within the provided image set. Note whether this implied paperwork is 'Found', 'Missing', or 'Potentially Missing/Ambiguous' within the provided images.
-6.  *Identify Conflicts:* Specifically look for and note any directly contradictory information or conflicting checked boxes (like the conflicting inspection clauses found previously).
-7.  *Provide Location:* For every identified item (missing signature/initial, checked box, required paperwork status, party identification, conflict), specify the approximate line number(s) or clear location on the page (e.g., Bottom Right Initials, Seller Signature Block).
-8.  *Format Output:* Present all findings comprehensively in CSV format. The CSV columns should be:
-    *   Category (e.g., Parties, Missing Item, Checked Box, Required Paperwork, Conflict)
-    *   Location (Document Name/Page, e.g., Sale Contract Pg 2)
-    *   Line Item(s) (Approximate line number or location description)
-    *   Item Type (e.g., Seller Initials, Home Warranty Waiver, Lead Paint Addendum Check, Lead Paint Addendum Document)
-    *   Status (e.g., Identified, Missing, Checked, Found, Potentially Missing, Conflict Detected)
-    *   Details (Specifics like names, text of the checkbox, description of the issue or document status)
-    *   Secondary Question (if applicable) (The question generated in step 4)
-Please apply this analysis to the entire set of documents provided.
-"""
 # Sidebar Configuration
 with st.sidebar:
@@ -134,7 +115,7 @@ if uploaded_files and api_key:
                             # Analyze PDF directly
                              # Convert PDF to images
-                            df = process_local_pdf(uploaded_file.getvalue())
                             # Display results in expandable section
                             with st.expander("View Analysis Results", expanded=True):

     extract_csv_from_response,
     pdf_to_images,
     analyze_single_document,
+process_local_pdf,
+analyze_pdf_images_with_gemini
 )
 import base64
 from datetime import datetime
 st.title("📄 PDF Document Analyzer")
 st.markdown("Upload multiple PDFs to analyze each document directly using Gemini's native PDF processing")
 # Sidebar Configuration
 with st.sidebar:
                             # Analyze PDF directly
                              # Convert PDF to images
+                            df = analyze_pdf_images_with_gemini(uploaded_file.getvalue())
                             # Display results in expandable section
                             with st.expander("View Analysis Results", expanded=True):