Spaces:

Penality
/

pdf-something

Sleeping

Penality committed on Feb 25

Commit

5a8229c

verified ·

1 Parent(s): 01ba052

Update app.py

Removed the store_document call in extract_text_from_pdf, and a debug print(PDF_FILE) in store_document_data

Files changed (1) hide show

app.py CHANGED Viewed

@@ -34,7 +34,6 @@ def store_document_data(PDF_FILE, METADATA_FILE, INDEX_FILE):
     if PDF_FILE:
         # Extract text from the PDF
-        print(PDF_FILE)
         text = extract_text_from_pdf(PDF_FILE)
         if not text:
             return "Could not extract any text from the PDF."
@@ -106,7 +105,6 @@ def extract_text_from_pdf(pdf_file):
     try:
         with pdfplumber.open(pdf_file) as pdf:
             text = " ".join(clean_text(text) for page in pdf.pages if (text := page.extract_text()))
-        store_document(text)
         return text
     except Exception as e:
         print(f"Error extracting text: {e}{pdf_file}")

     if PDF_FILE:
         # Extract text from the PDF
         text = extract_text_from_pdf(PDF_FILE)
         if not text:
             return "Could not extract any text from the PDF."
     try:
         with pdfplumber.open(pdf_file) as pdf:
             text = " ".join(clean_text(text) for page in pdf.pages if (text := page.extract_text()))
         return text
     except Exception as e:
         print(f"Error extracting text: {e}{pdf_file}")