engrphoenix committed on
Commit
cfa3829
·
verified ·
1 Parent(s): 6b91033

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +4 -4
app.py CHANGED
@@ -4,16 +4,16 @@ from PyPDF2 import PdfReader
4
  import numpy as np
5
  from groq import Groq
6
  import faiss
7
-
8
  # Set up Groq API client
9
  groq_client = Groq(api_key="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")
10
 
11
  # Function to extract text from PDF
12
  def extract_pdf_content(pdf_file):
13
- reader = PdfReader(pdf_file)
14
  content = ""
15
- for page in reader.pages:
16
- content += page.extract_text()
17
  return content
18
 
19
  # Function to split content into chunks
 
4
  import numpy as np
5
  from groq import Groq
6
  import faiss
7
+ import fitz # PyMuPDF
8
  # Set up Groq API client
9
  groq_client = Groq(api_key="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")
10
 
11
  # Function to extract text from PDF
12
  def extract_pdf_content(pdf_file):
13
+ doc = fitz.open(pdf_file)
14
  content = ""
15
+ for page in doc:
16
+ content += page.get_text()
17
  return content
18
 
19
  # Function to split content into chunks