Omar ID EL MOUMEN committed on
Commit
48f6066
·
1 Parent(s): 848b14f

Little fix

Browse files
Files changed (1) hide show
  1. app.py +1 -1
app.py CHANGED
@@ -118,7 +118,7 @@ async def extract_pdf(pdf: PDF):
118
  pdf_req = requests.get(pdf.url)
119
  if pdf_req.status_code == 200:
120
  pdf_data = BytesIO(pdf_req.content)
121
- doc = fitz.open(stream=pdf_data, filetype="pdf")[:pdf.page_num]
122
  pdf_text = " ".join([page.get_text("text") for page in doc])
123
  pdf_metadata = doc.metadata
124
  print(pdf_metadata)
 
118
  pdf_req = requests.get(pdf.url)
119
  if pdf_req.status_code == 200:
120
  pdf_data = BytesIO(pdf_req.content)
121
+ doc = fitz.open(stream=pdf_data, filetype="pdf") if pdf.page_num == -1 else fitz.open(stream=pdf_data, filetype="pdf")[:pdf.page_num]
122
  pdf_text = " ".join([page.get_text("text") for page in doc])
123
  pdf_metadata = doc.metadata
124
  print(pdf_metadata)