samyak152002 committed on
Commit
2859d26
·
verified ·
1 Parent(s): 2ad4c58

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +1 -1
app.py CHANGED
@@ -44,7 +44,7 @@ def extract_pdf_text(file) -> str:
44
 
45
  for page_number in range(len(doc)):
46
  page = doc[page_number]
47
- words = page.get_text("word") # Change to "text" instead of "word"
48
  full_text += words
49
  print(f"Extracted {len(words)} characters from page {page_number+1}")
50
 
 
44
 
45
  for page_number in range(len(doc)):
46
  page = doc[page_number]
47
+ words = page.get_text("markdown") # Change to "text" instead of "word"
48
  full_text += words
49
  print(f"Extracted {len(words)} characters from page {page_number+1}")
50