Update app.py
Browse files
app.py
CHANGED
@@ -44,7 +44,7 @@ def extract_pdf_text(file) -> str:
|
|
44 |
|
45 |
for page_number in range(len(doc)):
|
46 |
page = doc[page_number]
|
47 |
-
words = page.get_text("
|
48 |
full_text += words
|
49 |
print(f"Extracted {len(words)} characters from page {page_number+1}")
|
50 |
|
|
|
44 |
|
45 |
for page_number in range(len(doc)):
|
46 |
page = doc[page_number]
|
47 |
+
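words = page.get_text("markdown") # NOTE(review): replaces the previous "word" mode; the original note said "text" but "markdown" is what is passed — confirm the intended mode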
|
48 |
full_text += words
|
49 |
print(f"Extracted {len(words)} characters from page {page_number+1}")
|
50 |
|