Update app.py
Browse files
app.py
CHANGED
@@ -39,7 +39,7 @@ def extract_pdf_text(file) -> str:
|
|
39 |
words = page.get_text("word")
|
40 |
full_text += words
|
41 |
|
42 |
-
print(full_text)
|
43 |
doc.close()
|
44 |
print(f"Total extracted text length: {len(full_text)} characters.")
|
45 |
return full_text
|
@@ -264,7 +264,7 @@ def highlight_issues_in_pdf(file, language_matches: List[Dict[str, Any]]) -> byt
|
|
264 |
abstract_offset = 0 if abstract_start == -1 else abstract_start
|
265 |
|
266 |
# Find "References" section and exclude from processing
|
267 |
-
references_start = concatenated_text.lower().find("references")
|
268 |
references_offset = len(concatenated_text) if references_start == -1 else references_start
|
269 |
|
270 |
# Iterate over each language issue
|
@@ -473,4 +473,3 @@ if __name__ == "__main__":
|
|
473 |
server_port=None
|
474 |
)
|
475 |
|
476 |
-
|
|
|
39 |
words = page.get_text("word")
|
40 |
full_text += words
|
41 |
|
42 |
+
# print(full_text)
|
43 |
doc.close()
|
44 |
print(f"Total extracted text length: {len(full_text)} characters.")
|
45 |
return full_text
|
|
|
264 |
abstract_offset = 0 if abstract_start == -1 else abstract_start
|
265 |
|
266 |
# Find "References" section and exclude from processing
|
267 |
+
references_start = concatenated_text.lower().rfind("references")
|
268 |
references_offset = len(concatenated_text) if references_start == -1 else references_start
|
269 |
|
270 |
# Iterate over each language issue
|
|
|
473 |
server_port=None
|
474 |
)
|
475 |
|
|