samyak152002 committed on
Commit
09c8002
·
verified ·
1 Parent(s): 364e0ba

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +2 -3
app.py CHANGED
@@ -39,7 +39,7 @@ def extract_pdf_text(file) -> str:
39
  words = page.get_text("word")
40
  full_text += words
41
 
42
- print(full_text)
43
  doc.close()
44
  print(f"Total extracted text length: {len(full_text)} characters.")
45
  return full_text
@@ -264,7 +264,7 @@ def highlight_issues_in_pdf(file, language_matches: List[Dict[str, Any]]) -> byt
264
  abstract_offset = 0 if abstract_start == -1 else abstract_start
265
 
266
  # Find "References" section and exclude from processing
267
- references_start = concatenated_text.lower().find("references")
268
  references_offset = len(concatenated_text) if references_start == -1 else references_start
269
 
270
  # Iterate over each language issue
@@ -473,4 +473,3 @@ if __name__ == "__main__":
473
  server_port=None
474
  )
475
 
476
-
 
39
  words = page.get_text("word")
40
  full_text += words
41
 
42
+ # print(full_text)
43
  doc.close()
44
  print(f"Total extracted text length: {len(full_text)} characters.")
45
  return full_text
 
264
  abstract_offset = 0 if abstract_start == -1 else abstract_start
265
 
266
  # Find "References" section and exclude from processing
267
+ references_start = concatenated_text.lower().rfind("references")
268
  references_offset = len(concatenated_text) if references_start == -1 else references_start
269
 
270
  # Iterate over each language issue
 
473
  server_port=None
474
  )
475