Spaces:

samyak152002
/

texmetrics-regex-checks-gradio-1

Running

samyak152002 committed on Dec 7, 2024

Commit

4bb46a1

verified ·

1 Parent(s): c85e0b2

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -263,10 +263,18 @@ def highlight_issues_in_pdf(file, language_matches: List[Dict[str, Any]]) -> byt
         concatenated_text = " ".join([w[1] for w in word_list])
         # print(f"Concatenated text length: {concatenated_text} characters.")
         # Iterate over each language issue
         for idx, issue in enumerate(language_matches, start=1):
             offset = issue["offset"]  # offset+line_no-1
             length = issue["length"]
             error_text = concatenated_text[offset:offset+length+1]
@@ -327,6 +335,9 @@ def highlight_issues_in_pdf(file, language_matches: List[Dict[str, Any]]) -> byt
         print(f"Error in highlighting PDF: {e}")
         return b""
 # ------------------------------
 # Main Analysis Function
 # ------------------------------

         concatenated_text = " ".join([w[1] for w in word_list])
         # print(f"Concatenated text length: {concatenated_text} characters.")
+        # Find "References" section and exclude from processing
+        references_start = concatenated_text.lower().find("references")
+        references_offset = len(concatenated_text) if references_start == -1 else references_start
         # Iterate over each language issue
         for idx, issue in enumerate(language_matches, start=1):
             offset = issue["offset"]  # offset+line_no-1
             length = issue["length"]
+            # Skip issues in the references section
+            if offset >= references_offset:
+                continue
             error_text = concatenated_text[offset:offset+length+1]
         print(f"Error in highlighting PDF: {e}")
         return b""
 # ------------------------------
 # Main Analysis Function
 # ------------------------------