Spaces:

Arch10
/

OCR

Sleeping

Arch10 committed on Sep 26, 2024

Commit

42bde06

verified ·

1 Parent(s): c1ccc22

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -1,35 +1,41 @@
-import gradio as gr
 import easyocr
 import re
-from PIL import Image
-# Initialize EasyOCR Reader
 reader = easyocr.Reader(['en', 'hi'])
-# Function to extract text and search for a keyword
-def extract_and_search_text(image, keyword):
-    results = reader.readtext(image)
-    extracted_text = " ".join([text for (_, text, _) in results])
-    if not keyword:
-        return extracted_text, "Enter a keyword to search."
-    # Highlight the matching keyword
-    highlighted_text = re.sub(f"({keyword})", r"<mark>\1</mark>", extracted_text, flags=re.IGNORECASE)
-    if keyword.lower() in extracted_text.lower():
-        return extracted_text, highlighted_text
     else:
-        return extracted_text, "No matches found for the keyword."
-# Gradio interface with keyword input
-iface = gr.Interface(
-    fn=extract_and_search_text,
-    inputs=[gr.Image(type="pil"), gr.Textbox(label="Enter keyword")],
-    outputs=[gr.Textbox(label="Extracted Text"), gr.HTML(label="Search Results")],
-    title="Image Text Extraction and Keyword Search using EasyOCR",
-    description="Upload an image, extract the text, and search for a keyword within the extracted text."
 )
-# Launch the Gradio interface
-iface.launch()

 import easyocr
+import gradio as gr
 import re
+# Initialize EasyOCR reader
 reader = easyocr.Reader(['en', 'hi'])
+# Function for OCR and search functionality
+def process_image(image, keyword):
+    """Run OCR on ``image`` and highlight ``keyword`` in the recognised text.
+
+    Args:
+        image: Image handed unchanged to ``reader.readtext``.
+        keyword: Search term, matched literally and case-insensitively.
+            A falsy value (``""`` or ``None``) disables highlighting.
+
+    Returns:
+        A ``(status_message, html)`` tuple: a found/not-found message and the
+        HTML-escaped OCR text with every match wrapped in a ``<mark>`` tag.
+    """
+    # Local import: ``html`` is stdlib and only needed by this function.
+    from html import escape
+
+    # Perform OCR on the image; the results are joined below as plain strings
+    result = reader.readtext(image, detail=0)
+    extracted_text = " ".join(result)
+    # Highlight the keyword in the extracted text
+    highlight_color = "#87CEEB"  # Soft Sky Blue
+    found = False
+    if keyword:
+        # re.escape makes the keyword a literal pattern. The pieces are built
+        # by hand instead of using a replacement template so that
+        #   * the matched text keeps its original casing,
+        #   * backslashes in the keyword are never read as template escapes,
+        #   * every fragment is HTML-escaped before reaching the HTML output.
+        pattern = re.compile(re.escape(keyword), flags=re.IGNORECASE)
+        pieces = []
+        cursor = 0
+        for match in pattern.finditer(extracted_text):
+            found = True
+            pieces.append(escape(extracted_text[cursor:match.start()]))
+            pieces.append(
+                f"<mark style='background-color: {highlight_color};'>"
+                f"{escape(match.group(0))}</mark>"
+            )
+            cursor = match.end()
+        pieces.append(escape(extracted_text[cursor:]))
+        highlighted_text = "".join(pieces)
+    else:
+        highlighted_text = escape(extracted_text)
+    # Report found/not-found from the same matches that were highlighted,
+    # so the status message and the markup can never disagree
+    if found:
+        return f"Keyword '{keyword}' found in the text.", highlighted_text
     else:
+        return f"Keyword '{keyword}' not found.", highlighted_text
+# Gradio interface: takes an image and a keyword, returns a status text and highlighted HTML
+interface = gr.Interface(
+    fn=process_image,
+    inputs=["image", "text"],
+    outputs=["text", "html"],
+    title="OCR and Document Search with Highlighting",
+    description="Upload an image, extract text, and search for keywords with highlighting."
 )
+# Launch the app only when this file is executed as a script
+if __name__ == "__main__":
+    interface.launch()