Spaces:

mdasad3617
/

lab-report-analyzer

Running

mdasad3617 committed on Dec 1, 2024

Commit

4d72778

verified ·

1 Parent(s): 08d36af

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -2,7 +2,7 @@ import streamlit as st
 from transformers import pipeline
 import pdfplumber
 from PIL import Image
-import pytesseract
 from langdetect import detect
 # Initialize Models
@@ -27,11 +27,12 @@ def extract_text_from_pdf(pdf_file):
             text += page.extract_text()
     return text.strip()
-# Extract text from Image
 def extract_text_from_image(image_file):
     image = Image.open(image_file)
-    text = pytesseract.image_to_string(image)
-    return text.strip()
 # Check if content is a lab report
 def is_lab_report(text, model):

 from transformers import pipeline
 import pdfplumber
 from PIL import Image
+import easyocr
 from langdetect import detect
 # Initialize Models
             text += page.extract_text()
     return text.strip()
+# Extract text from Image using EasyOCR
 def extract_text_from_image(image_file):
+    reader = easyocr.Reader(['en'])  # Add more languages if needed
     image = Image.open(image_file)
+    result = reader.readtext(image, detail=0)  # `detail=0` returns only the text
+    return " ".join(result).strip()
 # Check if content is a lab report
 def is_lab_report(text, model):