Spaces:

Sanjayraju30
/

Autoweight

Build error

App Files Files Community

Sanjayraju30 committed on Jun 7

Commit

b902588

verified ·

1 Parent(s): d07963e

Update ocr_engine.py

Browse files

Files changed (1) hide show

ocr_engine.py +20 -23

ocr_engine.py CHANGED Viewed

@@ -1,55 +1,52 @@
-import numpy as np
 import re
 import cv2
 from PIL import Image
-import easyocr
-# ✅ Initialize EasyOCR Reader once
-reader = easyocr.Reader(['en'], gpu=False)
 def preprocess_image(image):
     """
-    Convert to grayscale and apply adaptive thresholding
-    to enhance contrast for digital scale OCR.
     """
     gray = cv2.cvtColor(image, cv2.COLOR_RGB2GRAY)
-    thresh = cv2.adaptiveThreshold(
         gray, 255,
-        cv2.ADAPTIVE_THRESH_MEAN_C,
         cv2.THRESH_BINARY_INV,
-        11, 10
     )
-    return thresh
 def extract_weight_from_image(pil_image):
     try:
-        # ✅ Convert PIL image to OpenCV format
         image = np.array(pil_image.convert("RGB"))
         # ✅ Preprocess image
         processed = preprocess_image(image)
-        # ✅ Optional: Save debug image for troubleshooting
         debug_path = "debug_processed_image.png"
         Image.fromarray(processed).save(debug_path)
-        print(f"[DEBUG] Preprocessed image saved to: {debug_path}")
-        # ✅ Perform OCR using EasyOCR
-        result = reader.readtext(processed)
-        print("🔍 OCR Results:")
-        for detection in result:
-            print(f"  • Text: '{detection[1]}' | Confidence: {detection[2]*100:.2f}%")
-        # ✅ Extract first matching numeric value
-        for detection in result:
-            text = detection[1].replace(",", ".")  # normalize decimal
-            conf = detection[2]
             match = re.search(r"\b\d{1,4}(\.\d{1,2})?\b", text)
             if match:
                 return match.group(), round(conf * 100, 2)
-        # ❌ No weight found
         return "No weight detected", 0.0
     except Exception as e:

 import re
 import cv2
+import numpy as np
 from PIL import Image
+from paddleocr import PaddleOCR
+# ✅ Initialize PaddleOCR once
+ocr = PaddleOCR(use_angle_cls=False, lang='en', show_log=False)
 def preprocess_image(image):
     """
+    Convert to grayscale and enhance contrast to help OCR.
+
+    Args:
+        image: RGB image array. The caller in this file passes
+            np.array(pil_image.convert("RGB")).
+
+    Returns:
+        The output of cv2.adaptiveThreshold applied to the grayscale
+        image, using inverse binary thresholding with a maximum
+        value of 255.
     """
+    # Reduce the RGB channels to a single grayscale channel before thresholding.
     gray = cv2.cvtColor(image, cv2.COLOR_RGB2GRAY)
+    # Threshold each pixel against a Gaussian-weighted local neighbourhood
+    # rather than one global cutoff.
+    processed = cv2.adaptiveThreshold(
         gray, 255,
+        cv2.ADAPTIVE_THRESH_GAUSSIAN_C,
         cv2.THRESH_BINARY_INV,
+        # Positional blockSize=11 and C=2, per the OpenCV signature
+        # adaptiveThreshold(src, maxValue, adaptiveMethod, thresholdType, blockSize, C).
+        11, 2
     )
+    return processed
 def extract_weight_from_image(pil_image):
     try:
+        # ✅ Convert to OpenCV format
         image = np.array(pil_image.convert("RGB"))
         # ✅ Preprocess image
         processed = preprocess_image(image)
+        # Optional: Save debug image
         debug_path = "debug_processed_image.png"
         Image.fromarray(processed).save(debug_path)
+        print(f"[DEBUG] Saved preprocessed image to {debug_path}")
+        # ✅ Run OCR on original (RGB) image (not preprocessed)
+        result = ocr.ocr(image, cls=False)
+        print("🔍 PaddleOCR Results:")
+        for line in result[0]:
+            text = line[1][0]
+            conf = line[1][1]
+            print(f"  • Text: '{text}' | Confidence: {conf*100:.2f}%")
+            # Try to extract number like 53.25 or 100
             match = re.search(r"\b\d{1,4}(\.\d{1,2})?\b", text)
             if match:
                 return match.group(), round(conf * 100, 2)
         return "No weight detected", 0.0
     except Exception as e: