logger1

Running

App Files Community

Sanjayraju30 committed on 9 days ago

Commit

52e7bf6

verified ·

1 Parent(s): 5d38db5

Update ocr_engine.py

Browse files

Files changed (1) hide show

ocr_engine.py +14 -14

ocr_engine.py CHANGED Viewed

@@ -2,31 +2,31 @@ from transformers import TrOCRProcessor, VisionEncoderDecoderModel
 from PIL import Image, ImageEnhance
 import re
-# Load processor + model
 processor = TrOCRProcessor.from_pretrained("microsoft/trocr-base-handwritten")
 model = VisionEncoderDecoderModel.from_pretrained("microsoft/trocr-base-handwritten")
 def extract_weight(image: Image.Image) -> str:
-    # Crop only display region (adjust based on your image format)
-    width, height = image.size
-    display_area = image.crop((width * 0.35, height * 0.1, width * 0.65, height * 0.25))  # crop display center
-    # Enhance contrast & sharpness
-    display_area = display_area.convert("L")  # grayscale
-    display_area = ImageEnhance.Contrast(display_area).enhance(2.0)
-    display_area = ImageEnhance.Sharpness(display_area).enhance(2.5)
-    display_area = display_area.convert("RGB")
-    # OCR
-    pixel_values = processor(images=display_area, return_tensors="pt").pixel_values
     generated_ids = model.generate(pixel_values, max_length=32)
     full_text = processor.batch_decode(generated_ids, skip_special_tokens=True)[0]
-    # Clean & parse
     cleaned = full_text.lower().replace(" ", "")
     match = re.search(r"(\d+(\.\d+)?)", cleaned)
     weight = match.group(1) if match else None
     if any(u in cleaned for u in ["kg", "kgs", "kilogram", "kilo"]):
         unit = "kg"
     elif any(u in cleaned for u in ["g", "gram", "grams"]):
@@ -34,4 +34,4 @@ def extract_weight(image: Image.Image) -> str:
     else:
         unit = "kg" if weight and float(weight) >= 20 else "grams"
-    return f"{weight} {unit}" if weight else ""

 from PIL import Image, ImageEnhance
 import re
+# Load OCR model
 processor = TrOCRProcessor.from_pretrained("microsoft/trocr-base-handwritten")
 model = VisionEncoderDecoderModel.from_pretrained("microsoft/trocr-base-handwritten")
 def extract_weight(image: Image.Image) -> str:
+    # Step 1: Enhance image
+    image = image.convert("L")  # grayscale
+    image = ImageEnhance.Contrast(image).enhance(2.0)
+    image = ImageEnhance.Sharpness(image).enhance(2.5)
+    image = image.convert("RGB")
+    # Step 2: Run OCR
+    pixel_values = processor(images=image, return_tensors="pt").pixel_values
     generated_ids = model.generate(pixel_values, max_length=32)
     full_text = processor.batch_decode(generated_ids, skip_special_tokens=True)[0]
+    # Debug
+    print("OCR Output:", full_text)
+    # Step 3: Extract number
     cleaned = full_text.lower().replace(" ", "")
     match = re.search(r"(\d+(\.\d+)?)", cleaned)
     weight = match.group(1) if match else None
+    # Step 4: Detect unit based on actual OCR text
     if any(u in cleaned for u in ["kg", "kgs", "kilogram", "kilo"]):
         unit = "kg"
     elif any(u in cleaned for u in ["g", "gram", "grams"]):
     else:
         unit = "kg" if weight and float(weight) >= 20 else "grams"
+    return f"{weight} {unit}" if weight else "No valid weight detected"