Spaces:

rijdev
/

OCR

Sleeping

App Files Community

rijdev committed on Jun 13

Commit

df43f0a

verified ·

1 Parent(s): 65a8134

Update

Browse files

Files changed (1) hide show

app.py +15 -16

app.py CHANGED Viewed

@@ -4,56 +4,55 @@ from PIL import Image
 import os
 import re
-# Load OCR model
 processor = TrOCRProcessor.from_pretrained("microsoft/trocr-base-stage1")
 model = VisionEncoderDecoderModel.from_pretrained("microsoft/trocr-base-stage1")
-# Folder to store extracted records
 PATIENT_RECORDS_DIR = "records"
 os.makedirs(PATIENT_RECORDS_DIR, exist_ok=True)
 # Extract patient name from filename
 def extract_patient_name(file_name):
-    # Example: JuanDelaCruz_2025-06-13.png → JuanDelaCruz
     match = re.match(r"([A-Za-z]+[A-Za-z]*)_.*\.(jpg|jpeg|png)$", file_name)
     return match.group(1) if match else None
 # OCR logic
-def perform_ocr(image_file):
-    image = Image.open(image_file).convert("RGB")
     pixel_values = processor(images=image, return_tensors="pt").pixel_values
     generated_ids = model.generate(pixel_values)
     text = processor.batch_decode(generated_ids, skip_special_tokens=True)[0].strip()
     return text
-# Save to patient record file
 def save_record(patient_name, ocr_text):
     file_path = os.path.join(PATIENT_RECORDS_DIR, f"{patient_name}_records.txt")
     with open(file_path, "a") as f:
         f.write("\n\n===== New Lab Result =====\n")
         f.write(ocr_text)
-# Gradio function
-def process_lab_result(image):
-    file_name = os.path.basename(image.name)
     patient_name = extract_patient_name(file_name)
     if not patient_name:
-        return "❌ Cannot extract patient name from filename. Please name the file like JuanDelaCruz_2025-06-13.png"
-    ocr_text = perform_ocr(image)
     save_record(patient_name, ocr_text)
-    return f"✅ OCR completed. Lab result saved to `{patient_name}_records.txt`.\n\n---\n📄 Extracted Text:\n{ocr_text}"
 # Gradio interface
 iface = gr.Interface(
     fn=process_lab_result,
-    inputs=gr.File(label="Upload Lab Result Image (.png, .jpg)", type="file"),
     outputs="text",
-    title="🩺 Lab Result OCR with Patient Linking",
-    description="Upload a lab result image named like `JuanDelaCruz_2025-06-13.png`. The system will extract the text and save it to the patient's record."
 )
 if __name__ == "__main__":
-    iface.launch()

 import os
 import re
+# Load Hugging Face OCR model
 processor = TrOCRProcessor.from_pretrained("microsoft/trocr-base-stage1")
 model = VisionEncoderDecoderModel.from_pretrained("microsoft/trocr-base-stage1")
+# Folder to store extracted patient records
 PATIENT_RECORDS_DIR = "records"
 os.makedirs(PATIENT_RECORDS_DIR, exist_ok=True)
 # Extract patient name from filename
 def extract_patient_name(file_name):
     match = re.match(r"([A-Za-z]+[A-Za-z]*)_.*\.(jpg|jpeg|png)$", file_name)
     return match.group(1) if match else None
 # OCR logic
+def perform_ocr(image_path):
+    image = Image.open(image_path).convert("RGB")
     pixel_values = processor(images=image, return_tensors="pt").pixel_values
     generated_ids = model.generate(pixel_values)
     text = processor.batch_decode(generated_ids, skip_special_tokens=True)[0].strip()
     return text
+# Save to patient record
 def save_record(patient_name, ocr_text):
     file_path = os.path.join(PATIENT_RECORDS_DIR, f"{patient_name}_records.txt")
     with open(file_path, "a") as f:
         f.write("\n\n===== New Lab Result =====\n")
         f.write(ocr_text)
+# Main Gradio handler
+def process_lab_result(image_path):
+    file_name = os.path.basename(image_path)
     patient_name = extract_patient_name(file_name)
     if not patient_name:
+        return "❌ Cannot extract patient name from filename. Use format: JuanDelaCruz_2025-06-13.jpg"
+    ocr_text = perform_ocr(image_path)
     save_record(patient_name, ocr_text)
+    return f"✅ OCR completed. Lab result saved for `{patient_name}`.\n\n📄 Extracted Text:\n\n{ocr_text}"
 # Gradio interface
 iface = gr.Interface(
     fn=process_lab_result,
+    inputs=gr.File(label="Upload Lab Result (.jpg/.png)", type="filepath"),
     outputs="text",
+    title="🩺 Lab Result OCR",
+    description="Upload a lab result image named like `JuanDelaCruz_2025-06-13.jpg`. The text will be extracted and saved to the patient's record."
 )
 if __name__ == "__main__":
+    iface.launch()