import copy

from src.utils import clean_text, draw_ocr_bboxes
from src.model import run_example


def ocr_task(image):
    """
    Run text-only OCR and region-level OCR on an image.

    The model is invoked twice through ``run_example``: once to obtain the
    recognised text, and once to obtain the region results that are handed
    to ``draw_ocr_bboxes``.

    Args:
        image (PIL.Image.Image): The image to run OCR on. It is deep-copied
            before being passed to ``draw_ocr_bboxes``.

    Returns:
        tuple: ``(annotated_image, text)`` where ``annotated_image`` is the
        value returned by ``draw_ocr_bboxes`` for a deep copy of ``image``,
        and ``text`` is the value returned by ``clean_text``.
    """
    # NOTE(review): both prompts and both result keys below are empty
    # strings, so the two run_example calls receive identical arguments.
    # They look like task tokens that may have been stripped somewhere
    # upstream -- confirm against what run_example expects.
    text_prompt = ""
    region_prompt = ""

    # Pass 1: plain text recognition, normalised by clean_text.
    text_results = run_example(text_prompt, image)
    text = clean_text(text_results[""])

    # Pass 2: recognition with region information for the overlay.
    region_results = run_example(region_prompt, image)

    # Hand the drawing helper a deep copy rather than the caller's image.
    canvas = copy.deepcopy(image)
    annotated_image = draw_ocr_bboxes(canvas, region_results[""])

    return annotated_image, text