File size: 958 Bytes
5f74261
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
import copy
from src.utils import clean_text, draw_ocr_bboxes
from src.model import run_example


def ocr_task(image):
    """
    Perform OCR (Optical Character Recognition) on the given image.

    Args:
        image (PIL.Image.Image): The input image to perform OCR on.

    Returns:
        tuple: A tuple containing the output image with OCR bounding boxes drawn and the cleaned OCR text.

    """

    # Task prompts
    ocr_prompt = "<OCR>"
    ocr_with_region_prompt = "<OCR_WITH_REGION>"

    # Get OCR text
    ocr_results = run_example(ocr_prompt, image)
    cleaned_text = clean_text(ocr_results["<OCR>"])

    # Get OCR with region
    ocr_with_region_results = run_example(ocr_with_region_prompt, image)
    output_image = copy.deepcopy(image)
    output_image = draw_ocr_bboxes(
        output_image, ocr_with_region_results["<OCR_WITH_REGION>"]
    )

    # Return the output image and cleaned OCR text
    return output_image, cleaned_text