File size: 1,306 Bytes
2b3ce8d
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
import fitz
from PIL import Image
from src.setting import LOCAL_TEST
import numpy as np
from src import logging


class PDF_Processing:
    def __init__(self):
        pass

    def pdf_to_image(file):
        """

        This function will take pdf file and convert first page into image and return it.



        LOCAL_TEST : True / False

        

        """

        try:
            if LOCAL_TEST:
                pdf_file = fitz.open(filename=file,filetype="pdf")
            else:
                pdf_file = fitz.open(stream=file.read(), filetype="pdf")

            page = pdf_file.load_page(0)
            pix = page.get_pixmap(matrix=fitz.Matrix(300/72, 300/72))  # 300 DPI
            image_bytes = pix.samples
            image = Image.frombytes("RGB", [pix.width, pix.height], image_bytes)
            image_np = np.array(image)

            return image_np
        except Exception as e:
            logging.info(f"Error {e} : pdf_to_image")

    def load_image(file):
        """

        This function take image and return numpy array

        """
        try:
            image = Image.open(file)
            image_np = np.array(image)
            return image_np
        except Exception as e:
            logging.info(f"Error {e} : load_image")