Spaces:
Sleeping
Sleeping
File size: 1,306 Bytes
2b3ce8d |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 |
import fitz
from PIL import Image
from src.setting import LOCAL_TEST
import numpy as np
from src import logging
class PDF_Processing:
def __init__(self):
pass
def pdf_to_image(file):
"""
This function will take pdf file and convert first page into image and return it.
LOCAL_TEST : True / False
"""
try:
if LOCAL_TEST:
pdf_file = fitz.open(filename=file,filetype="pdf")
else:
pdf_file = fitz.open(stream=file.read(), filetype="pdf")
page = pdf_file.load_page(0)
pix = page.get_pixmap(matrix=fitz.Matrix(300/72, 300/72)) # 300 DPI
image_bytes = pix.samples
image = Image.frombytes("RGB", [pix.width, pix.height], image_bytes)
image_np = np.array(image)
return image_np
except Exception as e:
logging.info(f"Error {e} : pdf_to_image")
def load_image(file):
"""
This function take image and return numpy array
"""
try:
image = Image.open(file)
image_np = np.array(image)
return image_np
except Exception as e:
logging.info(f"Error {e} : load_image")
|