insecta / khandy /draw_utils.py
admin
sync
67a9b5d
import numpy as np
import PIL
from PIL import Image
from PIL import ImageDraw
from PIL import ImageFont
from PIL import ImageColor
def _is_legal_color(color):
if color is None:
return True
if isinstance(color, str):
return True
return isinstance(color, (tuple, list)) and len(color) == 3
def _normalize_color(color, pil_mode, swap_rgb=False):
if color is None:
return color
if isinstance(color, str):
color = ImageColor.getrgb(color)
gray = color[0]
if swap_rgb:
color = (color[2], color[1], color[0])
if pil_mode == 'L':
color = gray
return color
def draw_text(image, text, position, color=(255,0,0), font=None, font_size=15):
"""Draws text on given image.
Args:
image (ndarray).
text (str): text to be drawn.
position (Tuple[int, int]): position where to be drawn.
color (List[Union[str, Tuple[int, int, int]]]): text color.
font (str): A filename or file-like object containing a TrueType font. If the file is not found in this
filename, the loader may also search in other directories, such as the `fonts/` directory on Windows
or `/Library/Fonts/`, `/System/Library/Fonts/` and `~/Library/Fonts/` on macOS.
font_size (int): The requested font size in points.
References:
torchvision.utils.draw_bounding_boxes
"""
if isinstance(image, np.ndarray):
# PIL.Image.fromarray fails with uint16 arrays
# https://github.com/python-pillow/Pillow/issues/1514
if (image.dtype == np.uint16) and (image.ndim != 2):
image = (image / 256).astype(np.uint8)
pil_image = Image.fromarray(image)
elif isinstance(image, PIL.Image.Image):
pil_image = image
else:
raise TypeError('Unsupported image type!')
assert pil_image.mode in ['L', 'RGB', 'RGBA']
assert _is_legal_color(color)
color = _normalize_color(color, pil_image.mode, isinstance(image, np.ndarray))
if font is None:
font_object = ImageFont.load_default()
else:
font_object = ImageFont.truetype(font, size=font_size)
draw = ImageDraw.Draw(pil_image)
draw.text((position[0], position[1]), text,
fill=color, font=font_object)
if isinstance(image, np.ndarray):
return np.asarray(pil_image)
return pil_image
def draw_bounding_boxes(image, boxes, labels=None, colors=None,
fill=False, width=1, font=None, font_size=15):
"""Draws bounding boxes on given image.
Args:
image (ndarray).
boxes (ndarray): ndarray of size (N, 4) containing bounding boxes in (xmin, ymin, xmax, ymax) format.
labels (List[str]): List containing the labels of bounding boxes.
colors (List[Union[str, Tuple[int, int, int]]]): List containing the colors of bounding boxes or labels.
fill (bool): If `True` fills the bounding box with specified color.
width (int): Width of bounding box.
font (str): A filename or file-like object containing a TrueType font. If the file is not found in this
filename, the loader may also search in other directories, such as the `fonts/` directory on Windows
or `/Library/Fonts/`, `/System/Library/Fonts/` and `~/Library/Fonts/` on macOS.
font_size (int): The requested font size in points.
References:
torchvision.utils.draw_bounding_boxes
"""
if isinstance(image, np.ndarray):
# PIL.Image.fromarray fails with uint16 arrays
# https://github.com/python-pillow/Pillow/issues/1514
if (image.dtype == np.uint16) and (image.ndim != 2):
image = (image / 256).astype(np.uint8)
pil_image = Image.fromarray(image)
elif isinstance(image, PIL.Image.Image):
pil_image = image
else:
raise TypeError('Unsupported image type!')
pil_image = pil_image.convert('RGB')
if font is None:
font_object = ImageFont.load_default()
else:
font_object = ImageFont.truetype(font, size=font_size)
if fill:
draw = ImageDraw.Draw(pil_image, "RGBA")
else:
draw = ImageDraw.Draw(pil_image)
for i, bbox in enumerate(boxes):
if colors is None:
color = None
else:
color = colors[i]
assert _is_legal_color(color)
color = _normalize_color(color, pil_image.mode, isinstance(image, np.ndarray))
if fill:
if color is None:
fill_color = (255, 255, 255, 100)
elif isinstance(color, str):
# This will automatically raise Error if rgb cannot be parsed.
fill_color = ImageColor.getrgb(color) + (100,)
elif isinstance(color, tuple):
fill_color = color + (100,)
# the first argument of ImageDraw.rectangle:
# in old version only supports [(x0, y0), (x1, y1)]
# in new version supports either [(x0, y0), (x1, y1)] or [x0, y0, x1, y1]
draw.rectangle([(bbox[0], bbox[1]), (bbox[2], bbox[3])], width=width, outline=color, fill=fill_color)
else:
draw.rectangle([(bbox[0], bbox[1]), (bbox[2], bbox[3])], width=width, outline=color)
if labels is not None:
margin = width + 1
draw.text((bbox[0] + margin, bbox[1] + margin), labels[i], fill=color, font=font_object)
if isinstance(image, np.ndarray):
return np.asarray(pil_image)
return pil_image