import numpy as np
import torch
from PIL import Image
from modules.mobilesamv2.utils.transforms import ResizeLongestSide

from modules.dust3r.utils.image import _resize_pil_image


class Images:
    """Load a list of images and precompute the resized, normalized variants
    expected by the SAM2 (video) and SAM1 (MobileSAMv2) pipelines."""

    def __init__(self, filelist, device, size=512):
        self.pil_images = []
        self.pil_images_size = []
        self.np_images = []
        self.np_images_size = []
        # First pass: load every image and check whether they all share one size.
        tmp_images = []
        first_image_size = None
        all_images_same_size = True
        for img_path in filelist:
            pil_image = Image.open(img_path).convert("RGB")
            tmp_images.append(pil_image)

            current_image_size = pil_image.size
            if first_image_size is None:
                first_image_size = current_image_size
            elif current_image_size != first_image_size:
                all_images_same_size = False
        # Second pass: if the sizes differ, rescale each image with
        # _resize_pil_image (longest side -> `size`) and center-crop to
        # dimensions that are multiples of 16; square images get a 4:3 crop.
        for img in tmp_images:
            if not all_images_same_size:
                pil_image = _resize_pil_image(img, size)
                W, H = pil_image.size
                cx, cy = W // 2, H // 2
                halfw, halfh = ((2 * cx) // 16) * 8, ((2 * cy) // 16) * 8
                if W == H:
                    halfh = 3 * halfw // 4
                pil_image = pil_image.crop((cx - halfw, cy - halfh, cx + halfw, cy + halfh))
            else:
                pil_image = img

            np_image = np.array(pil_image)

            # PIL's .size is (width, height), not (height, width).
            width, height = pil_image.size
            np_shape = np_image.shape[:2]  # (height, width)

            self.pil_images.append(pil_image)
            self.np_images.append(np_image)
            self.pil_images_size.append((width, height))
            self.np_images_size.append(np_shape)
        # SAM2 inputs: resize every image to a fixed square resolution and
        # normalize with the ImageNet mean/std.
        img_mean = torch.tensor((0.485, 0.456, 0.406))[:, None, None]
        img_std = torch.tensor((0.229, 0.224, 0.225))[:, None, None]
        self.sam2_images = []

        # SAM2's video predictor expects (height, width).
        self.sam2_video_size = (self.pil_images_size[0][1], self.pil_images_size[0][0])
        self.sam2_input_size = 512
        for pil_image in self.pil_images:
            np_image = np.array(pil_image.resize((self.sam2_input_size, self.sam2_input_size)))
            # Cast to float32 so the batch matches the model's weight dtype.
            np_image = (np_image / 255.0).astype(np.float32)
            sam2_image = torch.from_numpy(np_image).permute(2, 0, 1)
            self.sam2_images.append(sam2_image)
        self.sam2_images = torch.stack(self.sam2_images)
        self.sam2_images -= img_mean
        self.sam2_images /= img_std
        # Tensor.to() is not in-place; the result must be assigned back.
        self.sam2_images = self.sam2_images.to(device)
        # SAM1 (MobileSAMv2) inputs: resize so the longest side is 1024 and
        # convert each image to a (1, 3, H, W) tensor on the target device.
        self.sam1_images = []
        self.sam1_images_size = []
        self.sam1_input_size = 1024
        self.sam1_transform = ResizeLongestSide(self.sam1_input_size)
        for np_image in self.np_images:
            sam1_image = self.sam1_transform.apply_image(np_image)
            sam1_image_torch = torch.as_tensor(sam1_image, device=device)
            transformed_image = sam1_image_torch.permute(2, 0, 1).contiguous()[None, :, :, :]

            self.sam1_images.append(transformed_image)
            self.sam1_images_size.append(tuple(transformed_image.shape[-2:]))
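

# A minimal usage sketch, assuming two frame files exist at the placeholder
# paths below; the paths and print statements are illustrative only.
if __name__ == "__main__":
    device = "cuda" if torch.cuda.is_available() else "cpu"
    images = Images(["frame_000.png", "frame_001.png"], device=device)
    print("SAM2 video size (H, W):", images.sam2_video_size)
    print("SAM2 batch shape:", tuple(images.sam2_images.shape))  # (N, 3, 512, 512)
    print("SAM1 tensor size (H, W):", images.sam1_images_size[0])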