import os
import sys

import numpy as np
import torch
from omegaconf import OmegaConf

from .ldm.models.diffusion.ddim import DDIMSampler
from .ldm.util import instantiate_from_config

CURRENT_DIR = os.path.dirname(os.path.abspath(__file__))
sys.path.append(CURRENT_DIR)


def make_batch(image, mask, device):
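    """Convert an HxWx3 uint8 image and an HxW uint8 mask into the dict of
    [-1, 1] tensors ("image", "mask", "masked_image") expected by the
    inpainting model, binarizing the mask at 0.5."""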
    image = image.astype(np.float32) / 255.0
    image = image[None].transpose(0, 3, 1, 2)
    image = torch.from_numpy(image)

    mask = mask.astype(np.float32) / 255.0
    mask = mask[None, None]
    mask[mask < 0.5] = 0
    mask[mask >= 0.5] = 1
    mask = torch.from_numpy(mask)

    masked_image = (1 - mask) * image

    batch = {"image": image, "mask": mask, "masked_image": masked_image}
    for k in batch:
        batch[k] = batch[k].to(device=device)
        batch[k] = batch[k] * 2.0 - 1.0
    return batch


class LDMInpainter:
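    """Thin wrapper around the latent-diffusion inpainting model: loads the
    config and checkpoint once, then fills masked image regions via DDIM
    sampling on each call."""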
    def __init__(self, ckpt_path, ddim_steps=50):
        config = OmegaConf.load(os.path.join(CURRENT_DIR, "config.yaml"))
        model = instantiate_from_config(config.model)
        # load weights onto the CPU first; the model is moved to the target device per call
        state_dict = torch.load(ckpt_path, map_location="cpu")["state_dict"]
        model.load_state_dict(state_dict, strict=False)
        self.model = model
        self.sampler = DDIMSampler(model)
        self.ddim_steps = ddim_steps

    # inference only: disable gradient tracking to save memory
    @torch.no_grad()
    def __call__(self, image, mask, device):
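        """Inpaint the masked region of `image`.

        `image` is an HxWx3 uint8 array, `mask` an HxW uint8 array where
        values >= 128 mark pixels to fill. Returns an HxWx3 uint8 array in
        which only the masked pixels are replaced by the model's prediction."""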
        self.model.to(device)
        model = self.model
        sampler = self.sampler

        with self.model.ema_scope():
            batch = make_batch(image, mask, device=device)

            # encode masked image and concat downsampled mask
            c = model.cond_stage_model.encode(batch["masked_image"])
            cc = torch.nn.functional.interpolate(batch["mask"], size=c.shape[-2:])
            c = torch.cat((c, cc), dim=1)

            # latent shape: drop the mask channel appended above
            shape = (c.shape[1] - 1,) + c.shape[2:]
            samples_ddim, _ = sampler.sample(
                S=self.ddim_steps,
                conditioning=c,
                batch_size=c.shape[0],
                shape=shape,
                verbose=False,
            )
            x_samples_ddim = model.decode_first_stage(samples_ddim)

            # map everything back from [-1, 1] to [0, 1]
            image = torch.clamp((batch["image"] + 1.0) / 2.0, min=0.0, max=1.0)
            mask = torch.clamp((batch["mask"] + 1.0) / 2.0, min=0.0, max=1.0)
            predicted_image = torch.clamp((x_samples_ddim + 1.0) / 2.0, min=0.0, max=1.0)

            # keep original pixels outside the mask, model prediction inside it
            inpainted = (1 - mask) * image + mask * predicted_image
            inpainted = inpainted.cpu().numpy().transpose(0, 2, 3, 1)[0] * 255

        # offload to cpu to save memory
        self.model.to(torch.device("cpu"))
        return inpainted.astype(np.uint8)
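

# Minimal usage sketch. The checkpoint and image paths below are placeholders,
# and Pillow is assumed only for image I/O; the class itself expects plain
# numpy arrays (HxWx3 uint8 image, HxW uint8 mask, 255 = region to fill).
# Because this module uses relative imports, run it as a module of its package
# (python -m <package>.<module>) rather than as a standalone script.
if __name__ == "__main__":
    from PIL import Image

    inpainter = LDMInpainter(ckpt_path="last.ckpt", ddim_steps=50)

    image = np.array(Image.open("input.png").convert("RGB"))
    mask = np.array(Image.open("mask.png").convert("L"))

    device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
    result = inpainter(image, mask, device)
    Image.fromarray(result).save("inpainted.png")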