import os
import sys

import numpy as np
import torch
from omegaconf import OmegaConf

from .ldm.models.diffusion.ddim import DDIMSampler
from .ldm.util import instantiate_from_config

# Make this package's directory importable so that the module paths
# referenced in config.yaml (resolved by instantiate_from_config) can
# be found at runtime.
CURRENT_DIR = os.path.dirname(os.path.abspath(__file__))
sys.path.append(CURRENT_DIR)


def make_batch(image, mask, device):
    # HWC uint8 RGB image -> NCHW float tensor in [0, 1].
    image = image.astype(np.float32) / 255.0
    image = image[None].transpose(0, 3, 1, 2)
    image = torch.from_numpy(image)

    # HW uint8 mask -> NCHW float tensor, binarized at 0.5.
    mask = mask.astype(np.float32) / 255.0
    mask = mask[None, None]
    mask[mask < 0.5] = 0
    mask[mask >= 0.5] = 1
    mask = torch.from_numpy(mask)

    # Zero out the region to be inpainted.
    masked_image = (1 - mask) * image

    batch = {"image": image, "mask": mask, "masked_image": masked_image}
    for k in batch:
        batch[k] = batch[k].to(device=device)
        # Rescale from [0, 1] to [-1, 1], the range the model expects.
        batch[k] = batch[k] * 2.0 - 1.0
    return batch


class LDMInpainter:
    def __init__(self, ckpt_path, ddim_steps=50):
        config = OmegaConf.load(os.path.join(CURRENT_DIR, "config.yaml"))
        model = instantiate_from_config(config.model)
        # map_location="cpu" lets the checkpoint load on CPU-only machines;
        # the model is moved to the target device on each call.
        state_dict = torch.load(ckpt_path, map_location="cpu")["state_dict"]
        model.load_state_dict(state_dict, strict=False)
        self.model = model
        self.sampler = DDIMSampler(model)
        self.ddim_steps = ddim_steps

    @torch.no_grad()
    def __call__(self, image, mask, device):
        self.model.to(device)

        model = self.model
        sampler = self.sampler

        with self.model.ema_scope():
            batch = make_batch(image, mask, device=device)

            # Conditioning: the encoded masked image with the mask,
            # downsampled to the latent resolution, appended as an
            # extra channel.
            c = model.cond_stage_model.encode(batch["masked_image"])
            cc = torch.nn.functional.interpolate(batch["mask"],
                                                 size=c.shape[-2:])
            c = torch.cat((c, cc), dim=1)

            # Latent shape: the conditioning channels minus the mask channel.
            shape = (c.shape[1] - 1,) + c.shape[2:]
            samples_ddim, _ = sampler.sample(S=self.ddim_steps,
                                             conditioning=c,
                                             batch_size=c.shape[0],
                                             shape=shape,
                                             verbose=False)
            x_samples_ddim = model.decode_first_stage(samples_ddim)

            # Map image, mask, and prediction back from [-1, 1] to [0, 1].
            image = torch.clamp((batch["image"] + 1.0) / 2.0,
                                min=0.0, max=1.0)
            mask = torch.clamp((batch["mask"] + 1.0) / 2.0,
                               min=0.0, max=1.0)
            predicted_image = torch.clamp((x_samples_ddim + 1.0) / 2.0,
                                          min=0.0, max=1.0)

            # Composite: original pixels outside the mask, the model's
            # prediction inside it.
            inpainted = (1 - mask) * image + mask * predicted_image
            inpainted = inpainted.cpu().numpy().transpose(0, 2, 3, 1)[0] * 255

        # Move the model back to CPU to free GPU memory between calls.
        self.model.to(torch.device("cpu"))
        return inpainted.astype(np.uint8)
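
# A minimal usage sketch. The checkpoint and image paths below are
# hypothetical, and PIL (not imported in this module) is assumed for I/O:
#
#     from PIL import Image
#     import numpy as np
#     import torch
#
#     inpainter = LDMInpainter("path/to/ldm_inpainting.ckpt", ddim_steps=50)
#     image = np.array(Image.open("input.png").convert("RGB"))   # HWC uint8
#     mask = np.array(Image.open("mask.png").convert("L"))       # HW uint8
#     device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
#     result = inpainter(image, mask, device)                    # HWC uint8
#     Image.fromarray(result).save("inpainted.png")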