ootes
/

wwtbtest

Model card Files Files and versions Community

wwtbtest / stable_diffusion /scripts /inpaint.py

ootes's picture

Duplicate from ootes/wwtb

9437b5b over 1 year ago

history blame contribute delete

3.64 kB

	import argparse, os, sys, glob
	from omegaconf import OmegaConf
	from PIL import Image
	from tqdm import tqdm
	import numpy as np
	import torch
	from main import instantiate_from_config
	from ldm.models.diffusion.ddim import DDIMSampler


	def make_batch(image, mask, device):
	image = np.array(Image.open(image).convert("RGB"))
	image = image.astype(np.float32)/255.0
	image = image[None].transpose(0,3,1,2)
	image = torch.from_numpy(image)

	mask = np.array(Image.open(mask).convert("L"))
	mask = mask.astype(np.float32)/255.0
	mask = mask[None,None]
	mask[mask < 0.5] = 0
	mask[mask >= 0.5] = 1
	mask = torch.from_numpy(mask)

	masked_image = (1-mask)*image

	batch = {"image": image, "mask": mask, "masked_image": masked_image}
	for k in batch:
	batch[k] = batch[k].to(device=device)
	batch[k] = batch[k]*2.0-1.0
	return batch


	if __name__ == "__main__":
	parser = argparse.ArgumentParser()
	parser.add_argument(
	"--indir",
	type=str,
	nargs="?",
	help="dir containing image-mask pairs (`example.png` and `example_mask.png`)",
	)
	parser.add_argument(
	"--outdir",
	type=str,
	nargs="?",
	help="dir to write results to",
	)
	parser.add_argument(
	"--steps",
	type=int,
	default=50,
	help="number of ddim sampling steps",
	)
	opt = parser.parse_args()

	masks = sorted(glob.glob(os.path.join(opt.indir, "*_mask.png")))
	images = [x.replace("_mask.png", ".png") for x in masks]
	print(f"Found {len(masks)} inputs.")

	config = OmegaConf.load("models/ldm/inpainting_big/config.yaml")
	model = instantiate_from_config(config.model)
	model.load_state_dict(torch.load("models/ldm/inpainting_big/last.ckpt")["state_dict"],
	strict=False)

	device = torch.device("cuda") if torch.cuda.is_available() else torch.device("cpu")
	model = model.to(device)
	sampler = DDIMSampler(model)

	os.makedirs(opt.outdir, exist_ok=True)
	with torch.no_grad():
	with model.ema_scope():
	for image, mask in tqdm(zip(images, masks)):
	outpath = os.path.join(opt.outdir, os.path.split(image)[1])
	batch = make_batch(image, mask, device=device)

	# encode masked image and concat downsampled mask
	c = model.cond_stage_model.encode(batch["masked_image"])
	cc = torch.nn.functional.interpolate(batch["mask"],
	size=c.shape[-2:])
	c = torch.cat((c, cc), dim=1)

	shape = (c.shape[1]-1,)+c.shape[2:]
	samples_ddim, _ = sampler.sample(S=opt.steps,
	conditioning=c,
	batch_size=c.shape[0],
	shape=shape,
	verbose=False)
	x_samples_ddim = model.decode_first_stage(samples_ddim)

	image = torch.clamp((batch["image"]+1.0)/2.0,
	min=0.0, max=1.0)
	mask = torch.clamp((batch["mask"]+1.0)/2.0,
	min=0.0, max=1.0)
	predicted_image = torch.clamp((x_samples_ddim+1.0)/2.0,
	min=0.0, max=1.0)

	inpainted = (1-mask)image+maskpredicted_image
	inpainted = inpainted.cpu().numpy().transpose(0,2,3,1)[0]*255
	Image.fromarray(inpainted.astype(np.uint8)).save(outpath)