ColossalAI/examples/images/diffusion/scripts/inpaint.py

import argparse
import glob
import os

import numpy as np
import torch
from ldm.models.diffusion.ddim import DDIMSampler
from main import instantiate_from_config
from omegaconf import OmegaConf
from PIL import Image
from tqdm import tqdm


def make_batch(image, mask, device):
    image = np.array(Image.open(image).convert("RGB"))
    image = image.astype(np.float32) / 255.0
    image = image[None].transpose(0, 3, 1, 2)
    image = torch.from_numpy(image)

    mask = np.array(Image.open(mask).convert("L"))
    mask = mask.astype(np.float32) / 255.0
    mask = mask[None, None]
    mask[mask < 0.5] = 0
    mask[mask >= 0.5] = 1
    mask = torch.from_numpy(mask)

    masked_image = (1 - mask) * image

    batch = {"image": image, "mask": mask, "masked_image": masked_image}
    for k in batch:
        batch[k] = batch[k].to(device=device)
        batch[k] = batch[k] * 2.0 - 1.0
    return batch


if __name__ == "__main__":
    parser = argparse.ArgumentParser()
    parser.add_argument(
        "--indir",
        type=str,
        nargs="?",
        help="dir containing image-mask pairs (`example.png` and `example_mask.png`)",
    )
    parser.add_argument(
        "--outdir",
        type=str,
        nargs="?",
        help="dir to write results to",
    )
    parser.add_argument(
        "--steps",
        type=int,
        default=50,
        help="number of ddim sampling steps",
    )
    opt = parser.parse_args()

    masks = sorted(glob.glob(os.path.join(opt.indir, "*_mask.png")))
    images = [x.replace("_mask.png", ".png") for x in masks]
    print(f"Found {len(masks)} inputs.")

    config = OmegaConf.load("models/ldm/inpainting_big/config.yaml")
    model = instantiate_from_config(config.model)
    model.load_state_dict(torch.load("models/ldm/inpainting_big/last.ckpt")["state_dict"], strict=False)

    device = torch.device("cuda") if torch.cuda.is_available() else torch.device("cpu")
    model = model.to(device)
    sampler = DDIMSampler(model)

    os.makedirs(opt.outdir, exist_ok=True)
    with torch.no_grad():
        with model.ema_scope():
            for image, mask in tqdm(zip(images, masks)):
                outpath = os.path.join(opt.outdir, os.path.split(image)[1])
                batch = make_batch(image, mask, device=device)

                # encode masked image and concat downsampled mask
                c = model.cond_stage_model.encode(batch["masked_image"])
                cc = torch.nn.functional.interpolate(batch["mask"], size=c.shape[-2:])
                c = torch.cat((c, cc), dim=1)

                shape = (c.shape[1] - 1,) + c.shape[2:]
                samples_ddim, _ = sampler.sample(
                    S=opt.steps, conditioning=c, batch_size=c.shape[0], shape=shape, verbose=False
                )
                x_samples_ddim = model.decode_first_stage(samples_ddim)

                image = torch.clamp((batch["image"] + 1.0) / 2.0, min=0.0, max=1.0)
                mask = torch.clamp((batch["mask"] + 1.0) / 2.0, min=0.0, max=1.0)
                predicted_image = torch.clamp((x_samples_ddim + 1.0) / 2.0, min=0.0, max=1.0)

                inpainted = (1 - mask) * image + mask * predicted_image
                inpainted = inpainted.cpu().numpy().transpose(0, 2, 3, 1)[0] * 255
                Image.fromarray(inpainted.astype(np.uint8)).save(outpath)
[misc] update pre-commit and run all files (#4752) * [misc] update pre-commit * [misc] run pre-commit * [misc] remove useless configuration files * [misc] ignore cuda for clang-format 2023-09-19 06:20:26 +00:00			`import argparse`
			`import glob`
			`import os`

[example] add stable diffuser (#1825) 2022-11-08 08:14:45 +00:00			`import numpy as np`
			`import torch`
			`from ldm.models.diffusion.ddim import DDIMSampler`
[misc] update pre-commit and run all files (#4752) * [misc] update pre-commit * [misc] run pre-commit * [misc] remove useless configuration files * [misc] ignore cuda for clang-format 2023-09-19 06:20:26 +00:00			`from main import instantiate_from_config`
			`from omegaconf import OmegaConf`
			`from PIL import Image`
			`from tqdm import tqdm`
[example] add stable diffuser (#1825) 2022-11-08 08:14:45 +00:00

			`def make_batch(image, mask, device):`
			`image = np.array(Image.open(image).convert("RGB"))`
[misc] update pre-commit and run all files (#4752) * [misc] update pre-commit * [misc] run pre-commit * [misc] remove useless configuration files * [misc] ignore cuda for clang-format 2023-09-19 06:20:26 +00:00			`image = image.astype(np.float32) / 255.0`
			`image = image[None].transpose(0, 3, 1, 2)`
[example] add stable diffuser (#1825) 2022-11-08 08:14:45 +00:00			`image = torch.from_numpy(image)`

			`mask = np.array(Image.open(mask).convert("L"))`
[misc] update pre-commit and run all files (#4752) * [misc] update pre-commit * [misc] run pre-commit * [misc] remove useless configuration files * [misc] ignore cuda for clang-format 2023-09-19 06:20:26 +00:00			`mask = mask.astype(np.float32) / 255.0`
			`mask = mask[None, None]`
[example] add stable diffuser (#1825) 2022-11-08 08:14:45 +00:00			`mask[mask < 0.5] = 0`
			`mask[mask >= 0.5] = 1`
			`mask = torch.from_numpy(mask)`

[misc] update pre-commit and run all files (#4752) * [misc] update pre-commit * [misc] run pre-commit * [misc] remove useless configuration files * [misc] ignore cuda for clang-format 2023-09-19 06:20:26 +00:00			`masked_image = (1 - mask) * image`
[example] add stable diffuser (#1825) 2022-11-08 08:14:45 +00:00
			`batch = {"image": image, "mask": mask, "masked_image": masked_image}`
			`for k in batch:`
			`batch[k] = batch[k].to(device=device)`
[misc] update pre-commit and run all files (#4752) * [misc] update pre-commit * [misc] run pre-commit * [misc] remove useless configuration files * [misc] ignore cuda for clang-format 2023-09-19 06:20:26 +00:00			`batch[k] = batch[k] * 2.0 - 1.0`
[example] add stable diffuser (#1825) 2022-11-08 08:14:45 +00:00			`return batch`


			`if __name__ == "__main__":`
			`parser = argparse.ArgumentParser()`
			`parser.add_argument(`
			`"--indir",`
			`type=str,`
			`nargs="?",`
			help="dir containing image-mask pairs (`example.png` and `example_mask.png`)",
			`)`
			`parser.add_argument(`
			`"--outdir",`
			`type=str,`
			`nargs="?",`
			`help="dir to write results to",`
			`)`
			`parser.add_argument(`
			`"--steps",`
			`type=int,`
			`default=50,`
			`help="number of ddim sampling steps",`
			`)`
			`opt = parser.parse_args()`

			`masks = sorted(glob.glob(os.path.join(opt.indir, "*_mask.png")))`
			`images = [x.replace("_mask.png", ".png") for x in masks]`
			`print(f"Found {len(masks)} inputs.")`

			`config = OmegaConf.load("models/ldm/inpainting_big/config.yaml")`
Revert "[dreambooth] fixing the incompatibity in requirements.txt (#3190) (#3378)" (#3481) 2023-04-06 12:22:52 +00:00			`model = instantiate_from_config(config.model)`
[misc] update pre-commit and run all files (#4752) * [misc] update pre-commit * [misc] run pre-commit * [misc] remove useless configuration files * [misc] ignore cuda for clang-format 2023-09-19 06:20:26 +00:00			`model.load_state_dict(torch.load("models/ldm/inpainting_big/last.ckpt")["state_dict"], strict=False)`
[example] add stable diffuser (#1825) 2022-11-08 08:14:45 +00:00
			`device = torch.device("cuda") if torch.cuda.is_available() else torch.device("cpu")`
			`model = model.to(device)`
			`sampler = DDIMSampler(model)`

			`os.makedirs(opt.outdir, exist_ok=True)`
			`with torch.no_grad():`
			`with model.ema_scope():`
			`for image, mask in tqdm(zip(images, masks)):`
			`outpath = os.path.join(opt.outdir, os.path.split(image)[1])`
			`batch = make_batch(image, mask, device=device)`

			`# encode masked image and concat downsampled mask`
			`c = model.cond_stage_model.encode(batch["masked_image"])`
[misc] update pre-commit and run all files (#4752) * [misc] update pre-commit * [misc] run pre-commit * [misc] remove useless configuration files * [misc] ignore cuda for clang-format 2023-09-19 06:20:26 +00:00			`cc = torch.nn.functional.interpolate(batch["mask"], size=c.shape[-2:])`
[example] add stable diffuser (#1825) 2022-11-08 08:14:45 +00:00			`c = torch.cat((c, cc), dim=1)`

[misc] update pre-commit and run all files (#4752) * [misc] update pre-commit * [misc] run pre-commit * [misc] remove useless configuration files * [misc] ignore cuda for clang-format 2023-09-19 06:20:26 +00:00			`shape = (c.shape[1] - 1,) + c.shape[2:]`
			`samples_ddim, _ = sampler.sample(`
			`S=opt.steps, conditioning=c, batch_size=c.shape[0], shape=shape, verbose=False`
			`)`
[example] add stable diffuser (#1825) 2022-11-08 08:14:45 +00:00			`x_samples_ddim = model.decode_first_stage(samples_ddim)`

[misc] update pre-commit and run all files (#4752) * [misc] update pre-commit * [misc] run pre-commit * [misc] remove useless configuration files * [misc] ignore cuda for clang-format 2023-09-19 06:20:26 +00:00			`image = torch.clamp((batch["image"] + 1.0) / 2.0, min=0.0, max=1.0)`
			`mask = torch.clamp((batch["mask"] + 1.0) / 2.0, min=0.0, max=1.0)`
			`predicted_image = torch.clamp((x_samples_ddim + 1.0) / 2.0, min=0.0, max=1.0)`
[example] add stable diffuser (#1825) 2022-11-08 08:14:45 +00:00
[misc] update pre-commit and run all files (#4752) * [misc] update pre-commit * [misc] run pre-commit * [misc] remove useless configuration files * [misc] ignore cuda for clang-format 2023-09-19 06:20:26 +00:00			`inpainted = (1 - mask) * image + mask * predicted_image`
			`inpainted = inpainted.cpu().numpy().transpose(0, 2, 3, 1)[0] * 255`
[example] add stable diffuser (#1825) 2022-11-08 08:14:45 +00:00			`Image.fromarray(inpainted.astype(np.uint8)).save(outpath)`