#!/usr/bin/env python3
import torch
import os
from huggingface_hub import HfApi
from pathlib import Path
from diffusers.utils import load_image
import cv2
from PIL import Image
import numpy as np
from diffusers import (
    ControlNetModel,
    EulerDiscreteScheduler,
    StableDiffusionControlNetPipeline,
    StableDiffusionXLControlNetPipeline,
    UniPCMultistepScheduler,
)
import sys
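# The ControlNet checkpoint to evaluate is passed as the first command-line argument.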
checkpoint = sys.argv[1]
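# One prompt per conditioning image (image_0.png through image_7.png in the dataset used below).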
prompts = [
"beautiful room",
"a photo-realistic image of two paradise birds",
"a snowy house behind a forest",
"a couple watching a romantic sunset",
"boats in the Amazonas",
"a photo of a beautiful face of a woman",
"a skater in Brooklyn",
"a tornado in Iowa"
]
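# SD 1.5 ControlNet v1.1 checkpoints carry "control_v11p" in their name; anything else is treated as SDXL.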
sd_xl = "control_v11p" not in checkpoint
if sd_xl:
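    # SDXL checkpoint: pair it with the SDXL base model and generate at 1024x1024.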
base_ckpt = "stabilityai/stable-diffusion-xl-base-0.9"
controlnet = ControlNetModel.from_pretrained(checkpoint, torch_dtype=torch.float16)
pipe = StableDiffusionXLControlNetPipeline.from_pretrained(
base_ckpt, controlnet=controlnet, torch_dtype=torch.float16
)
size = 1024
else:
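    # SD 1.5 checkpoint: pair it with the v1-5 base model and generate at 512x512.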
base_ckpt = "runwayml/stable-diffusion-v1-5"
controlnet = ControlNetModel.from_pretrained(checkpoint, torch_dtype=torch.float16)
pipe = StableDiffusionControlNetPipeline.from_pretrained(
base_ckpt, controlnet=controlnet, torch_dtype=torch.float16
)
size = 512
# import ipdb; ipdb.set_trace()  # debugging breakpoint, left disabled so the script can run unattended
# pipe.enable_model_cpu_offload()
pipe.to("cuda")
for i in range(8):
    for seed in range(4):
        image = load_image(
            f"https://huggingface.co/datasets/patrickvonplaten/webdatasets_images/resolve/main/image_{i}.png"
        )
        image = image.resize((size, size))
        prompt = prompts[i]

        # Build the Canny edge map used as the ControlNet conditioning image.
        image = np.array(image)
        low_threshold = 100
        high_threshold = 200
        image = cv2.Canny(image, low_threshold, high_threshold)
        image = image[:, :, None]
        image = np.concatenate([image, image, image], axis=2)
        canny_image = Image.fromarray(image)

        generator = torch.manual_seed(seed)
        out_image = pipe(
            prompt,
            generator=generator,
            num_inference_steps=20,
            image=canny_image,
            controlnet_conditioning_scale=1.0,
        ).images[0]

        # Save locally, then upload to the results dataset repo.
        path = os.path.join(Path.home(), "images", "control_sdxl", f"{i}_{seed}.png")
        path_in_repo = "/".join(path.split("/")[-2:])
        os.makedirs(os.path.dirname(path), exist_ok=True)  # make sure the output directory exists
        out_image.save(path)

        api = HfApi()
        api.upload_file(
            path_or_fileobj=path,
            path_in_repo=path_in_repo,
            repo_id="patrickvonplaten/images",
            repo_type="dataset",
        )
        print(f"https://huggingface.co/datasets/patrickvonplaten/images/blob/main/control_sdxl/{i}_{seed}.png")