import spaces
import base64
from io import BytesIO

import gradio as gr
import PIL.Image
import torch

from diffusers import StableDiffusionPipeline, AutoencoderKL, AutoencoderTiny
from peft import PeftModel

device = "cuda"
weight_type = torch.float16  # default precision; run() switches to fp32 on CPU

# Load the one-step SDXS pipeline and merge the anime LoRA adapter into its UNet.
pipe = StableDiffusionPipeline.from_pretrained("IDKiro/sdxs-512-dreamshaper")
pipe.unet = PeftModel.from_pretrained(pipe.unet, "IDKiro/sdxs-512-dreamshaper-anime")
pipe.unet = pipe.unet.merge_and_unload()  # fold the LoRA weights into the base UNet
pipe.to(device, dtype=weight_type)

# Two interchangeable latent decoders: a distilled tiny VAE (less GPU memory)
# and the full-size KL VAE (better quality).
vae_tiny = AutoencoderTiny.from_pretrained(
    "IDKiro/sdxs-512-dreamshaper", subfolder="vae"
)
vae_tiny.to(device, dtype=weight_type)

vae_large = AutoencoderKL.from_pretrained(
    "IDKiro/sdxs-512-dreamshaper", subfolder="vae_large"
)
vae_large.to(device, dtype=weight_type)


def pil_image_to_data_url(img, format="PNG"):
    """Encode a PIL image as a base64 data URL (consumed by the download button)."""
    buffered = BytesIO()
    img.save(buffered, format=format)
    img_str = base64.b64encode(buffered.getvalue()).decode()
    return f"data:image/{format.lower()};base64,{img_str}"
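
# Hypothetical usage: the returned string can serve directly as an
# <a download> href in the browser:
#   url = pil_image_to_data_url(PIL.Image.new("RGB", (1, 1)))
#   assert url.startswith("data:image/png;base64,")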


@spaces.GPU
def run(
    prompt: str,
    device_type="GPU",
    vae_type=None,
    param_dtype="torch.float16",
) -> tuple[PIL.Image.Image, str]:
    # Swap in the requested latent decoder.
    if vae_type == "tiny vae":
        pipe.vae = vae_tiny
    elif vae_type == "large vae":
        pipe.vae = vae_large

    if device_type == "CPU":
        device = "cpu"
        param_dtype = "torch.float32"  # fp16 is slow or unsupported on most CPUs
    else:
        device = "cuda"

    pipe.to(
        device,
        torch.float16 if param_dtype == "torch.float16" else torch.float32,
    )

    # SDXS is distilled for guidance-free, single-step sampling.
    result = pipe(
        prompt=prompt,
        guidance_scale=0.0,
        num_inference_steps=1,
        output_type="pil",
    ).images[0]

    result_url = pil_image_to_data_url(result)

    return (result, result_url)
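
# Hypothetical local smoke test (outside the Gradio UI, assuming a CUDA GPU):
#   image, data_url = run("an anime mountain lake at sunset")
#   image.save("out.png")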


examples = [
    "A photo of beautiful mountain with realistic sunset and blue lake, highly detailed, masterpiece",
]

with gr.Blocks(css="style.css") as demo:
    gr.Markdown("# SDXS-512-DreamShaper-Anime")
    gr.Markdown("[SDXS: Real-Time One-Step Latent Diffusion Models with Image Conditions](https://arxiv.org/abs/2403.16627) | [GitHub](https://github.com/IDKiro/sdxs)")
    with gr.Group():
        with gr.Row():
            with gr.Column(min_width=685):
                with gr.Row():
                    prompt = gr.Text(
                        label="Prompt",
                        show_label=False,
                        max_lines=1,
                        placeholder="Enter your prompt",
                        container=False,
                    )
                    run_button = gr.Button("Run", scale=0)

                device_choices = ["GPU", "CPU"]
                device_type = gr.Radio(
                    device_choices,
                    label="Device",
                    value=device_choices[0],
                    interactive=True,
                    info="Thanks to the community for the GPU!",
                )

                vae_choices = ["tiny vae", "large vae"]
                vae_type = gr.Radio(
                    vae_choices,
                    label="Image Decoder Type",
                    value=vae_choices[0],
                    interactive=True,
                    info="To save GPU memory, use tiny vae. For better quality, use large vae.",
                )

                dtype_choices = ["torch.float16", "torch.float32"]
                param_dtype = gr.Radio(
                    dtype_choices,
                    label="Parameter dtype",
                    value=dtype_choices[0],
                    interactive=True,
                    info="To save GPU memory, use torch.float16. For better quality, use torch.float32.",
                )

                download_output = gr.Button(
                    "Download output", elem_id="download_output"
                )

            with gr.Column(min_width=512):
                result = gr.Image(
                    label="Result",
                    height=512,
                    width=512,
                    elem_id="output_image",
                    show_label=False,
                    show_download_button=True,
                )

    gr.Examples(examples=examples, inputs=prompt, outputs=[result, download_output], fn=run)

    inputs = [prompt, device_type, vae_type, param_dtype]
    outputs = [result, download_output]
    prompt.submit(fn=run, inputs=inputs, outputs=outputs)
    run_button.click(fn=run, inputs=inputs, outputs=outputs)

if __name__ == "__main__":
    demo.queue().launch(debug=True)