zero123plus / examples /text_to_img.py
eliphatfs
Add demo.
798f776
raw
history blame contribute delete
839 Bytes
from diffusers import StableDiffusionXLPipeline
import torch
import rembg
# text-to-image with SDXL for text-to-image-to-3d
pipeline = StableDiffusionXLPipeline.from_single_file(
"https://huggingface.co/stabilityai/stable-diffusion-xl-base-1.0/blob/main/sd_xl_base_1.0.safetensors",
torch_dtype=torch.float16,
variant="fp16",
use_safetensors=True
).to("cuda")
pipeline.enable_model_cpu_offload()
num_images_per_prompt = 1
res = 1024
text = input("Prompt > ")
bkgd_color = "white"
prompt = f"a ((full-body:2)) shot of a ((single:2)) {text}, isolated on {bkgd_color} background, 4k, highly detailed"
images = pipeline(prompt=prompt, num_images_per_prompt=num_images_per_prompt, height=res, width=res).images
image = images[0]
image.show()
image.save("output.png")
image = rembg.remove(image)
image.save("output-rembg.png")