ApoorvBrooklyn
/

stable-diffusion-implementation

stable-diffusion

diffusion-models

computer-vision

neural-networks

Model card Files Files and versions

stable-diffusion-implementation / demo.py

ApoorvBrooklyn's picture

Upload folder using huggingface_hub

8d87bff verified 3 months ago

1.91 kB

	import model_loader
	import pipeline
	from PIL import Image
	from pathlib import Path
	from transformers import CLIPTokenizer
	import torch

	# Opt-in switches for hardware acceleration. While both are False the
	# script stays on the CPU even when an accelerator is present.
	ALLOW_CUDA = False
	ALLOW_MPS = False

	# Start from the CPU and upgrade only when a backend is both allowed and
	# usable. The opt-in flag is tested first so a disabled backend is never
	# probed. torch.backends.mps.is_available() replaces the deprecated
	# torch.has_mps, which only reports build support and could therefore
	# select "mps" on a machine that cannot actually run it.
	DEVICE = "cpu"
	if ALLOW_CUDA and torch.cuda.is_available():
	    DEVICE = "cuda"
	elif ALLOW_MPS and torch.backends.mps.is_available():
	    DEVICE = "mps"
	print(f"Using device: {DEVICE}")

	# Checkpoint file handed to the model loader below.
	model_file = "../data/v1-5-pruned-emaonly.ckpt"

	# Tokenizer built from the local vocabulary and merges files.
	tokenizer = CLIPTokenizer(
	    "../data/vocab.json",
	    merges_file="../data/merges.txt",
	)

	# Load the models from the checkpoint for the selected device.
	models = model_loader.preload_models_from_standard_weights(model_file, DEVICE)

	## TEXT TO IMAGE

	# Text prompt handed to the pipeline. Alternative example:
	# prompt = "A dog with sunglasses, wearing comfy hat, looking at camera, highly detailed, ultra sharp, cinematic, 100mm lens, 8k resolution."
	prompt = "A boy playing football with his teammates."
	# Negative prompt; left empty here.
	uncond_prompt = ""
	# CFG switch and its scale (min: 1, max: 14).
	do_cfg, cfg_scale = True, 8

	## IMAGE TO IMAGE

	# Image-to-image is off while input_image stays None. To enable it,
	# uncomment the Image.open line so the picture at image_path is loaded.
	image_path = "../images/dog.jpg"
	input_image = None
	# input_image = Image.open(image_path)
	# Higher strength adds more noise to the input image, so the result ends up
	# further from it; lower strength adds less noise, so the result stays
	# closer to it.
	strength = 0.9

	## SAMPLER

	# Sampler name, number of inference steps and random seed for the run.
	seed = 42
	num_inference_steps = 50
	sampler = "ddpm"

	# Collect every argument for the pipeline in one mapping, then run a
	# single generation with it. Keys mirror pipeline.generate's keyword names.
	generation_args = {
	    "prompt": prompt,
	    "uncond_prompt": uncond_prompt,
	    "input_image": input_image,
	    "strength": strength,
	    "do_cfg": do_cfg,
	    "cfg_scale": cfg_scale,
	    "sampler_name": sampler,
	    "n_inference_steps": num_inference_steps,
	    "seed": seed,
	    "models": models,
	    "device": DEVICE,
	    "idle_device": "cpu",
	    "tokenizer": tokenizer,
	}
	output_image = pipeline.generate(**generation_args)

	# Convert the array returned by the pipeline into a PIL image and write it
	# to disk. The array is converted once only; the input image is not
	# combined with the output here.
	result_img = Image.fromarray(output_image)
	result_img.save("output.png")
	print("Saved output.png")