Spaces:

hostin
/

txt2img

Runtime error

App Files Files Community

txt2img / app.py

hostin

Create app.py

2e2639d verified 4 months ago

raw

history blame

4.8 kB

	# @title 📸 Image Generation (multimodel + Gradio Web Interface)

	# Install Dependencies
	!pip install transformers torch diffusers accelerate invisible_watermark safetensors huggingface-hub gradio --quiet

	from diffusers import DiffusionPipeline, StableDiffusionPipeline
	import torch
	from gradio.components import Gallery
	from PIL import Image
	from IPython.display import display
	import os
	from datetime import datetime
	import gradio as gr

	# Function to generate and display images
	def generate_and_display_images(model_selection, scenery, style, height, width, num_images=2, n_steps=50, high_noise_frac=0.5, guidance_scale=2.6, negative_prompt="", seed=None):
	if seed is None or seed == '':
	seed = torch.randint(low=0, high=2**32, size=(1,)).item()
	else:
	try:
	seed = int(seed)
	except ValueError:
	return "Invalid seed value. Seed must be an integer."
	torch.manual_seed(seed)

	prompt = f"Scenery: {scenery}; Style: {style}"

	generated_images = []
	if model_selection == "dreamlike-art/dreamlike-photoreal-2.0":
	model = StableDiffusionPipeline.from_pretrained(model_selection, torch_dtype=torch.float16).to("cuda")
	for _ in range(num_images):
	image = model(prompt=prompt, num_inference_steps=n_steps, guidance_scale=guidance_scale, negative_prompt=negative_prompt, height=height, width=width).images[0]
	generated_images.append(image)
	else:
	base = DiffusionPipeline.from_pretrained(model_selection, torch_dtype=torch.float16, use_auth_token=True).to("cuda")
	for _ in range(num_images):
	if "refiner" in model_selection:
	image_latent = base(prompt=prompt, num_inference_steps=n_steps, denoising_end=high_noise_frac, output_type="latent").images
	image = image_latent[0] # Placeholder for actual refiner step
	else:
	image = base(prompt=prompt, num_inference_steps=n_steps, guidance_scale=guidance_scale, negative_prompt=negative_prompt, height=height, width=width).images[0]
	generated_images.append(image)

	# Save images and return file paths for Gradio display
	file_paths = []
	for i, image in enumerate(generated_images):
	timestamp = datetime.now().strftime("%Y-%m-%d_%H-%M-%S")
	filename = f"{seed}_{timestamp}_{i}.jpg"
	image.save(filename)
	file_paths.append(filename)

	return file_paths



	# Define Gradio interface
	iface = gr.Interface(
	fn=generate_and_display_images,
	inputs=[
	gr.components.Dropdown(choices=["stabilityai/sdxl-turbo", "stabilityai/stable-diffusion-xl-base-1.0", "runwayml/stable-diffusion-v1-5", "dreamlike-art/dreamlike-photoreal-2.0", "Kardbord/stable-diffusion-v1-5-unsafe"], label="Model Selection"),
	gr.components.Textbox(label="Scenery", placeholder="Describe the scenery you want in the image"),
	gr.components.Textbox(label="Style", placeholder="Describe the style of the image (e.g., photorealistic, liminal, dark)"),
	gr.components.Slider(minimum=1, maximum=2048, step=1, value=1024, label="Height"),
	gr.components.Slider(minimum=1, maximum=2048, step=1, value=576, label="Width"),
	gr.components.Number(value=10, label="Number of Images"),
	gr.components.Slider(minimum=0, maximum=60, step=1, value=30, label="Number of Inference Steps"),
	gr.components.Slider(minimum=0.0, maximum=1.0, step=0.01, value=0.16, label="High Noise Fraction"),
	gr.components.Slider(minimum=0.0, maximum=10.0, step=0.1, value=8, label="Guidance Scale"),
	gr.components.Textbox(value="", label="Negative Prompt"),
	gr.components.Textbox(value=None, label="Seed (Optional)")
	],
	outputs=Gallery(label="Generated Images"),
	examples=[["dreamlike-art/dreamlike-photoreal-2.0", "scenery : melting flesh", "style : (((photorealistic))), liminal, cryptic, cinematic, highly detailed, sharp focus, dark, creepy, weirdcore", 1024, 576, 10, 30, 0.16, 8, "2D \|\| naked \|\| Low Quality \|\| text logos \|\| watermarks \|\| signatures \|\| out of frame \|\| jpeg artifacts \|\| ugly \|\| poorly drawn \|\| extra limbs \|\| extra hands \|\| extra feet \|\| backwards limbs \|\| extra fingers \|\| extra toes \|\| unrealistic, incorrect, bad anatomy \|\| cut off body pieces \|\| strange body positions \|\| impossible body positioning \|\| Mismatched eyes \|\| cross eyed \|\| crooked face \|\| crooked lips \|\| unclear \|\| undefined \|\| mutations \|\| deformities \|\| off center \|\| poor_composition \|\| duplicate faces, blurry, blurred, unclear, deformed anatomy, deformed face, crazy eyes, bad hands, deformed body", None]],
	title="Image Generation Tool",
	description="Generate images using various diffusion models."
	)

	# Launch the interface
	iface.launch(share=True, debug=True)