# (Removed scraped Hugging Face Spaces page chrome — "Spaces: Running on Zero" —
#  which is website residue, not part of this source file.)
import gradio as gr
import spaces
from PIL import Image
import numpy as np
import torch
import torch.nn.functional as F

from utils.pipeline_utils import load_pipeline
from utils import get_args
from main import run
# Load the shared diffusion pipeline once at module import time.
pipeline = load_pipeline(cache_dir=None, fp16=False)
def process_masks(masks, device='cuda'):
    """Union a list of mask image files into one binary 64x64 mask tensor.

    Args:
        masks: list of file paths to mask images (the painted layers from
            gr.ImageMask); each is binarized (any non-zero pixel counts).
        device: torch device for the tensors. Defaults to 'cuda' to keep
            the original hard-coded behavior, but can now be overridden
            (e.g. 'cpu') so the helper also works on GPU-less hosts.

    Returns:
        A (64, 64) float32 tensor with values in {0.0, 1.0}, or None when
        the union of all masks is empty (nothing was painted).
    """
    composite = torch.zeros((512, 512), dtype=torch.float32, device=device)
    for mask_path in masks:
        img = Image.open(mask_path).convert("L").resize((512, 512))
        arr = torch.tensor(np.array(img), dtype=torch.float32, device=device)
        # Binarize: any non-zero pixel is "masked". (Replaces the original
        # set-to-255-then-divide dance; also drops an unused list that
        # accumulated the per-file masks without ever being read.)
        composite += (arr > 0).float()
    composite = torch.clamp(composite, 0, 1)
    # Downsample 512x512 -> 64x64 with nearest neighbour so the mask stays
    # binary at the lower (latent) resolution.
    composite = F.interpolate(composite[None, None, :, :], size=(64, 64), mode="nearest")[0, 0]
    if composite.sum() == 0:
        # NOTE(review): None appears to signal "no mask" to the caller.
        return None
    return composite
def main_pipeline(
    input_image: str,
    src_prompt: str,
    tgt_prompt: str,
    alpha: float,
    beta: float,
    w1: float,
    seed: int,
    dift_correction: bool = True,
):
    """Gradio callback: run one edit and return the resulting image.

    `input_image` is the dict produced by gr.ImageMask: 'background' is the
    uploaded image path and 'layers' holds the painted mask files.
    """
    # Start from the project's default args and apply the UI overrides.
    args = get_args()
    overrides = {
        "alpha": alpha,
        "beta": beta,
        "w1": w1,
        "seed": seed,
        "structural_alignment": True,
        "support_new_object": True,
        "apply_dift_correction": dift_correction,
    }
    for key, value in overrides.items():
        setattr(args, key, value)

    # Release any VRAM held over from a previous request before running.
    torch.cuda.empty_cache()

    results = run(
        input_image['background'],
        src_prompt,
        tgt_prompt,
        masks=process_masks(input_image['layers']),
        pipeline=pipeline,
        args=args,
    )
    # Element [2] of run()'s output is what the original returned to the UI.
    return results[2]
DESCRIPTION = """# Cora 🖼️🐱🦅
## Fast & Controllable Image Editing

### 🛠️ Quick start
1. **Upload** or drag-and-drop the image you'd like to edit.
2. **Source prompt** — describe what's in the original image.
3. **Target prompt** — describe the result you want.
4. Adjust the parameters as needed.
5. *(Optional)* Paint a mask to specify the area to edit.
6. Click **Edit** and wait a few seconds for the output.

### ⚙️ Parameter cheat-sheet

| Parameter | What it does | `0` (minimum) | `1` (maximum) |
|-----------|--------------|---------------|---------------|
| **alpha** | Appearance transfer control | preserve source appearance | target prompt affects appearance |
| **beta** | Structural change control | preserve original structure | full layout change |
| **w** | Prompt strength | subtle tweaks | strong changes |
| **Seed** | Fixes randomness for reproducibility | – | – |
| **Apply correspondence correction** | Uses correspondence-aware latent fix | – | – |

### 💡 Tips
- To replicate **TurboEdit**, set **alpha = 1**, **beta = 1**, and turn **off** *Apply correspondence correction*.
- To test reconstruction quality of the inversion, use identical source & target prompts with **alpha = 1**, **beta = 1**, and **w = 1**.

#### 🙏 Acknowledgements
The demo template is largely adapted from **[TurboEdit on Hugging Face Spaces](https://huggingface.co/spaces/turboedit/turbo_edit)**.
"""
with gr.Blocks(css="app/style.css") as demo:
    # "Duplicate this Space" banner.
    gr.HTML(
        """<a href="https://huggingface.co/spaces/armikaeili/cora?duplicate=true">
<img src="https://bit.ly/3gLdBN6" alt="Duplicate Space"></a>Duplicate the Space to run privately without waiting in queue"""
    )
    gr.Markdown(DESCRIPTION)

    with gr.Row():
        with gr.Column():
            # Upload widget with a paintable mask layer (painted strokes
            # arrive as input_image['layers'] in the callback).
            input_image = gr.ImageMask(
                label="Input image",
                type="filepath",
                height=512,
                width=512,
                brush=gr.Brush(color_mode='defaults'),
            )
            result = gr.Image(label="Result", type="pil", height=512, width=512)
        with gr.Column():
            src_prompt = gr.Text(label="Source Prompt", max_lines=1, placeholder="Source Prompt")
            tgt_prompt = gr.Text(label="Target Prompt", max_lines=1, placeholder="Target Prompt")
            with gr.Accordion("Advanced Options", open=False):
                seed = gr.Slider(label="seed", minimum=0, maximum=16 * 1024, value=200, step=1)
                w1 = gr.Slider(label="w", minimum=1.0, maximum=3.0, value=1.9, step=0.05)
                alpha = gr.Slider(label="alpha", minimum=0, maximum=1, value=0, step=0.01)
                beta = gr.Slider(label="beta", minimum=0, maximum=1, value=0.04, step=0.01)
                with gr.Row():
                    dift_correction = gr.Checkbox(
                        label="Apply correspondence correction",
                        value=True,
                    )
            run_button = gr.Button("Edit")

    # Rows mirror main_pipeline's signature:
    # image, src_prompt, tgt_prompt, alpha, beta, w1, seed, dift_correction
    examples = [
        ["assets/white_cat.png", "a cat", "a cat wearing a suit", 0.1, 0.1, 1.9, 7, True],
        ["assets/bear.png", "a sitting brown bear", "a roaring blue bear", 0.7, 0.1, 1.9, 7, True],
        ["assets/cat.jpg", "a cat", "an eagle", 0.7, 0.3, 1.9, 7, True],
        ["assets/dog.png", "a photo of a dog", "a photo of a dog lying", 0.0, 1, 1.9, 7, True],
    ]

    inputs = [input_image, src_prompt, tgt_prompt, alpha, beta, w1, seed, dift_correction]
    outputs = [result]

    gr.Examples(
        examples=examples,
        inputs=inputs,
        outputs=outputs,
        fn=main_pipeline,
        cache_examples=False,  # examples run the full pipeline; don't precompute
    )

    run_button.click(fn=main_pipeline, inputs=inputs, outputs=outputs)

demo.queue(max_size=50).launch(share=False)