# -*- coding: utf-8 -*-
# Copyright (c) Alibaba, Inc. and its affiliates.
import threading
import time

import gradio as gr
import numpy as np
import spaces
import torch
from PIL import Image
import glob
import os, csv, sys
import shlex
import subprocess

# Clear any stale ZeroGPU offload data, then install runtime dependencies so
# the scepter imports below resolve; numpy is pinned for compatibility.
subprocess.run("rm -rf /data-nvme/zerogpu-offload/*", env={}, shell=True)
subprocess.run(shlex.split('pip install scepter'))
subprocess.run(shlex.split('pip install numpy==1.26'))
from scepter.modules.transform.io import pillow_convert
from scepter.modules.utils.config import Config
from scepter.modules.utils.distribute import we
from scepter.modules.utils.file_system import FS

from examples.examples import fft_examples
from inference.registry import INFERENCES
from inference.utils import edit_preprocess
# Register file-system backends so hf://, ms://, http(s):// and local paths
# can all be resolved through the same FS interface.
fs_list = [
    Config(cfg_dict={"NAME": "HuggingfaceFs", "TEMP_DIR": "./cache"}, load=False),
    Config(cfg_dict={"NAME": "ModelscopeFs", "TEMP_DIR": "./cache"}, load=False),
    Config(cfg_dict={"NAME": "HttpFs", "TEMP_DIR": "./cache"}, load=False),
    Config(cfg_dict={"NAME": "LocalFs", "TEMP_DIR": "./cache"}, load=False),
]
for one_fs in fs_list:
    FS.init_fs_client(one_fs)
os.environ["FLUX_FILL_PATH"]="hf://black-forest-labs/FLUX.1-Fill-dev" | |
os.environ["ACE_PLUS_FFT_MODEL"]="hf://ali-vilab/ACE_Plus@ace_plus_fft.safetensors" | |
FS.get_dir_to_local_dir(os.environ["FLUX_FILL_PATH"]) | |
FS.get_from(os.environ["ACE_PLUS_FFT_MODEL"]) | |
csv.field_size_limit(sys.maxsize) | |
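# The FS helpers above resolve remote URIs through the registered backends; a
# minimal sketch of the behavior (per scepter's FS interface, with the paths
# set above):
#
#     local_dir = FS.get_dir_to_local_dir(os.environ["FLUX_FILL_PATH"])
#     local_ckpt = FS.get_from(os.environ["ACE_PLUS_FFT_MODEL"])
#
# Both download into TEMP_DIR ("./cache") on first use and return a local
# path, so the pipeline can later load the weights from disk.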
refresh_sty = '\U0001f504'  # 🔄
clear_sty = '\U0001f5d1'  # 🗑️
upload_sty = '\U0001f5bc'  # 🖼️
sync_sty = '\U0001f4be'  # 💾
chat_sty = '\U0001F4AC'  # 💬
video_sty = '\U0001f3a5'  # 🎥

lock = threading.Lock()
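# A single pipeline instance is shared across requests; the lock serializes
# pipeline swaps in change_model() so two model switches cannot interleave.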
class DemoUI(object):
    #@spaces.GPU(duration=60)
    def __init__(self,
                 infer_dir="./config/ace_plus_fft.yaml"
                 ):
        self.model_yamls = [infer_dir]
        self.model_choices = dict()
        self.default_model_name = ''
        self.edit_type_dict = {}
        self.edit_type_list = []
        self.default_type_list = []
        for i in self.model_yamls:
            model_cfg = Config(load=True, cfg_file=i)
            model_name = model_cfg.VERSION
            if model_cfg.IS_DEFAULT:
                self.default_model_name = model_name
            self.model_choices[model_name] = model_cfg
            for preprocessor in model_cfg.get("PREPROCESSOR", []):
                if preprocessor["TYPE"] in self.edit_type_dict:
                    continue
                self.edit_type_dict[preprocessor["TYPE"]] = preprocessor
                self.default_type_list.append(preprocessor["TYPE"])
        print('Models: ', self.model_choices.keys())
        assert len(self.model_choices) > 0
        if self.default_model_name == "":
            self.default_model_name = list(self.model_choices.keys())[0]
        self.model_name = self.default_model_name
        pipe_cfg = self.model_choices[self.default_model_name]
        self.pipe = INFERENCES.build(pipe_cfg)
        # Reformat examples into positional rows for gr.Examples. The example
        # set does not carry the change/keep-pixel flags, so each row is
        # padded with the UI defaults (an assumption) to match the number of
        # Examples inputs.
        self.all_examples = [
            [
                one_example["edit_type"], one_example["instruction"],
                one_example["input_reference_image"], one_example["input_image"],
                one_example["input_mask"], one_example["output_h"],
                one_example["output_w"], one_example["seed"],
                self.pipe.input.get("use_change", True),
                self.pipe.input.get("keep_pixel", True),
                0.8
            ]
            for one_example in fft_examples
        ]
    # Pack an (image, mask) pair into the dict layout a gr.ImageMask editor
    # produces: RGBA background/composite plus one RGBA layer whose alpha
    # channel carries the mask.
    def construct_edit_image(self, edit_image, edit_mask):
        if edit_image is not None and edit_mask is not None:
            edit_image_rgb = pillow_convert(edit_image, "RGB")
            edit_image_rgba = pillow_convert(edit_image, "RGBA")
            edit_mask = pillow_convert(edit_mask, "L")
            arr1 = np.array(edit_image_rgb)
            arr2 = np.array(edit_mask)[:, :, np.newaxis]
            result_array = np.concatenate((arr1, arr2), axis=2)
            layer = Image.fromarray(result_array)
            ret_data = {
                "background": edit_image_rgba,
                "composite": edit_image_rgba,
                "layers": [layer]
            }
            return ret_data
        else:
            return None
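    # For reference, this dict mirrors what a gr.ImageMask editor emits, e.g.:
    #
    #     {
    #         "background": <RGBA PIL.Image>,   # the uploaded edit image
    #         "composite":  <RGBA PIL.Image>,   # background plus painted layers
    #         "layers":     [<RGBA PIL.Image>], # alpha channel = brush mask
    #     }
    #
    # preprocess_input() in set_callbacks() reads layers[0]'s alpha channel
    # back out as the edit mask.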
    def create_ui(self):
        with gr.Row(equal_height=True, visible=True):
            with gr.Column(scale=2):
                self.gallery_image = gr.Image(
                    height=600,
                    interactive=False,
                    type='pil',
                    elem_id='Reference_image'
                )
            with gr.Column(scale=1, visible=True) as self.edit_preprocess_panel:
                with gr.Row():
                    with gr.Accordion(label='Related Input Image', open=False):
                        self.edit_preprocess_preview = gr.Image(
                            height=600,
                            interactive=False,
                            type='pil',
                            elem_id='preprocess_image',
                            label='edit image'
                        )
                        self.edit_preprocess_mask_preview = gr.Image(
                            height=600,
                            interactive=False,
                            type='pil',
                            elem_id='preprocess_image_mask',
                            label='edit mask'
                        )
                        self.change_preprocess_preview = gr.Image(
                            height=600,
                            interactive=False,
                            type='pil',
                            elem_id='preprocess_change_image',
                            label='change image'
                        )
        with gr.Row():
            instruction = """
            **Instruction**:
            Perform reference-based generation or editing by uploading a
            reference image and/or an edit image. When an edit image is
            uploaded, several edit types are available; each preserves a
            different kind of information, such as edge or color information.
            The pre-processed inputs can be inspected under the 'Related
            Input Image' tab.
            """
            self.instruction = gr.Markdown(value=instruction)
        with gr.Row():
            self.icon = gr.Image(
                value=None,
                interactive=False,
                height=150,
                type='pil',
                elem_id='icon',
                label='icon'
            )
        with gr.Row():
            self.model_name_dd = gr.Dropdown(
                choices=list(self.model_choices.keys()),
                value=self.default_model_name,
                label='Model Version')
            self.edit_type = gr.Dropdown(choices=self.default_type_list,
                                         interactive=True,
                                         value=self.default_type_list[0],
                                         label='Edit Type')
        with gr.Row():
            self.step = gr.Slider(minimum=1,
                                  maximum=1000,
                                  value=self.pipe.input.get("sample_steps", 20),
                                  visible=self.pipe.input.get("sample_steps", None) is not None,
                                  label='Sample Step')
            self.cfg_scale = gr.Slider(
                minimum=1.0,
                maximum=100.0,
                value=self.pipe.input.get("guide_scale", 4.5),
                visible=self.pipe.input.get("guide_scale", None) is not None,
                label='Guidance Scale')
            self.seed = gr.Slider(minimum=-1,
                                  maximum=1000000000000,
                                  value=-1,
                                  label='Seed')
            self.output_height = gr.Slider(
                minimum=256,
                maximum=1440,
                value=self.pipe.input.get("image_size", [1024, 1024])[0],
                visible=self.pipe.input.get("image_size", None) is not None,
                label='Output Height')
            self.output_width = gr.Slider(
                minimum=256,
                maximum=1440,
                value=self.pipe.input.get("image_size", [1024, 1024])[1],
                visible=self.pipe.input.get("image_size", None) is not None,
                label='Output Width')
            self.repainting_scale = gr.Slider(
                minimum=0.0,
                maximum=1.0,
                value=self.pipe.input.get("repainting_scale", 1.0),
                visible=True,
                label='Repainting Scale')
            self.use_change = gr.Checkbox(
                value=self.pipe.input.get("use_change", True),
                visible=True,
                label='Use Change')
            self.keep_pixel = gr.Checkbox(
                value=self.pipe.input.get("keep_pixel", True),
                visible=True,
                label='Keep Pixels')
            self.keep_pixels_rate = gr.Slider(
                minimum=0.5,
                maximum=1.0,
                value=0.8,
                visible=True,
                label='Keep Pixels Rate')
        with gr.Row():
            self.generation_info_preview = gr.Markdown(
                label='System Log.',
                show_label=True)
        with gr.Row(variant='panel',
                    equal_height=True,
                    show_progress=False):
            with gr.Column(scale=10, min_width=500):
                self.text = gr.Textbox(
                    placeholder='Input "@" to find image history',
                    label='Instruction',
                    container=False,
                    lines=1)
            with gr.Column(scale=2, min_width=100):
                with gr.Row():
                    with gr.Column(scale=1, min_width=100):
                        self.chat_btn = gr.Button(value='Generate', variant="primary")
        with gr.Accordion(label='Advanced', open=True):
            with gr.Row(visible=True):
                with gr.Column():
                    self.reference_image = gr.Image(
                        height=1000,
                        interactive=True,
                        image_mode='RGB',
                        type='pil',
                        label='Reference Image',
                        elem_id='reference_image'
                    )
                with gr.Column():
                    self.edit_image = gr.ImageMask(
                        height=1000,
                        interactive=True,
                        value=None,
                        sources=['upload'],
                        type='pil',
                        layers=False,
                        label='Edit Image',
                        elem_id='image_editor',
                        show_fullscreen_button=True,
                        format="png"
                    )
        with gr.Row():
            self.eg = gr.Column(visible=True)
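    # create_ui() only instantiates the components; set_callbacks() wires the
    # events to them, so both are invoked inside the same gr.Blocks context
    # (see the __main__ block at the bottom).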
    def set_callbacks(self, *args, **kwargs):
        ########################################
        def change_model(model_name):
            if model_name not in self.model_choices:
                gr.Info('The provided model name is not a valid choice!')
                # Return one update per registered output component.
                return (model_name, gr.update(), gr.update(), gr.update(),
                        gr.update(), gr.update(), gr.update())

            if model_name != self.model_name:
                with lock:
                    # Drop the old pipeline and free its GPU memory before
                    # building the new one.
                    del self.pipe
                    torch.cuda.empty_cache()
                    torch.cuda.ipc_collect()
                    pipe_cfg = self.model_choices[model_name]
                    self.pipe = INFERENCES.build(pipe_cfg)
                    self.model_name = model_name

            return (model_name, gr.update(),
                    gr.Slider(
                        value=self.pipe.input.get("sample_steps", 20),
                        visible=self.pipe.input.get("sample_steps", None) is not None),
                    gr.Slider(
                        value=self.pipe.input.get("guide_scale", 4.5),
                        visible=self.pipe.input.get("guide_scale", None) is not None),
                    gr.Slider(
                        value=self.pipe.input.get("image_size", [1024, 1024])[0],
                        visible=self.pipe.input.get("image_size", None) is not None),
                    gr.Slider(
                        value=self.pipe.input.get("image_size", [1024, 1024])[1],
                        visible=self.pipe.input.get("image_size", None) is not None),
                    gr.Slider(value=self.pipe.input.get("repainting_scale", 1.0))
                    )

        self.model_name_dd.change(
            change_model,
            inputs=[self.model_name_dd],
            outputs=[
                self.model_name_dd, self.text,
                self.step,
                self.cfg_scale,
                self.output_height,
                self.output_width,
                self.repainting_scale])
        def change_edit_type(edit_type):
            edit_info = self.edit_type_dict[edit_type]
            edit_info = edit_info or {}
            # Each edit type carries its own default repainting scale.
            repainting_scale = edit_info.get("REPAINTING_SCALE", 1.0)
            return gr.Slider(value=repainting_scale)

        self.edit_type.change(change_edit_type,
                              inputs=[self.edit_type],
                              outputs=[self.repainting_scale])

        def resize_image(image, h):
            # Resize to a target height while preserving the aspect ratio.
            ow, oh = image.size
            w = int(h * ow / oh)
            image = image.resize((w, h), Image.LANCZOS)
            return image
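        # Example: resize_image derives the width from the target height,
        # e.g. a 1024x768 input with h=150 gives w = int(150 * 1024 / 768) = 200,
        # so the icon thumbnail produced below is 200x150.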
        def preprocess_input(ref_image, edit_image_dict, preprocess=None):
            err_msg = ""
            is_suc = True
            if ref_image is not None:
                ref_image = pillow_convert(ref_image, "RGB")

            if edit_image_dict is None:
                edit_image = None
                edit_mask = None
            else:
                edit_image = edit_image_dict["background"]
                # The brush strokes live in the alpha channel of layer 0.
                edit_mask = np.array(edit_image_dict["layers"][0])[:, :, 3]
                if np.sum(np.array(edit_image)) < 1:
                    # Empty background: treat the edit input as absent.
                    edit_image = None
                    edit_mask = None
                elif np.sum(np.array(edit_mask)) < 1:
                    # Image without brush strokes: repaint everywhere.
                    edit_image = pillow_convert(edit_image, "RGB")
                    w, h = edit_image.size
                    edit_mask = Image.new("L", (w, h), 255)
                else:
                    edit_image = pillow_convert(edit_image, "RGB")
                    edit_mask = Image.fromarray(edit_mask).convert('L')

            if ref_image is None and edit_image is None:
                err_msg = "Please provide a reference image or an edit image."
                return None, None, None, False, err_msg
            return edit_image, edit_mask, ref_image, is_suc, err_msg
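        # Case summary, (background, strokes) -> (edit_image, edit_mask):
        #   empty background, anything -> (None, None): edit input treated as absent
        #   image, no strokes          -> (RGB, all-white mask): repaint everywhere
        #   image, strokes             -> (RGB, alpha as L mask): repaint strokes only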
        def run_chat(
                prompt,
                ref_image,
                edit_image,
                edit_type,
                cfg_scale,
                step,
                seed,
                output_h,
                output_w,
                repainting_scale,
                use_change,
                keep_pixel,
                keep_pixels_rate,
                progress=gr.Progress(track_tqdm=True)
        ):
            edit_info = self.edit_type_dict[edit_type]
            pre_edit_image, pre_edit_mask, pre_ref_image, is_suc, err_msg = preprocess_input(
                ref_image, edit_image)
            icon = pre_edit_image if pre_edit_image is not None else pre_ref_image
            if not is_suc:
                err_msg = f"<mark>{err_msg}</mark>"
                # One update per output in chat_outputs, icon included.
                return (gr.Image(), gr.Column(visible=True),
                        gr.Image(),
                        gr.Image(),
                        gr.Image(),
                        gr.Text(value=err_msg),
                        gr.Image())
            pre_edit_image = edit_preprocess(edit_info.ANNOTATOR, we.device_id,
                                             pre_edit_image, pre_edit_mask)
            # edit_image["background"] = pre_edit_image
            st = time.time()
            image, edit_image, change_image, mask, seed = self.pipe(
                reference_image=pre_ref_image,
                edit_image=pre_edit_image,
                edit_mask=pre_edit_mask,
                prompt=prompt,
                output_height=output_h,
                output_width=output_w,
                sampler='flow_euler',
                sample_steps=step,
                guide_scale=cfg_scale,
                seed=seed,
                repainting_scale=repainting_scale,
                use_change=use_change,
                keep_pixels=keep_pixel,
                keep_pixels_rate=keep_pixels_rate
            )
            et = time.time()
            msg = f"prompt: {prompt}; seed: {seed}; cost time: {et - st}s; repainting scale: {repainting_scale}"
            if icon is not None:
                icon = resize_image(icon, 150)
            return (gr.Image(value=image), gr.Column(visible=True),
                    gr.Image(value=edit_image),
                    gr.Image(value=change_image),
                    gr.Image(value=pre_edit_mask),
                    gr.Text(value=msg),
                    gr.Image(value=icon))
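        # The success tuple maps positionally onto chat_outputs below:
        # gallery_image, edit_preprocess_panel, edit_preprocess_preview,
        # change_preprocess_preview, edit_preprocess_mask_preview,
        # generation_info_preview, icon.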
        chat_inputs = [
            self.reference_image,
            self.edit_image,
            self.edit_type,
            self.cfg_scale,
            self.step,
            self.seed,
            self.output_height,
            self.output_width,
            self.repainting_scale,
            self.use_change,
            self.keep_pixel,
            self.keep_pixels_rate
        ]

        chat_outputs = [
            self.gallery_image, self.edit_preprocess_panel, self.edit_preprocess_preview,
            self.change_preprocess_preview,
            self.edit_preprocess_mask_preview, self.generation_info_preview,
            self.icon
        ]

        self.chat_btn.click(run_chat,
                            inputs=[self.text] + chat_inputs,
                            outputs=chat_outputs,
                            queue=True)

        self.text.submit(run_chat,
                         inputs=[self.text] + chat_inputs,
                         outputs=chat_outputs,
                         queue=True)
        def run_example(edit_type, prompt, ref_image, edit_image, edit_mask,
                        output_h, output_w, seed, use_change, keep_pixel,
                        keep_pixels_rate,
                        progress=gr.Progress(track_tqdm=True)):
            # Examples use the pipeline defaults for steps and guidance; the
            # 4.5 fallback matches the UI slider above.
            step = self.pipe.input.get("sample_steps", 20)
            cfg_scale = self.pipe.input.get("guide_scale", 4.5)
            edit_info = self.edit_type_dict[edit_type]
            edit_image = self.construct_edit_image(edit_image, edit_mask)

            pre_edit_image, pre_edit_mask, pre_ref_image, _, _ = preprocess_input(ref_image, edit_image)
            icon = pre_edit_image if pre_edit_image is not None else pre_ref_image
            pre_edit_image = edit_preprocess(edit_info.ANNOTATOR, we.device_id,
                                             pre_edit_image, pre_edit_mask)
            edit_info = edit_info or {}
            repainting_scale = edit_info.get("REPAINTING_SCALE", 1.0)
            st = time.time()
            image, edit_image, change_image, mask, seed = self.pipe(
                reference_image=pre_ref_image,
                edit_image=pre_edit_image,
                edit_mask=pre_edit_mask,
                prompt=prompt,
                output_height=output_h,
                output_width=output_w,
                sampler='flow_euler',
                sample_steps=step,
                guide_scale=cfg_scale,
                seed=seed,
                repainting_scale=repainting_scale,
                use_change=use_change,
                keep_pixels=keep_pixel,
                keep_pixels_rate=keep_pixels_rate
            )
            et = time.time()
            msg = f"prompt: {prompt}; seed: {seed}; cost time: {et - st}s; repainting scale: {repainting_scale}"
            if pre_edit_image is not None:
                # Black out the masked region so the editor shows what will be repainted.
                ret_image = Image.composite(Image.new("RGB", pre_edit_image.size, (0, 0, 0)),
                                            pre_edit_image, pre_edit_mask)
            else:
                ret_image = None
            if icon is not None:
                icon = resize_image(icon, 150)
            return (gr.Image(value=image), gr.Column(visible=True),
                    gr.Image(value=edit_image),
                    gr.Image(value=change_image),
                    gr.Image(value=pre_edit_mask),
                    gr.Text(value=msg),
                    gr.update(value=ret_image),
                    gr.Image(value=icon))
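        # Compared with run_chat, run_example returns one extra slot: the
        # gr.update(value=ret_image) pushes the blacked-out mask preview back
        # into the self.edit_image editor listed in the Examples outputs.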
        with self.eg:
            self.example_edit_image = gr.Image(label='Edit Image',
                                               type='pil',
                                               image_mode='RGB',
                                               visible=False)
            self.example_edit_mask = gr.Image(label='Edit Image Mask',
                                              type='pil',
                                              image_mode='L',
                                              visible=False)
            self.examples = gr.Examples(
                fn=run_example,
                examples=self.all_examples,
                inputs=[
                    self.edit_type, self.text, self.reference_image, self.example_edit_image,
                    self.example_edit_mask, self.output_height, self.output_width, self.seed,
                    self.use_change, self.keep_pixel, self.keep_pixels_rate
                ],
                outputs=[self.gallery_image, self.edit_preprocess_panel, self.edit_preprocess_preview,
                         self.change_preprocess_preview,
                         self.edit_preprocess_mask_preview, self.generation_info_preview,
                         self.edit_image,
                         self.icon],
                examples_per_page=15,
                cache_examples=False,
                run_on_click=True)
if __name__ == '__main__':
    with gr.Blocks() as demo:
        chatbot = DemoUI()
        chatbot.create_ui()
        chatbot.set_callbacks()
    demo.launch()
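# To run locally: `python app.py`; Gradio serves at http://127.0.0.1:7860 by
# default. On a ZeroGPU Space, GPU-bound entry points are normally wrapped
# with @spaces.GPU (note the commented-out decorator on DemoUI.__init__).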