ysharma (HF staff) committed on
Commit 420a964
1 Parent(s): 4b1b707

Update app.py

Files changed (1):
  1. app.py +34 -28

app.py CHANGED
@@ -3,14 +3,12 @@ from diffusers import ControlNetModel, StableDiffusionXLControlNetPipeline, Auto
 from diffusers.utils import load_image
 from transformers import DPTImageProcessor, DPTForDepthEstimation
 import torch
-import mediapy
 import sa_handler
 import pipeline_calls
 
 
 
-# init models
-
+# Initialize models
 depth_estimator = DPTForDepthEstimation.from_pretrained("Intel/dpt-hybrid-midas").to("cuda")
 feature_processor = DPTImageProcessor.from_pretrained("Intel/dpt-hybrid-midas")
 
@@ -29,9 +27,11 @@ pipeline = StableDiffusionXLControlNetPipeline.from_pretrained(
     use_safetensors=True,
     torch_dtype=torch.float16,
 ).to("cuda")
+# Configure pipeline for CPU offloading and VAE slicing
 pipeline.enable_model_cpu_offload()
 pipeline.enable_vae_slicing()
 
+# Initialize style-aligned handler
 sa_args = sa_handler.StyleAlignedArgs(share_group_norm=False,
                                       share_layer_norm=False,
                                       share_attention=True,
@@ -43,50 +43,56 @@ handler = sa_handler.Handler(pipeline)
 handler.register(sa_args, )
 
 
-
-
-# run ControlNet depth with StyleAligned
+# Function to run ControlNet depth with StyleAligned
 def style_aligned_controlnet(ref_style_prompt, depth_map, ref_image, img_generation_prompt):
-    if depth_map == True:
-        image = load_image(ref_image)
-        depth_image = pipeline_calls.get_depth_map(image, feature_processor, depth_estimator)
-    else:
-        depth_image = load_image(ref_image).resize((1024, 1024))
-    controlnet_conditioning_scale = 0.8
-    num_images_per_prompt = 3 # adjust according to VRAM size
-    latents = torch.randn(1 + num_images_per_prompt, 4, 128, 128).to(pipeline.unet.dtype)
-    latents[1:] = torch.randn(num_images_per_prompt, 4, 128, 128).to(pipeline.unet.dtype)
-    images = pipeline_calls.controlnet_call(pipeline, [ref_style_prompt, img_generation_prompt],
-                                            image=depth_image,
-                                            num_inference_steps=50,
-                                            controlnet_conditioning_scale=controlnet_conditioning_scale,
-                                            num_images_per_prompt=num_images_per_prompt,
-                                            latents=latents)
-    #mediapy.show_images([images[0], depth_image2] + images[1:], titles=["reference", "depth"] + [f'result {i}' for i in range(1, len(images))])
-    return [images[0], depth_image] + images[1:], gr.Image(value=images[0], visible=True)
-
-
+    try:
+        if depth_map == True:
+            image = load_image(ref_image)
+            depth_image = pipeline_calls.get_depth_map(image, feature_processor, depth_estimator)
+        else:
+            depth_image = load_image(ref_image).resize((1024, 1024))
+        controlnet_conditioning_scale = 0.8
+        num_images_per_prompt = 3  # adjust according to VRAM size
+        latents = torch.randn(1 + num_images_per_prompt, 4, 128, 128).to(pipeline.unet.dtype)
+        latents[1:] = torch.randn(num_images_per_prompt, 4, 128, 128).to(pipeline.unet.dtype)
+        images = pipeline_calls.controlnet_call(pipeline, [ref_style_prompt, img_generation_prompt],
+                                                image=depth_image,
+                                                num_inference_steps=50,
+                                                controlnet_conditioning_scale=controlnet_conditioning_scale,
+                                                num_images_per_prompt=num_images_per_prompt,
+                                                latents=latents)
+        return [images[0], depth_image] + images[1:], gr.Image(value=images[0], visible=True)
+    except Exception as e:
+        raise gr.Error(f"Error in generating images: {e}")
+
+# Create a Gradio UI
 with gr.Blocks() as demo:
     gr.HTML('<h1 style="text-align: center;">Style-aligned with ControlNet Depth</h1>')
     with gr.Row():
 
         with gr.Column(variant='panel'):
+            # Textbox for reference style prompt
             ref_style_prompt = gr.Textbox(
                 label='Reference style prompt',
                 info="Enter a Prompt to generate the reference image", placeholder='a poster in <style name> style'
             )
+            # Checkbox for using controlnet depth-map
            depth_map = gr.Checkbox(label='Depth-map',)
+            # Image display for the generated reference style image
            ref_style_image = gr.Image(visible=False, label='Reference style image')
 
        with gr.Column(variant='panel'):
+            # Image upload option for uploading a reference image for controlnet
            ref_image = gr.Image(label="Upload the reference image",
                                 type='filepath' )
+            # Textbox for ControlNet prompt
            img_generation_prompt = gr.Textbox(
                label='ControlNet Prompt',
                info="Enter a Prompt to generate images using ControlNet and Style-aligned",
            )
-
+            # Button to trigger image generation
            btn = gr.Button("Generate", size='sm')
+            # Gallery to display generated images
            gallery = gr.Gallery(label="Style-Aligned ControlNet - Generated images",
                                 elem_id="gallery",
                                 columns=5,
@@ -101,7 +107,7 @@ with gr.Blocks() as demo:
                         api_name="style_aligned_controlnet")
 
 
-
+    # Example inputs for the Gradio interface
    gr.Examples(
        examples=[
            ['A poster in a papercut art style.', False, 'example_image/A.png', 'Letter A in a papercut art style.'],
@@ -116,5 +122,5 @@ with gr.Blocks() as demo:
        fn=style_aligned_controlnet,
    )
 
-
+# Launch the Gradio demo
demo.launch()
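
A note on the latent setup in style_aligned_controlnet: the function draws 1 + num_images_per_prompt latent tensors, then resamples only latents[1:]. Index 0 is the noise for the reference-style image, and the ControlNet-guided targets are denoised in the same batch so that the shared-attention handler can align their style to it. A minimal sketch of that batch layout (the 4x128x128 shape is SDXL's latent grid at 1024x1024):

import torch

num_images_per_prompt = 3
# latents[0]  -> reference style image (kept across the batch)
# latents[1:] -> ControlNet-guided results, style-aligned to latents[0]
latents = torch.randn(1 + num_images_per_prompt, 4, 128, 128)
latents[1:] = torch.randn(num_images_per_prompt, 4, 128, 128)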
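
pipeline_calls.get_depth_map itself is not part of this commit. A minimal sketch of such a DPT depth helper, following the standard diffusers ControlNet-depth recipe; the repo's actual implementation may differ:

import numpy as np
import torch
from PIL import Image

def get_depth_map(image, feature_processor, depth_estimator):
    # Preprocess with the DPT processor and predict depth
    inputs = feature_processor(images=image, return_tensors="pt").pixel_values.to("cuda")
    with torch.no_grad(), torch.autocast("cuda"):
        depth = depth_estimator(inputs).predicted_depth
    # Resize to the SDXL resolution and normalize to [0, 1]
    depth = torch.nn.functional.interpolate(
        depth.unsqueeze(1), size=(1024, 1024), mode="bicubic", align_corners=False,
    )
    dmin = torch.amin(depth, dim=[1, 2, 3], keepdim=True)
    dmax = torch.amax(depth, dim=[1, 2, 3], keepdim=True)
    depth = (depth - dmin) / (dmax - dmin)
    # Replicate to 3 channels and convert to a PIL image for ControlNet conditioning
    depth = torch.cat([depth] * 3, dim=1).permute(0, 2, 3, 1).cpu().numpy()[0]
    return Image.fromarray((depth * 255.0).clip(0, 255).astype(np.uint8))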
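
Because the click handler registers api_name="style_aligned_controlnet", the endpoint can also be called programmatically once the Space is running. A sketch using gradio_client; the Space id below is a placeholder assumption, and the inputs mirror the first gr.Examples row:

from gradio_client import Client

client = Client("user/style-aligned-controlnet")  # placeholder: substitute the actual Space id
result = client.predict(
    "A poster in a papercut art style.",   # ref_style_prompt
    False,                                 # depth_map checkbox: False -> use ref_image directly as depth conditioning
    "example_image/A.png",                 # ref_image (filepath)
    "Letter A in a papercut art style.",   # img_generation_prompt
    api_name="/style_aligned_controlnet",
)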