Spaces:

amos1088
/

test_gradio

Paused

App Files Community

amos1088 committed on Oct 29, 2024

Commit

52d3f89

1 Parent(s): 6c3f566

test gradio

Browse files

Files changed (1) hide show

app.py +12 -39

app.py CHANGED Viewed

@@ -1,13 +1,6 @@
 import gradio as gr
 import torch
-from diffusers import (
-    StableDiffusion3Pipeline,  # For SD3 models like Stable Diffusion 3.5
-    ControlNetModel,
-    SD3Transformer2DModel,  # Replacing UNet with SD3 transformer
-    AutoencoderKL,
-    UniPCMultistepScheduler,
-)
-from transformers import CLIPFeatureExtractor, CLIPTextModel, CLIPTokenizer
 from huggingface_hub import login
 import os
@@ -17,41 +10,21 @@ login(token=token)
 # Model IDs for the base Stable Diffusion model and ControlNet variant
 model_id = "stabilityai/stable-diffusion-3.5-large-turbo"
-controlnet_id = "lllyasviel/control_v11p_sd15_inpaint"
-# Load each model component required by the pipeline
-controlnet = ControlNetModel.from_pretrained(controlnet_id, torch_dtype=torch.float16)
-transformer = SD3Transformer2DModel.from_pretrained(model_id, subfolder="transformer", torch_dtype=torch.float16)
-vae = AutoencoderKL.from_pretrained(model_id, subfolder="vae", torch_dtype=torch.float16)
-feature_extractor = CLIPFeatureExtractor.from_pretrained(model_id)
-text_encoder = CLIPTextModel.from_pretrained(model_id, subfolder="text_encoder")
-tokenizer = CLIPTokenizer.from_pretrained(model_id)
-# Initialize the pipeline with all components
-pipeline = StableDiffusion3Pipeline(
-    transformer=transformer,  # Using SD3 transformer
-    vae=vae,
-    text_encoder=text_encoder,
-    tokenizer=tokenizer,
-    controlnet=controlnet,
-    scheduler=UniPCMultistepScheduler.from_config({"name": "UniPCMultistepScheduler"}),
-    feature_extractor=feature_extractor,
-    torch_dtype=torch.float16,
-)
-# Set device for pipeline
-pipeline = pipeline.to("cuda") if torch.cuda.is_available() else pipeline
-# Enable model CPU offloading for memory optimization
-pipeline.enable_model_cpu_offload()
 # Gradio interface function
 def generate_image(prompt, reference_image):
-    # Resize and prepare reference image
     reference_image = reference_image.convert("RGB").resize((512, 512))
-    # Generate image using the pipeline with ControlNet
-    generated_image = pipeline(
         prompt=prompt,
         image=reference_image,
         controlnet_conditioning_scale=1.0,
@@ -68,8 +41,8 @@ interface = gr.Interface(
         gr.Image(type="pil", label="Reference Image (Style)")
     ],
     outputs="image",
-    title="Image Generation with ControlNet (Reference-Only Style Transfer)",
-    description="Generates an image based on a text prompt and style reference image using Stable Diffusion 3.5 and ControlNet (reference-only mode)."
 )
 # Launch the Gradio interface

 import gradio as gr
 import torch
+from diffusers import StableDiffusion3Pipeline, ControlNetModel, UniPCMultistepScheduler
 from huggingface_hub import login
 import os
 # Model IDs for the base Stable Diffusion model and ControlNet variant
 model_id = "stabilityai/stable-diffusion-3.5-large-turbo"
+controlnet_id = "lllyasviel/control_v11p_sd15_inpaint"  # Adjust based on ControlNet needs
+# Load ControlNet and Stable Diffusion models
+controlnet = ControlNetModel.from_pretrained(controlnet_id, torch_dtype=torch.bfloat16)
+pipe = StableDiffusion3Pipeline.from_pretrained(model_id, controlnet=controlnet, torch_dtype=torch.bfloat16)
+pipe.scheduler = UniPCMultistepScheduler.from_config(pipe.scheduler.config)
+pipe = pipe.to("cuda") if torch.cuda.is_available() else pipe
 # Gradio interface function
 def generate_image(prompt, reference_image):
+    # Prepare the reference image
     reference_image = reference_image.convert("RGB").resize((512, 512))
+    # Generate the image using the pipeline with ControlNet
+    generated_image = pipe(
         prompt=prompt,
         image=reference_image,
         controlnet_conditioning_scale=1.0,
         gr.Image(type="pil", label="Reference Image (Style)")
     ],
     outputs="image",
+    title="Image Generation with Stable Diffusion 3.5 and ControlNet",
+    description="Generates an image based on a text prompt and style reference image using Stable Diffusion 3.5 and ControlNet."
 )
 # Launch the Gradio interface