hatmanstack committed on
Commit 1963e4b
1 Parent(s): 76f94b4

Fixed tabs

Files changed (3)
  1. README.md +27 -21
  2. app.py +387 -61
  3. requirements.txt +1 -2
README.md CHANGED
@@ -1,3 +1,4 @@
+---
 title: AWS Nova Canvas
 emoji: 🖼️
 colorFrom: blue
@@ -6,35 +7,40 @@ sdk: gradio
 sdk_version: 5.6.0
 app_file: app.py
 pinned: false
-license: apache2.0
+license: apache-2.0
 short_description: Generate image variations
+---
 
 
-# Amazon Nova Canvas Image Generation
+# AWS Nova Canvas Image Generation
 
-This Gradio application demonstrates various image generation capabilities using the Amazon Nova Canvas model. The application provides multiple functionalities, each accessible through its own tab, allowing users to generate and manipulate images based on text prompts and other inputs.
+A Gradio application for advanced image generation using Amazon Nova Canvas, offering comprehensive image manipulation capabilities.
 
-## Features
+## Capabilities
 
-- **Text to Image**: Generate an image from a text prompt using the Amazon Nova Canvas model.
-- **Inpainting**: Modify specific areas of an image based on a text prompt.
-- **Outpainting**: Extend an image beyond its original borders using a mask and text prompt.
-- **Image Variation**: Create variations of an image based on a text description.
-- **Image Conditioning**: Generate an image conditioned on an input image and a text prompt.
-- **Color Guided Content**: Generate an image using a color palette from a reference image and a text prompt.
-- **Background Removal**: Remove the background from an image.
+- **Text to Image**: Generate images from text prompts
+- **Inpainting**: Modify specific image areas
+- **Outpainting**: Extend image boundaries
+- **Image Variation**: Create image variations
+- **Image Conditioning**: Generate images based on input image and text
+- **Color Guided Content**: Create images using reference color palettes
+- **Background Removal**: Remove image backgrounds
 
-## Usage
+## Prerequisites
 
-1. **Text to Image**: Enter a descriptive text prompt and click "Generate" to create an image.
-2. **Inpainting**: Upload an image, provide a mask prompt, and click "Generate" to modify specific areas.
-3. **Outpainting**: Upload an image and a mask image, provide a text prompt, and click "Generate" to extend the image.
-4. **Image Variation**: Upload an image, provide a text description, and click "Generate" to create variations.
-5. **Image Conditioning**: Upload an image, provide a text prompt, and click "Generate" to condition the image.
-6. **Color Guided Content**: Upload an image, provide a text prompt and color palette, and click "Generate" to guide content generation.
-7. **Background Removal**: Upload an image and click "Generate" to remove the background.
+- AWS credentials configured
+- Boto3 Python library
+- Gradio 5.6.0
 
-## Excellent Documentation
+## Technical Details
 
-<p>For more information, visit <a href="https://docs.aws.amazon.com/nova/latest/userguide/what-is-nova.html">AWS Nova documentation</a>.</p>
+- Model: Amazon Nova Canvas (amazon.nova-canvas-v1:0)
+- Image Generation Parameters:
+  - Default resolution: 1024x1024
+  - Quality: Standard
+  - CFG Scale: 8.0
+  - Configurable seed
 
+## Documentation
+
+For detailed usage, visit [AWS Nova documentation](https://docs.aws.amazon.com/nova/latest/userguide/what-is-nova.html).
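
The defaults listed under Technical Details map directly onto the Bedrock `invoke_model` request that app.py builds. A minimal sketch of that request, assuming AWS credentials are already available to boto3 and using an illustrative prompt and output filename:

```python
import base64
import json

import boto3

# Region and model id follow app.py; credentials are assumed to be configured.
bedrock = boto3.client("bedrock-runtime", region_name="us-east-1")

body = json.dumps({
    "taskType": "TEXT_IMAGE",
    "textToImageParams": {"text": "A lighthouse on a rocky coast at dusk"},
    "imageGenerationConfig": {
        "numberOfImages": 1,
        "height": 1024,        # default resolution
        "width": 1024,
        "quality": "standard",
        "cfgScale": 8.0,
        "seed": 0,             # configurable seed
    },
})

response = bedrock.invoke_model(
    body=body,
    modelId="amazon.nova-canvas-v1:0",
    accept="application/json",
    contentType="application/json",
)
payload = json.loads(response["body"].read())
image_bytes = base64.b64decode(payload["images"][0])

with open("nova_canvas_sample.png", "wb") as f:
    f.write(image_bytes)
```

The same `imageGenerationConfig` block accompanies every generation task in app.py below; only the `taskType` and its params object change (background removal sends no generation config).
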
app.py CHANGED
@@ -4,7 +4,10 @@ import json
 import logging
 import boto3
 from PIL import Image
+from botocore.config import Config
+from botocore.exceptions import ClientError
 import gradio as gr
+import os
 
 # Set up logging
 logger = logging.getLogger(__name__)
@@ -16,27 +19,96 @@ class ImageError(Exception):
         self.message = message
 
 model_id = 'amazon.nova-canvas-v1:0'
+aws_id = os.getenv('AWS_ID')
+aws_secret = os.getenv('AWS_SECRET')
+
+def process_and_encode_image(image, min_size=320, max_size=4096, max_pixels=4194304):
+    if image is None:
+        raise ValueError("Input image is required.")
+    if not isinstance(image, Image.Image):
+        image = Image.open(image)
+
+    # Convert to RGB mode if necessary
+    if image.mode not in ('RGB', 'RGBA'):
+        image = image.convert('RGB')
+    elif image.mode == 'RGBA':
+        # Convert RGBA to RGB by compositing on white background
+        background = Image.new('RGB', image.size, (255, 255, 255))
+        background.paste(image, mask=image.split()[3])  # Use alpha channel as mask
+        image = background
+
+    # Ensure 8-bit color depth
+    if image.mode == 'RGB' and isinstance(image.getpixel((0,0)), tuple) and len(image.getpixel((0,0))) == 3:
+        if not all(0 <= x <= 255 for x in image.getpixel((0,0))):
+            image = image.convert('RGB')
+
+    current_pixels = image.width * image.height
+    # If image exceeds max pixels, scale it down while maintaining aspect ratio
+    if current_pixels > max_pixels:
+        aspect_ratio = image.width / image.height
+        if aspect_ratio > 1:  # Width > Height
+            new_width = int((max_pixels * aspect_ratio) ** 0.5)
+            new_height = int(new_width / aspect_ratio)
+        else:  # Height >= Width
+            new_height = int((max_pixels / aspect_ratio) ** 0.5)
+            new_width = int(new_height * aspect_ratio)
+
+        image = image.resize((new_width, new_height), Image.LANCZOS)
+
+    # Ensure dimensions are within valid range
+    if image.width < min_size or image.width > max_size or image.height < min_size or image.height > max_size:
+        new_width = min(max(image.width, min_size), max_size)
+        new_height = min(max(image.height, min_size), max_size)
+        image = image.resize((new_width, new_height), Image.LANCZOS)
+
+    # Convert to bytes and encode to base64
+    image_bytes = io.BytesIO()
+    # Save as PNG with maximum compatibility
+    image.save(image_bytes, format='PNG', optimize=True)
+    encoded_image = base64.b64encode(image_bytes.getvalue()).decode('utf8')
+
+    return encoded_image
+
 # Function to generate an image using Amazon Nova Canvas model
 def generate_image(body):
     logger.info("Generating image with Amazon Nova Canvas model %s", model_id)
-    session = boto3.Session(aws_access_key_id=aws_id, aws_secret_access_key=aws_secret, region_name='us-east-1')
-    bedrock = session.client('bedrock-runtime')
-    accept = "application/json"
-    content_type = "application/json"
 
-    response = bedrock.invoke_model(body=body, modelId=model_id, accept=accept, contentType=content_type)
-    response_body = json.loads(response.get("body").read())
+    # Configure the client with a longer timeout
+    bedrock = boto3.client(
+        service_name='bedrock-runtime',
+        aws_access_key_id=aws_id,
+        aws_secret_access_key=aws_secret,
+        region_name='us-east-1',
+        config=Config(read_timeout=300)  # Add 5-minute timeout
+    )
+
+    print(body)
+
+    try:
+        response = bedrock.invoke_model(
+            body=body,
+            modelId=model_id,
+            accept="application/json",
+            contentType="application/json"
+        )
+
+        response_body = json.loads(response.get("body").read())
 
-    base64_image = response_body.get("images")[0]
-    base64_bytes = base64_image.encode('ascii')
-    image_bytes = base64.b64decode(base64_bytes)
+        # Check for error before processing the image
+        if "error" in response_body:
+            raise ImageError(f"Image generation error. Error is {response_body['error']}")
 
-    finish_reason = response_body.get("error")
-    if finish_reason is not None:
-        raise ImageError(f"Image generation error. Error is {finish_reason}")
+        base64_image = response_body.get("images")[0]
+        base64_bytes = base64_image.encode('ascii')
+        image_bytes = base64.b64decode(base64_bytes)
 
-    logger.info("Successfully generated image with Amazon Nova Canvas model %s", model_id)
-    return image_bytes
+        logger.info("Successfully generated image with Amazon Nova Canvas model %s", model_id)
+        return image_bytes
+
+    except ClientError as err:
+        message = err.response["Error"]["Message"]
+        logger.error("A client error occurred: %s", message)
+        raise ImageError(f"Client error during image generation: {message}")
 
 # Function to display image from bytes
 def display_image(image_bytes):
@@ -44,68 +116,229 @@ def display_image(image_bytes):
     return image
 
 # Gradio functions for each task
-def text_to_image(prompt):
+def text_to_image(prompt, negative_text=None, height=1024, width=1024, quality="standard", cfg_scale=8.0, seed=0):
+    # Prepare the textToImageParams dictionary
+    text_to_image_params = {
+        "text": prompt
+    }
+
+    # Conditionally add negativeText if it is not None and not empty
+    if negative_text:
+        text_to_image_params["negativeText"] = negative_text
+
     body = json.dumps({
         "taskType": "TEXT_IMAGE",
-        "textToImageParams": {"text": prompt},
-        "imageGenerationConfig": {"numberOfImages": 1, "height": 1024, "width": 1024, "cfgScale": 8.0, "seed": 0}
+        "textToImageParams": text_to_image_params,
+        "imageGenerationConfig": {
+            "numberOfImages": 1,
+            "height": height,
+            "width": width,
+            "quality": quality,
+            "cfgScale": cfg_scale,
+            "seed": seed
+        }
     })
     image_bytes = generate_image(body)
     return display_image(image_bytes)
 
-def inpainting(image, mask_prompt):
-    input_image = base64.b64encode(image.read()).decode('utf8')
+def inpainting(image, mask_prompt=None, mask_image=None, text=None, negative_text=None, height=1024, width=1024, quality="standard", cfg_scale=8.0, seed=0):
+    if image is not None:
+        input_image = process_and_encode_image(image)
+    else:
+        raise ValueError("Input image is required.")
+
+    if mask_image is not None:
+        mask_image_encoded = process_and_encode_image(image)
+    else:
+        mask_image_encoded = None
+
+    if not mask_prompt and not mask_image:
+        raise ValueError("You must specify either maskPrompt or maskImage.")
+
+    # Prepare the inPaintingParams dictionary
+    if mask_prompt and mask_image_encoded:
+        raise ValueError("You must specify either maskPrompt or maskImage, but not both.")
+    if not mask_prompt and not mask_image_encoded:
+        raise ValueError("You must specify either maskPrompt or maskImage.")
+
+    # Prepare the inPaintingParams dictionary with the appropriate mask parameter
+    in_painting_params = {
+        "image": input_image
+    }
+
+    if mask_prompt:
+        in_painting_params["maskPrompt"] = mask_prompt
+    elif mask_image_encoded:
+        in_painting_params["maskImage"] = mask_image_encoded
+    if text:
+        in_painting_params["text"] = text
+    if negative_text:
+        in_painting_params["negativeText"] = negative_text
+
     body = json.dumps({
         "taskType": "INPAINTING",
-        "inPaintingParams": {"text": mask_prompt, "image": input_image, "maskPrompt": "windows"},
-        "imageGenerationConfig": {"numberOfImages": 1, "height": 512, "width": 512, "cfgScale": 8.0}
+        "inPaintingParams": in_painting_params,
+        "imageGenerationConfig": {
+            "numberOfImages": 1,
+            "height": height,
+            "width": width,
+            "quality": quality,
+            "cfgScale": cfg_scale,
+            "seed": seed
+        }
     })
     image_bytes = generate_image(body)
     return display_image(image_bytes)
 
-def outpainting(image, mask_image, text):
-    input_image = base64.b64encode(image.read()).decode('utf8')
-    input_mask_image = base64.b64encode(mask_image.read()).decode('utf8')
+def outpainting(image, mask_prompt=None, mask_image=None, text=None, negative_text=None, outpainting_mode="DEFAULT", height=1024, width=1024, quality="standard", cfg_scale=8.0, seed=0):
+    if image is not None:
+        input_image = process_and_encode_image(image)
+    else:
+        raise ValueError("Input image is required.")
+
+    if mask_image is not None:
+        mask_bytes = io.BytesIO()
+        mask_image.save(mask_bytes, format='PNG')
+        mask_image_encoded = base64.b64encode(mask_bytes.getvalue()).decode('utf8')
+    else:
+        mask_image_encoded = None
+
+    if not mask_prompt and not mask_image:
+        raise ValueError("You must specify either maskPrompt or maskImage.")
+
+    # Prepare the outPaintingParams dictionary
+    out_painting_params = {
+        "image": input_image,
+        "outPaintingMode": outpainting_mode,
+        "maskPrompt": mask_prompt or ""  # Ensure maskPrompt is always included
+    }
+
+    # Conditionally add parameters if they are not None
+    if mask_image_encoded:
+        out_painting_params["maskImage"] = mask_image_encoded
+    if text:
+        out_painting_params["text"] = text
+    if negative_text:
+        out_painting_params["negativeText"] = negative_text
+
     body = json.dumps({
         "taskType": "OUTPAINTING",
-        "outPaintingParams": {"text": text, "image": input_image, "maskImage": input_mask_image, "outPaintingMode": "DEFAULT"},
-        "imageGenerationConfig": {"numberOfImages": 1, "height": 512, "width": 512, "cfgScale": 8.0}
+        "outPaintingParams": out_painting_params,
+        "imageGenerationConfig": {
+            "numberOfImages": 1,
+            "height": height,
+            "width": width,
+            "quality": quality,
+            "cfgScale": cfg_scale,
+            "seed": seed
+        }
     })
     image_bytes = generate_image(body)
     return display_image(image_bytes)
 
-def image_variation(image, text):
-    input_image = base64.b64encode(image.read()).decode('utf8')
+def image_variation(images, text=None, negative_text=None, similarity_strength=0.5, height=1024, width=1024, quality="standard", cfg_scale=8.0, seed=0):
+    encoded_images = []
+    for image_path in images:
+        with open(image_path, "rb") as image_file:
+            encoded_images.append(process_and_encode_image(image_file))
+
+    # Prepare the imageVariationParams dictionary
+    image_variation_params = {
+        "images": encoded_images,
+        "similarityStrength": similarity_strength
+    }
+
+    # Conditionally add parameters if they are not None
+    if text:
+        image_variation_params["text"] = text
+    if negative_text:
+        image_variation_params["negativeText"] = negative_text
+
     body = json.dumps({
         "taskType": "IMAGE_VARIATION",
-        "imageVariationParams": {"text": text, "images": [input_image], "similarityStrength": 0.7},
-        "imageGenerationConfig": {"numberOfImages": 1, "height": 512, "width": 512, "cfgScale": 8.0}
+        "imageVariationParams": image_variation_params,
+        "imageGenerationConfig": {
+            "numberOfImages": 1,
+            "height": height,
+            "width": width,
+            "quality": quality,
+            "cfgScale": cfg_scale,
+            "seed": seed
+        }
     })
     image_bytes = generate_image(body)
     return display_image(image_bytes)
 
-def image_conditioning(image, text):
-    input_image = base64.b64encode(image.read()).decode('utf8')
+def image_conditioning(condition_image, text, negative_text=None, control_mode="CANNY_EDGE", control_strength=0.7, height=1024, width=1024, quality="standard", cfg_scale=8.0, seed=0):
+    if condition_image is not None:
+        condition_image_encoded = process_and_encode_image(condition_image)
+    else:
+        raise ValueError("Input image is required.")
+
+    # Prepare the textToImageParams dictionary
+    text_to_image_params = {
+        "text": text,
+        "conditionImage": condition_image_encoded,
+        "controlMode": control_mode,
+        "controlStrength": control_strength
+    }
+
+    # Conditionally add negativeText if it is not None
+    if negative_text:
+        text_to_image_params["negativeText"] = negative_text
+
     body = json.dumps({
         "taskType": "TEXT_IMAGE",
-        "textToImageParams": {"text": text, "conditionImage": input_image, "controlMode": "CANNY_EDGE"},
-        "imageGenerationConfig": {"numberOfImages": 1, "height": 512, "width": 512, "cfgScale": 8.0}
+        "textToImageParams": text_to_image_params,
+        "imageGenerationConfig": {
+            "numberOfImages": 1,
+            "height": height,
+            "width": width,
+            "quality": quality,
+            "cfgScale": cfg_scale,
+            "seed": seed
+        }
     })
     image_bytes = generate_image(body)
     return display_image(image_bytes)
 
-def color_guided_content(image, text, colors):
-    input_image = base64.b64encode(image.read()).decode('utf8')
+def color_guided_content(text=None, reference_image=None, negative_text=None, colors=None, height=1024, width=1024, quality="standard", cfg_scale=8.0, seed=0):
+    # Encode the reference image if provided
+    if reference_image is not None:
+        reference_image_encoded = process_and_encode_image(reference_image)
+    else:
+        reference_image_encoded = None
+    if not colors:
+        colors = "#FF5733,#33FF57,#3357FF,#FF33A1,#33FFF5,#FF8C33,#8C33FF,#33FF8C,#FF3333,#33A1FF"
+    # Prepare the colorGuidedGenerationParams dictionary
+    color_guided_generation_params = {
+        "text": text,
+        "colors": colors.split(',')
+    }
+
+    # Conditionally add parameters if they are not None
+    if negative_text:
+        color_guided_generation_params["negativeText"] = negative_text
+    if reference_image_encoded:
+        color_guided_generation_params["referenceImage"] = reference_image_encoded
+
     body = json.dumps({
         "taskType": "COLOR_GUIDED_GENERATION",
-        "colorGuidedGenerationParams": {"text": text, "referenceImage": input_image, "colors": colors},
-        "imageGenerationConfig": {"numberOfImages": 1, "height": 512, "width": 512, "cfgScale": 8.0}
+        "colorGuidedGenerationParams": color_guided_generation_params,
+        "imageGenerationConfig": {
+            "numberOfImages": 1,
+            "height": height,
+            "width": width,
+            "quality": quality,
+            "cfgScale": cfg_scale,
+            "seed": seed
+        }
     })
     image_bytes = generate_image(body)
     return display_image(image_bytes)
 
 def background_removal(image):
-    input_image = base64.b64encode(image.read()).decode('utf8')
+    input_image = process_and_encode_image(image)
     body = json.dumps({
         "taskType": "BACKGROUND_REMOVAL",
         "backgroundRemovalParams": {"image": input_image}
@@ -115,60 +348,153 @@ def background_removal(image):
 
 # Gradio Interface
 with gr.Blocks() as demo:
+    gr.HTML("""
+    <style>
+    #component-0 {
+        max-width: 800px;
+        margin: 0 auto;
+    }
+    </style>
+    """)
     gr.Markdown("# Amazon Nova Canvas Image Generation")
 
     with gr.Tab("Text to Image"):
         with gr.Column():
             gr.Markdown("Generate an image from a text prompt using the Amazon Nova Canvas model.")
-            prompt = gr.Textbox(label="Prompt")
+            prompt = gr.Textbox(label="Prompt", placeholder="Enter a text prompt (1-1024 characters)", max_lines=1)
             output = gr.Image()
-            gr.Button("Generate").click(text_to_image, inputs=prompt, outputs=output)
+            with gr.Accordion("Advanced Options", open=False):
+                negative_text = gr.Textbox(label="Negative Prompt", placeholder="Enter text to exclude (1-1024 characters)", max_lines=1)
+                height = gr.Slider(minimum=256, maximum=2048, step=64, value=1024, label="Height")
+                width = gr.Slider(minimum=256, maximum=2048, step=64, value=1024, label="Width")
+                quality = gr.Radio(choices=["standard", "premium"], value="standard", label="Quality")
+                cfg_scale = gr.Slider(minimum=1.0, maximum=20.0, step=0.1, value=8.0, label="CFG Scale")
+                seed = gr.Slider(minimum=1, maximum=2000, step=1, value=8, label="Seed")
+
+            gr.Button("Generate").click(text_to_image, inputs=[prompt, negative_text, height, width, quality, cfg_scale, seed], outputs=output)
 
     with gr.Tab("Inpainting"):
         with gr.Column():
-            gr.Markdown("Use inpainting to modify specific areas of an image based on a text prompt.")
+            gr.Markdown("""
+            <div style="text-align: center;">
+            Modify specific areas of your image using inpainting. Upload your image and choose one of two ways to specify the areas you want to edit:
+            You can use a photo editing tool to draw masks (using pure black for areas to edit and pure white for areas to preserve) or use the Mask Prompt field to allow the model to infer the mask.
+            </div>
+            """)
             image = gr.Image(type='pil', label="Input Image")
-            mask_prompt = gr.Textbox(label="Mask Prompt")
+            mask_prompt = gr.Textbox(label="Mask Prompt", placeholder="Describe regions to edit", max_lines=1)
+            with gr.Accordion("Mask Image", open=False):
+                text = gr.Textbox(label="Text", placeholder="Describe what to generate (1-1024 characters)", max_lines=1)
+                mask_image = gr.Image(type='pil', label="Mask Image")
            output = gr.Image()
-            gr.Button("Generate").click(inpainting, inputs=[image, mask_prompt], outputs=output)
+            with gr.Accordion("Advanced Options", open=False):
+                negative_text = gr.Textbox(label="Negative Prompt", placeholder="Describe what not to include (1-1024 characters)", max_lines=1)
+                width = gr.Slider(minimum=256, maximum=2048, step=64, value=1024, label="Width")
+                height = gr.Slider(minimum=256, maximum=2048, step=64, value=1024, label="Height")
+                quality = gr.Radio(choices=["standard", "premium"], value="standard", label="Quality")
+                cfg_scale = gr.Slider(minimum=1.0, maximum=20.0, step=0.1, value=8.0, label="CFG Scale")
+                seed = gr.Slider(minimum=1, maximum=2000, step=1, value=8, label="Seed")
+
+            gr.Button("Generate").click(inpainting, inputs=[image, mask_prompt, mask_image, text, negative_text, height, width, quality, cfg_scale, seed], outputs=output)
 
     with gr.Tab("Outpainting"):
         with gr.Column():
             gr.Markdown("Extend an image beyond its original borders using a mask and text prompt.")
+            gr.Markdown("""
+            <div style="text-align: center;">
+            Modify areas outside of your image using outpainting. Upload your image and choose one of two ways to specify the areas you want to edit:
+            You can use a photo editing tool to draw masks extended outside of an images original borders (using pure black for areas to edit and pure
+            white for areas to preserve) or use the Mask Prompt field to allow the model to infer the mask.
+            </div>
+            """)
            image = gr.Image(type='pil', label="Input Image")
-            mask_image = gr.Image(type='pil', label="Mask Image")
-            text = gr.Textbox(label="Text")
+            mask_prompt = gr.Textbox(label="Mask Prompt", placeholder="Describe regions to edit", max_lines=1)
+            with gr.Accordion("Mask Image", open=False):
+                text = gr.Textbox(label="Text", placeholder="Describe what to generate (1-1024 characters)", max_lines=1)
+                mask_image = gr.Image(type='pil', label="Mask Image")
            output = gr.Image()
-            gr.Button("Generate").click(outpainting, inputs=[image, mask_image, text], outputs=output)
+            with gr.Accordion("Advanced Options", open=False):
+                negative_text = gr.Textbox(label="Negative Prompt", placeholder="Describe what not to include (1-1024 characters)", max_lines=1)
+                outpainting_mode = gr.Radio(choices=["DEFAULT", "PRECISE"], value="DEFAULT", label="Outpainting Mode")
+                width = gr.Slider(minimum=256, maximum=2048, step=64, value=1024, label="Width")
+                height = gr.Slider(minimum=256, maximum=2048, step=64, value=1024, label="Height")
+                quality = gr.Radio(choices=["standard", "premium"], value="standard", label="Quality")
+                cfg_scale = gr.Slider(minimum=1.0, maximum=20.0, step=0.1, value=8.0, label="CFG Scale")
+                seed = gr.Slider(minimum=1, maximum=2000, step=1, value=8, label="Seed")
+
+            gr.Button("Generate").click(outpainting, inputs=[image, mask_prompt, mask_image, text, negative_text, outpainting_mode, height, width, quality, cfg_scale, seed], outputs=output)
 
     with gr.Tab("Image Variation"):
         with gr.Column():
-            gr.Markdown("Create variations of an image based on a text description.")
-            image = gr.Image(type='pil', label="Input Image")
-            text = gr.Textbox(label="Text")
+            gr.Markdown("""
+            <div style="text-align: center;">
+            Create a variation image based on up to 5 other images and a text description (optional).
+            </div>
+            """)
+            images = gr.File(type='filepath', label="Input Images", file_count="multiple", file_types=["image"])
+            text = gr.Textbox(label="Text", placeholder="Enter a text prompt (1-1024 characters)", max_lines=1)
            output = gr.Image()
-            gr.Button("Generate").click(image_variation, inputs=[image, text], outputs=output)
+            with gr.Accordion("Advanced Options", open=False):
+                negative_text = gr.Textbox(label="Negative Prompt", placeholder="Enter text to exclude (1-1024 characters)", max_lines=1)
+                similarity_strength = gr.Slider(minimum=0.2, maximum=1.0, step=0.1, value=0.7, label="Similarity Strength")
+                width = gr.Slider(minimum=256, maximum=2048, step=64, value=1024, label="Width")
+                height = gr.Slider(minimum=256, maximum=2048, step=64, value=1024, label="Height")
+                quality = gr.Radio(choices=["standard", "premium"], value="standard", label="Quality")
+                cfg_scale = gr.Slider(minimum=1.0, maximum=20.0, step=0.1, value=8.0, label="CFG Scale")
+                seed = gr.Slider(minimum=1, maximum=2000, step=1, value=8, label="Seed")
+
+            gr.Button("Generate").click(image_variation, inputs=[images, text, negative_text, similarity_strength, height, width, quality, cfg_scale, seed], outputs=output)
 
     with gr.Tab("Image Conditioning"):
         with gr.Column():
-            gr.Markdown("Generate an image conditioned on an input image and a text prompt.")
-            image = gr.Image(type='pil', label="Input Image")
-            text = gr.Textbox(label="Text")
+            gr.Markdown("""
+            <div style="text-align: center;">
+            Generate an image conditioned on an input image and a text prompt (required).
+            </div>
+            """)
+            condition_image = gr.Image(type='pil', label="Condition Image")
+            text = gr.Textbox(label="Text", placeholder="Enter a text prompt (1-1024 characters)", max_lines=1)
            output = gr.Image()
-            gr.Button("Generate").click(image_conditioning, inputs=[image, text], outputs=output)
+            with gr.Accordion("Advanced Options", open=False):
+                negative_text = gr.Textbox(label="Negative Prompt", placeholder="Describe what not to include (1-1024 characters)", max_lines=1)
+                control_mode = gr.Radio(choices=["CANNY_EDGE", "SEGMENTATION"], value="CANNY_EDGE", label="Control Mode")
+                control_strength = gr.Slider(minimum=0.0, maximum=1.0, step=0.1, value=0.7, label="Control Strength")
+                width = gr.Slider(minimum=256, maximum=2048, step=64, value=1024, label="Width")
+                height = gr.Slider(minimum=256, maximum=2048, step=64, value=1024, label="Height")
+                quality = gr.Radio(choices=["standard", "premium"], value="standard", label="Quality")
+                cfg_scale = gr.Slider(minimum=1.0, maximum=20.0, step=0.1, value=8.0, label="CFG Scale")
+                seed = gr.Slider(minimum=1, maximum=2000, step=1, value=8, label="Seed")
+
+            gr.Button("Generate").click(image_conditioning, inputs=[condition_image, text, negative_text, control_mode, control_strength, height, width, quality, cfg_scale, seed], outputs=output)
 
     with gr.Tab("Color Guided Content"):
         with gr.Column():
-            gr.Markdown("Generate an image using a color palette from a reference image and a text prompt.")
-            image = gr.Image(type='pil', label="Input Image")
-            text = gr.Textbox(label="Text")
-            colors = gr.Textbox(label="Colors (comma-separated hex values)")
+            gr.Markdown("""
+            <div style="text-align: center;">
+            Generate an image using a color palette from a reference image or a text prompt. Starter colors are provided.
+            </div>
+            """)
+            reference_image = gr.Image(type='pil', label="Reference Image")
+            colors = gr.Textbox(label="Colors", placeholder="Enter up to 10 colors as hex values, e.g., #00FF00,#FCF2AB", max_lines=1)
+            text = gr.Textbox(label="Text", placeholder="Enter a text prompt (1-1024 characters)", max_lines=1)
            output = gr.Image()
-            gr.Button("Generate").click(color_guided_content, inputs=[image, text, colors], outputs=output)
+            with gr.Accordion("Advanced Options", open=False):
+                negative_text = gr.Textbox(label="Negative Prompt", placeholder="Enter text to exclude (1-1024 characters)", max_lines=1)
+                width = gr.Slider(minimum=256, maximum=2048, step=64, value=1024, label="Width")
+                height = gr.Slider(minimum=256, maximum=2048, step=64, value=1024, label="Height")
+                quality = gr.Radio(choices=["standard", "premium"], value="standard", label="Quality")
+                cfg_scale = gr.Slider(minimum=1.0, maximum=20.0, step=0.1, value=8.0, label="CFG Scale")
+                seed = gr.Slider(minimum=1, maximum=2000, step=1, value=8, label="Seed")
+
+            gr.Button("Generate").click(color_guided_content, inputs=[text, reference_image, negative_text, colors, height, width, quality, cfg_scale, seed], outputs=output)
 
     with gr.Tab("Background Removal"):
         with gr.Column():
-            gr.Markdown("Remove the background from an image.")
+            gr.Markdown("""
+            <div style="text-align: center;">
+            Remove the background from an image.
+            </div>
+            """)
            image = gr.Image(type='pil', label="Input Image")
            output = gr.Image()
            gr.Button("Generate").click(background_removal, inputs=image, outputs=output)
requirements.txt CHANGED
@@ -1,3 +1,2 @@
-spaces
-gradio
+Pillow
 boto3