Added Style embeddings

- app.py +58 -29
- main_inference.py +5 -28
- requirements.txt +12 -8
- style_embeddings/3d_female_cyborgs.bin +0 -0
- style_embeddings/80s_anime.bin +0 -0
- style_embeddings/anders_zorn.bin +0 -0
- style_embeddings/angus_mcbride.bin +0 -0
- style_embeddings/breakcore.bin +0 -0
- style_embeddings/brittney_williams.bin +0 -0
- style_embeddings/buhu_art_style.bin +0 -0
- style_embeddings/bull_vs_bear.bin +0 -0
- style_embeddings/caitlin_fairchild.bin +0 -0
- style_embeddings/exodus_styling.bin +0 -0
- style_embeddings/foorbyv2.bin +0 -0
- style_embeddings/learned_embeds_arcane.bin +1 -0
- style_embeddings/loaded_style_empire.bin +0 -0
- style_embeddings/useembeddingname-neg.bin +0 -0
- style_embeddings/useembeddingname.bin +0 -0
- style_guidence.py +176 -0
app.py
CHANGED
@@ -1,34 +1,48 @@
 import gradio as gr
 from torchvision import transforms
 import torch
 from main_inference import generate_mixed_image, generate_image
+from style_guidence import generate_with_prompt_style
 import matplotlib.colors as mcolors
 
-def run_generate_mixed_image(prompt1,prompt2,noised_image):
-    image = generate_mixed_image(prompt1,prompt2,noised_image)
+
+style_file_maps = {
+    '3D Female Cyborgs':"style_embeddings/3d_female_cyborgs.bin",
+    '80s Anime':"style_embeddings/80s_anime.bin",
+    'Anders Zorn':"style_embeddings/anders_zorn.bin",
+    "Angus Mcbride":"style_embeddings/angus_mcbride.bin",
+    "Breakcore":"style_embeddings/breakcore.bin",
+    "Brittney Williams":"style_embeddings/brittney_williams.bin",
+    "Bull vs Bear":"style_embeddings/bull_vs_bear.bin",
+    "Caitlin FairChild":"style_embeddings/caitlin_fairchild.bin",
+    "Exodus Styling":"style_embeddings/exodus_styling.bin",
+    "FoorByv2":"style_embeddings/foorbyv2.bin"
+}
+
+def run_generate_mixed_image(prompt1,prompt2,num_of_inf_steps,noised_image):
+    image = generate_mixed_image(prompt1,prompt2,num_of_inf_steps,noised_image)
     return image
 
-def run_generate_image(prompt1,noise_checkbox):
-    image = generate_image(prompt1,noised_image=noise_checkbox)
+def run_generate_image(prompt1,num_of_inf_steps,noise_checkbox):
+    image = generate_image(prompt1,num_inference_steps=num_of_inf_steps,noised_image=noise_checkbox)
     return image
 
-def run_generate_image_with_color_doninance(prompt1,color,color_loss_scale,noised_image_checkbox_1):
+def run_generate_image_with_color_doninance(prompt1,color,color_loss_scale,num_of_inf_steps,noised_image_checkbox_1):
     # Convert the hexadecimal color code to RGB values
     rgba_color = mcolors.hex2color(color)
     # Multiply the RGB values by 255 to get them in the [0, 255] range
     rgb_values = [int(val * 255) for val in rgba_color]
-    image = generate_image(prompt1,True,rgb_values,color_loss_scale,noised_image_checkbox_1)
+    image = generate_image(prompt1,num_of_inf_steps,True,rgb_values,color_loss_scale,noised_image_checkbox_1)
     return image
-
-def run_progress_video(prompt1):
-    video = progress_video(prompt1)
-    return video
+
+def run_generate_image_with_style(prompt,style,num_of_inf_steps):
+    output = generate_with_prompt_style(prompt, style_file_maps[style],num_of_inf_steps)
+    return output
 
 
 description_text_to_image = """ ### Text to Image Generation
 
-1. Write a Text Prompt.
+1. Write a Text Prompt and the number of inference steps; more steps give better results but take longer to run.
 
 2. Output will be an image based on the text prompt provided.
 
@@ -38,7 +52,7 @@ description_text_to_image = """ ### Text to Image Generation
 
 description_generate_mixed_image = """ ### Mix Image Generation
 
-1. Write Two Text Prompts.
+1. Write two Text Prompts and the number of inference steps; more steps give better results but take longer to run.
 
 2. The output will be an image that mixes both of the prompts provided.
 
@@ -48,7 +62,7 @@ description_generate_mixed_image = """ ### Mix Image Generation
 
 description_generate_image_with_color_dominance = """ ### Generate Images with color dominance
 
-1. Write a Text Prompt.
+1. Write a Text Prompt and the number of inference steps; more steps give better results but take longer to run.
 
 2. Select a color
 
@@ -60,11 +74,13 @@ description_generate_image_with_color_dominance = """ ### Generate Images with c
 
 """
 
-
-1. Write a Text Prompt.
-
-2.
+description_generate_prompt_with_style = """ ### Generate an image in the style of your choice
+
+1. Write a Text Prompt and the number of inference steps; more steps give better results but take longer to run.
+
+2. Select a style to apply to the image
+
+3. Get the Output
 
 """
 
@@ -75,18 +91,26 @@ image_input1 = gr.Image(type='pil')
 image_input2 = gr.Image(type='filepath')
 image_input3 = gr.Image(type='pil')
 image_input4 = gr.Image(type='pil')
+image_input5 = gr.Image(type='pil')
 text_input = gr.Text(label="Enter Text Prompt")
 text_input2 = gr.Text(label="Enter Text Prompt")
 text_input3 = gr.Text(label="Enter Text Prompt")
 text_input4 = gr.Text(label = "Enter Text Prompt")
 text_input5 = gr.Text(label = "Enter Text Prompt")
-
+
+num_of_inf_steps_slider1 = gr.inputs.Slider(minimum=0, maximum=50, default=30, step=1,label="Num of Inference Steps")
+num_of_inf_steps_slider2 = gr.inputs.Slider(minimum=0, maximum=50, default=30, step=1,label="Num of Inference Steps")
+num_of_inf_steps_slider3 = gr.inputs.Slider(minimum=0, maximum=50, default=30, step=1,label="Num of Inference Steps")
+num_of_inf_steps_slider4 = gr.inputs.Slider(minimum=0, maximum=50, default=30, step=1,label="Num of Inference Steps")
 
 color = gr.ColorPicker(label="Select a Color",description="Choose a color from the color picker:")
 noised_image_checkbox = gr.inputs.Checkbox(default=False, label="Show Noised Image")
 noised_image_checkbox_1 = gr.inputs.Checkbox(default=False, label="Show Noised Image")
 noised_image_checkbox_2 = gr.inputs.Checkbox(default=False, label="Show Noised Image")
+noised_image_checkbox_3 = gr.inputs.Checkbox(default=False, label="Show Noised Image")
 color_loss_scale = gr.inputs.Slider(minimum=0, maximum=255, default=40, step=1,label="Color Loss")
+style_options = ['3D Female Cyborgs', '80s Anime', 'Anders Zorn', "Angus Mcbride", "Breakcore", "Brittney Williams", "Bull vs Bear", "Caitlin FairChild", "Exodus Styling", "FoorByv2"]
+selected_style = gr.Dropdown(style_options,label="Select a Style to Follow",default="Anders Zorn")
 css = "h1 { text-align: center } .about { text-align: justify; padding-left: 10%; padding-right: 10%; }"
 
 with gr.Blocks(css=css, title='Play with Stable Diffusion') as demo:
@@ -100,6 +124,7 @@ with gr.Blocks(css=css, title='Play with Stable Diffusion') as demo:
         with gr.Row(variant="panel"):
             with gr.Column(scale=1):
                 text_input.render()
+                num_of_inf_steps_slider1.render()
                 noised_image_checkbox.render()
             with gr.Column(scale=1):
                 image_input1.render()
@@ -118,7 +143,7 @@ with gr.Blocks(css=css, title='Play with Stable Diffusion') as demo:
        #              examples_per_page=4)
 
        run_generate_image_button.click(run_generate_image,
-                                        inputs=[text_input,noised_image_checkbox],
+                                        inputs=[text_input,num_of_inf_steps_slider1,noised_image_checkbox],
                                         outputs=image_input1)
 
    with gr.Tab("Generate Image with Color Dominance"):
@@ -127,6 +152,7 @@ with gr.Blocks(css=css, title='Play with Stable Diffusion') as demo:
            with gr.Column(scale=1):
                 text_input4.render()
                 color_loss_scale.render()
+                num_of_inf_steps_slider2.render()
                 noised_image_checkbox_1.render()
                 color.render()
            with gr.Column(scale=1):
@@ -146,7 +172,7 @@ with gr.Blocks(css=css, title='Play with Stable Diffusion') as demo:
        #              examples_per_page=4)
 
        run_generate_image_with_color_doninance_button.click(run_generate_image_with_color_doninance,
-                                        inputs=[text_input4,color,color_loss_scale,noised_image_checkbox_1],
+                                        inputs=[text_input4,color,color_loss_scale,num_of_inf_steps_slider2,noised_image_checkbox_1],
                                         outputs=image_input3)
 
    ####################################################################################################################
@@ -156,6 +182,7 @@ with gr.Blocks(css=css, title='Play with Stable Diffusion') as demo:
            with gr.Column(scale=1):
                 text_input2.render()
                 text_input3.render()
+                num_of_inf_steps_slider3.render()
                 noised_image_checkbox_2.render()
            with gr.Column(scale=1):
                 image_input4.render()
@@ -175,18 +202,20 @@ with gr.Blocks(css=css, title='Play with Stable Diffusion') as demo:
        #              examples_per_page=4)
 
        run_generate_mixed_image_button.click(run_generate_mixed_image,
-                                        inputs=[text_input2,text_input3,noised_image_checkbox_2],
+                                        inputs=[text_input2,text_input3,num_of_inf_steps_slider3,noised_image_checkbox_2],
                                         outputs=image_input4)
 
    ####################################################################################################################
-    with gr.Tab("
+    with gr.Tab("Generate Image with Style"):
    # Images
        with gr.Row(variant="panel"):
            with gr.Column(scale=1):
                 text_input5.render()
+                num_of_inf_steps_slider4.render()
+                selected_style.render()
 
            with gr.Column(scale=1):
-
+                image_input5.render()
 
        # Submit & Clear
        with gr.Row():
@@ -194,18 +223,18 @@ with gr.Blocks(css=css, title='Play with Stable Diffusion') as demo:
        run_progress_video_button = gr.Button("progress_video", variant='primary')
        clear_btn_progress_video = gr.Button("Clear", variant="secondary")
 
-        gr.Markdown(
+        gr.Markdown(description_generate_prompt_with_style)
        # gr.Examples(examples = ["examples/12830823_87d2654e31.jpg", "examples/27782020_4dab210360.jpg", "examples/44129946_9eeb385d77.jpg"],
        #             inputs=[text_input5],
-        #             outputs=
+        #             outputs=image_input5,
        #             fn=run_process_video,
        #             examples_per_page=4)
 
-        run_progress_video_button.click(
+        run_progress_video_button.click(run_generate_image_with_style,
                                inputs=[
-                                    text_input5,
+                                    text_input5,selected_style,num_of_inf_steps_slider4
                                ],
-                                outputs=
+                                outputs=image_input5)
 
    #######################################################################################################################
    #######################################################################################################################
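For orientation, a minimal sketch of what the new style tab wires together: the dropdown label is resolved through style_file_maps to an embedding file, which generate_with_prompt_style then applies. The prompt, label, and step count below are illustrative inputs, not values from the commit.

    from style_guidence import generate_with_prompt_style

    # Subset of the app's style_file_maps; label and prompt are illustrative.
    style_file_maps = {'Anders Zorn': "style_embeddings/anders_zorn.bin"}

    image = generate_with_prompt_style(
        "A lighthouse at dusk",          # prompt typed into text_input5
        style_file_maps["Anders Zorn"],  # embedding path resolved from the dropdown label
        30,                              # num_of_inf_steps from the slider
    )
    image.save("styled_output.png")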
main_inference.py
CHANGED
@@ -10,8 +10,6 @@ from torchvision import transforms as tfms
 import shutil
 # For video display:
 import cv2
-from IPython.display import HTML
-from base64 import b64encode
 import os
 from utils import color_loss,latents_to_pil,pil_to_latent,sketch_loss
 # Set device
@@ -34,11 +32,11 @@ unet = unet.to(torch_device)
 
 scheduler.set_timesteps(15)
 
-def generate_mixed_image(prompt1, prompt2,noised_image=False):
+def generate_mixed_image(prompt1, prompt2,num_inference_steps=50,noised_image=False):
     mix_factor = 0.4 #@param
     height = 512 # default height of Stable Diffusion
     width = 512 # default width of Stable Diffusion
-    num_inference_steps =
+    num_inference_steps = num_inference_steps #@param # Number of denoising steps
     guidance_scale = 8 # Scale for classifier-free guidance
     generator = torch.manual_seed(32) # Seed generator to create the initial latent noise
     batch_size = 1
@@ -100,12 +98,12 @@ def generate_mixed_image(prompt1, prompt2,noised_image=False):
 
     return output
 
-def generate_image(prompt,color_postprocessing=False,postporcessing_color=None,color_loss_scale=40,noised_image=False):
+def generate_image(prompt,num_inference_steps=50,color_postprocessing=False,postporcessing_color=None,color_loss_scale=40,noised_image=False):
     #@title Store the predicted outputs and next frame for later viewing
     #prompt = 'A campfire (oil on canvas)' #
     height = 512 # default height of Stable Diffusion
     width = 512 # default width of Stable Diffusion
-    num_inference_steps =
+    num_inference_steps = num_inference_steps # Number of denoising steps
     guidance_scale = 8 # Scale for classifier-free guidance
     generator = torch.manual_seed(32) # Seed generator to create the initial latent noise
     batch_size = 1
@@ -210,26 +208,6 @@ def generate_image(prompt,color_postprocessing=False,postporcessing_color=None,c
 
     return output
 
-def progress_video(prompt):
-    pil_image = generate_image(prompt)
-    # Generate a list of image file paths (replace with your own logic)
-    num_frames = len(os.listdir("steps/"))
-    image_files = [f"steps/{i:04d}.jpeg" for i in range(1, num_frames + 1)]
-    # Read the first image to get its size (assuming all images have the same size)
-    first_image = cv2.imread(image_files[0])
-    height, width, _ = first_image.shape
-
-    # Define the output video writer
-    fourcc = cv2.VideoWriter_fourcc(*'mp4v') # Codec for MP4
-    out = cv2.VideoWriter('out.mp4', fourcc, 12, (width, height))
-
-    for image_file in image_files:
-        frame = cv2.imread(image_file)
-        out.write(frame)
-
-    out.release()
-    return "out.mp4"
-
 def generate_noised_version_of_image(pil_image):
     # View a noised version
     encoded = pil_to_latent(pil_image,vae)
@@ -239,6 +217,7 @@ def generate_noised_version_of_image(pil_image):
     return latents_to_pil(encoded_and_noised,vae)[0] # Display
 
 
+
 # if __name__ == "__main__":
 #     prompt = 'A campfire (oil on canvas)'
 #     color_loss_scale = 40
@@ -248,5 +227,3 @@ def generate_noised_version_of_image(pil_image):
 #     #pil_image = generate_noised_version_of_image(Image.open('output.png').resize((512, 512)))
 #     pil_image.save("output1.png")
 
-if __name__ == "__main__":
-    progress_video("lol")
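A quick usage sketch of the updated signatures; the prompts and values here are illustrative, with keyword and positional order following the new definitions above.

    from main_inference import generate_image, generate_mixed_image

    # Text-to-image with the new steps argument.
    img = generate_image("A campfire (oil on canvas)", num_inference_steps=30)

    # Color-dominance path; positionals follow the new definition:
    # (prompt, num_inference_steps, color_postprocessing, postporcessing_color, color_loss_scale, noised_image)
    img2 = generate_image("A campfire (oil on canvas)", 30, True, [200, 40, 40], 40, False)

    # Mixing two prompts.
    img3 = generate_mixed_image("A golden retriever", "A grizzly bear", 30, False)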
requirements.txt
CHANGED
@@ -1,8 +1,12 @@
-
-
-
-
-
-
-
-
+diffusers==0.21.4
+gradio==3.49.0
+ipython==8.15.0
+matplotlib==3.8.0
+numpy==1.26.1
+opencv_python==4.8.1.78
+Pillow==10.1.0
+Pillow==10.1.0
+torch==2.1.0
+torchvision==0.16.0
+tqdm==4.66.1
+transformers==4.25.1
style_embeddings/3d_female_cyborgs.bin
ADDED
Binary file (3.82 kB)

style_embeddings/80s_anime.bin
ADDED
Binary file (3.82 kB)

style_embeddings/anders_zorn.bin
ADDED
Binary file (3.82 kB)

style_embeddings/angus_mcbride.bin
ADDED
Binary file (3.82 kB)

style_embeddings/breakcore.bin
ADDED
Binary file (3.82 kB)

style_embeddings/brittney_williams.bin
ADDED
Binary file (3.82 kB)

style_embeddings/buhu_art_style.bin
ADDED
Binary file (4.86 kB)

style_embeddings/bull_vs_bear.bin
ADDED
Binary file (3.82 kB)

style_embeddings/caitlin_fairchild.bin
ADDED
Binary file (3.82 kB)

style_embeddings/exodus_styling.bin
ADDED
Binary file (3.82 kB)

style_embeddings/foorbyv2.bin
ADDED
Binary file (3.82 kB)

style_embeddings/learned_embeds_arcane.bin
ADDED
@@ -0,0 +1 @@
+(one line of GitHub blob-page JSON for gupta1912/ERA-V1-Assignments S20/learned_embeds_arcane.bin: the web page was saved in place of the raw binary, so this file contains page markup, not a valid embedding)
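Because that file holds page JSON rather than a serialized tensor, torch.load will fail on it. A small check like the following (a hypothetical helper, not part of the commit) could flag such files before the app offers them as styles:

    import torch

    def is_valid_embedding(path):
        # A learned embedding loads as a dict mapping a token name to a tensor;
        # an accidentally saved web page fails to unpickle or has the wrong type.
        try:
            obj = torch.load(path, map_location="cpu")
        except Exception:
            return False
        return isinstance(obj, dict) and all(torch.is_tensor(v) for v in obj.values())

    print(is_valid_embedding("style_embeddings/learned_embeds_arcane.bin"))  # False for this file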
style_embeddings/loaded_style_empire.bin
ADDED
Binary file (10.6 kB)

style_embeddings/useembeddingname-neg.bin
ADDED
Binary file (3.95 kB)

style_embeddings/useembeddingname.bin
ADDED
Binary file (3.95 kB)
style_guidence.py
ADDED
@@ -0,0 +1,176 @@
+import torch
+from transformers import CLIPTextModel, CLIPTokenizer
+from diffusers import AutoencoderKL, UNet2DConditionModel, LMSDiscreteScheduler
+from tqdm.auto import tqdm
+from torch import autocast
+from PIL import Image
+from matplotlib import pyplot as plt
+import numpy
+from torchvision import transforms as tfms
+import shutil
+# For video display:
+import cv2
+from IPython.display import HTML
+from base64 import b64encode
+import os
+from utils import color_loss,pil_to_latent,sketch_loss
+# Set device
+torch_device = "cpu"
+
+vae = AutoencoderKL.from_pretrained("CompVis/stable-diffusion-v1-4", subfolder="vae")
+
+# Load the tokenizer and text encoder to tokenize and encode the text.
+tokenizer = CLIPTokenizer.from_pretrained("openai/clip-vit-large-patch14")
+text_encoder = CLIPTextModel.from_pretrained("openai/clip-vit-large-patch14")
+
+# The UNet model for generating the latents.
+unet = UNet2DConditionModel.from_pretrained("CompVis/stable-diffusion-v1-4", subfolder="unet")
+
+# The noise scheduler
+scheduler = LMSDiscreteScheduler(beta_start=0.00085, beta_end=0.012, beta_schedule="scaled_linear", num_train_timesteps=1000)
+vae = vae.to(torch_device)
+text_encoder = text_encoder.to(torch_device)
+unet = unet.to(torch_device)
+
+scheduler.set_timesteps(15)
+
+token_emb_layer = text_encoder.text_model.embeddings.token_embedding
+pos_emb_layer = text_encoder.text_model.embeddings.position_embedding
+
+position_ids = text_encoder.text_model.embeddings.position_ids[:, :77]
+position_embeddings = pos_emb_layer(position_ids)
+
+
+def get_output_embeds(input_embeddings):
+    # CLIP's text model uses a causal mask, so we prepare it here:
+    bsz, seq_len = input_embeddings.shape[:2]
+    causal_attention_mask = text_encoder.text_model._build_causal_attention_mask(bsz, seq_len, dtype=input_embeddings.dtype)
+
+    # Getting the output embeddings involves calling the model with output_hidden_states=True
+    # so that it doesn't just return the pooled final predictions:
+    encoder_outputs = text_encoder.text_model.encoder(
+        inputs_embeds=input_embeddings,
+        attention_mask=None, # We aren't using an attention mask so that can be None
+        causal_attention_mask=causal_attention_mask.to(torch_device),
+        output_attentions=None,
+        output_hidden_states=True, # We want the output embs not the final output
+        return_dict=None,
+    )
+
+    # We're interested in the output hidden state only
+    output = encoder_outputs[0]
+
+    # There is a final layer norm we need to pass these through
+    output = text_encoder.text_model.final_layer_norm(output)
+
+    # And now they're ready!
+    return output
+
+def set_timesteps(scheduler, num_inference_steps):
+    scheduler.set_timesteps(num_inference_steps)
+    scheduler.timesteps = scheduler.timesteps.to(torch.float32)
+
+# def latents_to_pil(latents):
+#     # batch of latents -> list of images
+#     latents = (1 / 0.18215) * latents
+#     with torch.no_grad():
+#         image = vae.decode(latents).sample
+#     image = (image / 2 + 0.5).clamp(0, 1)
+#     image = image.detach().cpu().permute(0, 2, 3, 1).numpy()
+#     images = (image * 255).round().astype("uint8")
+#     pil_images = [Image.fromarray(image) for image in images]
+#     return pil_images
+
+def latents_to_pil(latents):
+    # batch of latents -> list of images
+    latents = (1 / 0.18215) * latents
+    with torch.no_grad():
+        image = vae.decode(latents).sample
+    image = (image / 2 + 0.5).clamp(0, 1)
+    image = image.detach().cpu().permute(0, 2, 3, 1).numpy()
+    images = (image * 255).round().astype("uint8")
+    pil_images = [Image.fromarray(image) for image in images]
+    return pil_images
+
+
+def generate_with_embs(text_embeddings,text_input, seed,num_inference_steps):
+
+    height = 512 # default height of Stable Diffusion
+    width = 512 # default width of Stable Diffusion
+    num_inference_steps = num_inference_steps # Number of denoising steps
+    guidance_scale = 7.5 # Scale for classifier-free guidance
+    generator = torch.manual_seed(seed) # Seed generator to create the initial latent noise
+    batch_size = 1
+
+    max_length = text_input.input_ids.shape[-1]
+    uncond_input = tokenizer(
+        [""] * batch_size, padding="max_length", max_length=max_length, return_tensors="pt"
+    )
+    with torch.no_grad():
+        uncond_embeddings = text_encoder(uncond_input.input_ids.to(torch_device))[0]
+    text_embeddings = torch.cat([uncond_embeddings, text_embeddings])
+
+    # Prep Scheduler
+    set_timesteps(scheduler, num_inference_steps)
+
+    # Prep latents
+    latents = torch.randn(
+        (batch_size, unet.in_channels, height // 8, width // 8),
+        generator=generator,
+    )
+    latents = latents.to(torch_device)
+    # latents = latents * scheduler.init_noise_sigma
+    latents = latents * scheduler.sigmas[0] # Need to scale to match k
+
+    # Loop
+    for i, t in tqdm(enumerate(scheduler.timesteps), total=len(scheduler.timesteps)):
+        # expand the latents if we are doing classifier-free guidance to avoid doing two forward passes.
+        latent_model_input = torch.cat([latents] * 2)
+        sigma = scheduler.sigmas[i]
+        #latent_model_input = scheduler.scale_model_input(latent_model_input, t)
+        latent_model_input = latent_model_input / ((sigma**2 + 1) ** 0.5)
+        # predict the noise residual
+        with torch.no_grad():
+            noise_pred = unet(latent_model_input, t, encoder_hidden_states=text_embeddings)["sample"]
+
+        # perform guidance
+        noise_pred_uncond, noise_pred_text = noise_pred.chunk(2)
+        noise_pred = noise_pred_uncond + guidance_scale * (noise_pred_text - noise_pred_uncond)
+
+        # compute the previous noisy sample x_t -> x_t-1
+        #latents = scheduler.step(noise_pred, t, latents).prev_sample
+        latents = scheduler.step(noise_pred, i, latents)["prev_sample"]
+    return latents_to_pil(latents)[0]
+
+def generate_with_prompt_style(prompt, style, num_of_inf_steps=50,seed = 42):
+
+    prompt = prompt + ' in style of s'
+    embed = torch.load(style)
+    print("Keys",embed.keys())
+    text_input = tokenizer(prompt, padding="max_length", max_length=tokenizer.model_max_length, truncation=True, return_tensors="pt")
+    # for t in text_input['input_ids'][0][:20]: # We'll just look at the first few to save you from a wall of '<|endoftext|>'
+    #     print(t, tokenizer.decoder.get(int(t)))
+    input_ids = text_input.input_ids.to(torch_device)
+
+    token_embeddings = token_emb_layer(input_ids)
+    # The new embedding - our special style word
+    replacement_token_embedding = embed[list(embed.keys())[0]].to(torch_device)
+
+    # Insert this into the token embeddings (338 is the id the tokenizer gives the placeholder 's')
+    token_embeddings[0, torch.where(input_ids[0]==338)] = replacement_token_embedding.to(torch_device)
+
+    # Combine with pos embs
+    input_embeddings = token_embeddings + position_embeddings
+
+    # Feed through to get final output embs
+    modified_output_embeddings = get_output_embeds(input_embeddings)
+
+    # And generate an image with this:
+    return generate_with_embs(modified_output_embeddings, text_input, seed,num_of_inf_steps)
+
+
+# prompt = 'A man sipping wine wearing a spacesuit on the moon'
+# image = generate_with_prompt_style(prompt, '/home/deepanshudashora/Documents/Stable_Diffusion/caitlin_fairchild.bin')
+
+# image.save("output.png")
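To see what the token replacement in generate_with_prompt_style operates on, a small inspection sketch: it prints the embedding file's key and the token ids produced by the ' in style of s' suffix. The anders_zorn.bin path comes from this commit; the snippet itself is illustrative and not part of the repo.

    import torch
    from transformers import CLIPTokenizer

    tokenizer = CLIPTokenizer.from_pretrained("openai/clip-vit-large-patch14")

    # A textual-inversion file maps one placeholder name to a learned vector.
    embed = torch.load("style_embeddings/anders_zorn.bin")
    for name, vec in embed.items():
        print(name, tuple(vec.shape))

    # generate_with_prompt_style swaps the vector in wherever id 338 appears;
    # this shows which ids the style suffix actually tokenizes to.
    ids = tokenizer(" in style of s").input_ids
    print(list(zip(ids, tokenizer.convert_ids_to_tokens(ids))))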