VikramSingh178 committed

Commit e2ebd5a • 1 Parent(s): fa32203

chore: Update segmentation model to facebook/sam-vit-huge and adjust prompt and negative prompt for inpainting pipeline


Former-commit-id: b412e4a5cd45780b141847a85bdff7761bc9acc0 [formerly 43c409b17e48b30006ded8ee7797a4db47748837]
Former-commit-id: 7849cb5077ff5dde7887367b0b2eee19f1e96b91

Files changed (2)
  1. configs/inpainting.yaml +6 -6
  2. scripts/pipeline.py +8 -8
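
The headline change is the SAM checkpoint swap. As a reference sketch only (the repo itself resolves cfg.segmentation_model inside ImageAugmentation.generate_mask_from_bbox in utils), the new checkpoint loads through the standard transformers SAM classes:

from transformers import SamModel, SamProcessor

# Reference sketch, assuming the transformers SAM API; sam-vit-huge is the
# largest SAM variant, replacing the sam-vit-large checkpoint used before
# this commit.
model = SamModel.from_pretrained("facebook/sam-vit-huge")
processor = SamProcessor.from_pretrained("facebook/sam-vit-huge")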
configs/inpainting.yaml CHANGED

@@ -1,13 +1,13 @@
-segmentation_model : 'facebook/sam-vit-large'
+segmentation_model : 'facebook/sam-vit-huge'
 detection_model : 'yolov8l'
 model : 'kandinsky-community/kandinsky-2-2-decoder-inpaint'
 target_width : 1920
 target_height : 1080
-prompt : 'product is on the kitchen floor , ultrarealistic lighting , commercial, award , winning photography'
-negative_prompt : 'low resolution , bad resolution'
-roi_scale : 0.5
-strength : 0.7
+prompt : 'Award Winning Photography of product on a mountain used for camping'
+negative_prompt : 'low resolution , bad resolution, bad quality,bad Artifacts,Weird Artifacts , Poor Lighting'
+roi_scale : 0.6
+strength : 0.2
 guidance_scale : 7.5
-num_inference_steps : 600
+num_inference_steps : 800
 output_path : '../outputs'
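For orientation, here is a minimal sketch (not part of the commit) that loads this config with OmegaConf and checks the fields the commit changed; the relative path assumes it runs from scripts/, matching the paths used in pipeline.py:

from omegaconf import OmegaConf

# Load the updated config; the path is relative to scripts/, as in pipeline.py.
cfg = OmegaConf.load("../configs/inpainting.yaml")

# Values changed by this commit
assert cfg.segmentation_model == "facebook/sam-vit-huge"
assert cfg.roi_scale == 0.6
assert cfg.strength == 0.2
assert cfg.num_inference_steps == 800

print(OmegaConf.to_yaml(cfg))

Lowering strength to 0.2 keeps the output much closer to the source image; in diffusers img2img-style pipelines roughly strength × num_inference_steps denoising steps actually run, so the raised step count (800, up from 600) partly offsets the cut.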
scripts/pipeline.py CHANGED

@@ -3,11 +3,11 @@ from diffusers import AutoPipelineForInpainting
 from diffusers.utils import load_image
 from utils import (accelerator, ImageAugmentation, clear_memory)
 import hydra
-from omegaconf import OmegaConf, DictConfig
+from omegaconf import DictConfig
 from PIL import Image
 import lightning.pytorch as pl
-pl.seed_everything(42)
-generator = torch.Generator("cuda").manual_seed(92)
+pl.seed_everything(1234)
+
 
 class AutoPaintingPipeline:
     """
@@ -26,7 +26,7 @@ class AutoPaintingPipeline:
         self.image = load_image(image)
         self.mask_image = load_image(mask_image)
         self.pipeline.to(self.device)
-        self.pipeline.unet = torch.compile(self.pipeline.unet, mode="reduce-overhead", fullgraph=True)
+
 
 
     def run_inference(self, prompt: str, negative_prompt: str, num_inference_steps: int, strength: float, guidance_scale: float):
@@ -36,11 +36,11 @@ class AutoPaintingPipeline:
         Returns:
             Image: The output image after inpainting.
         """
-
+        clear_memory()
         image = load_image(self.image)
         mask_image = load_image(self.mask_image)
-        output = self.pipeline(prompt=prompt,negative_prompt=negative_prompt,image=image,mask_image=mask_image,num_inference_steps=num_inference_steps,strength=strength,guidance_scale =guidance_scale,height = 1472, width = 2560).images[0]
-        clear_memory()
+        output = self.pipeline(prompt=prompt,negative_prompt=negative_prompt,image=image,mask_image=mask_image,num_inference_steps=num_inference_steps,strength=strength,guidance_scale=guidance_scale,height = 1472, width = 2560).images[0]
+
         return output
@@ -54,7 +54,7 @@ def inference(cfg: DictConfig):
     """
     augmenter = ImageAugmentation(target_width=cfg.target_width, target_height=cfg.target_height, roi_scale=cfg.roi_scale)
     model_name = cfg.model
-    image_path = "../sample_data/example3.jpg"
+    image_path = "../sample_data/example5.jpg"
     image = Image.open(image_path)
     extended_image = augmenter.extend_image(image)
     mask_image = augmenter.generate_mask_from_bbox(extended_image, cfg.segmentation_model, cfg.detection_model)
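
Putting the changes together, here is a standalone sketch (not repo code) of the call run_inference now issues, filled in with the new config values; the mask path and output filename are placeholders, since in the repo the mask comes from ImageAugmentation.generate_mask_from_bbox:

import torch
from diffusers import AutoPipelineForInpainting
from diffusers.utils import load_image

# Same checkpoint the config names; fp16 on CUDA is a common choice here.
pipe = AutoPipelineForInpainting.from_pretrained(
    "kandinsky-community/kandinsky-2-2-decoder-inpaint",
    torch_dtype=torch.float16,
).to("cuda")

image = load_image("../sample_data/example5.jpg")
mask = load_image("mask.png")  # placeholder; generated by the repo's utils

result = pipe(
    prompt="Award Winning Photography of product on a mountain used for camping",
    negative_prompt="low resolution , bad resolution, bad quality,"
                    "bad Artifacts,Weird Artifacts , Poor Lighting",
    image=image,
    mask_image=mask,
    num_inference_steps=800,  # raised from 600 in this commit
    strength=0.2,             # lowered from 0.7
    guidance_scale=7.5,
    height=1472,
    width=2560,
).images[0]
result.save("../outputs/example5_inpainted.png")

Note also what the hunks remove: the torch.compile call on the UNet and the dedicated CUDA generator are gone, so reproducibility now rests on pl.seed_everything(1234) alone, and clear_memory() moves ahead of the pipeline call so accelerator memory is freed before the 2560×1472 generation rather than after it.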