Spaces:

VikramSingh178
/

picpilot-server

Paused

App Files Files Community

VikramSingh178 committed on May 26

Commit

88e9206

•

1 Parent(s): a76141d

refactor: Update import statement for accelerator and image augmentation functionality

Browse files

Files changed (2) hide show

scripts/__pycache__/config.cpython-312.pyc +0 -0
scripts/utils.py +43 -19

scripts/__pycache__/config.cpython-312.pyc ADDED Viewed

Binary file (3.22 kB). View file

scripts/utils.py CHANGED Viewed

@@ -1,8 +1,8 @@
 import torch
 from ultralytics import YOLO
-from transformers import SamModel,SamProcessor
 import numpy as np
-from PIL import Image
 from config import SEGMENTATION_MODEL_NAME
@@ -14,15 +14,14 @@ def accelerator():
         str: The name of the device accelerator ('cuda', 'mps', or 'cpu').
     """
     if torch.cuda.is_available():
-        device = 'cuda'
     elif torch.backends.mps.is_available():
-        device = 'mps'
     else:
-        device = 'cpu'
     return device
 class ImageAugmentation:
     """
     Class for centering an image on a white background using ROI.
@@ -54,7 +53,10 @@ class ImageAugmentation:
         w, h = self.background_size
         bg = np.ones((h, w, 3), dtype=np.uint8) * 255  # White background
         x, y, roi_w, roi_h = roi
-        bg[(h - roi_h) // 2:(h - roi_h) // 2 + roi_h, (w - roi_w) // 2:(w - roi_w) // 2 + roi_w] = image
         return bg
     def detect_region_of_interest(self, image):
@@ -69,11 +71,12 @@ class ImageAugmentation:
         """
         # Convert image to grayscale
         grayscale_image = np.array(Image.fromarray(image).convert("L"))
         # Calculate bounding box of non-zero region
         bbox = Image.fromarray(grayscale_image).getbbox()
         return bbox
 def generate_bbox(image):
     """
     Generate bounding box for the input image.
@@ -85,17 +88,39 @@ def generate_bbox(image):
         list: Bounding boxes, one [x_min, y_min, x_max, y_max] list of ints per detection.
     """
     # Load YOLOv8 model
-    model = YOLO("yolov8s.pt")
     results = model(image)
     # Get bounding box coordinates
     bbox = results[0].boxes.xyxy.int().tolist()
     return bbox
-def generate_mask():
-    model = SamModel.from_pretrained("SEGMENTATION_MODEL_NAMEz")
-    processor = SamProcessor.from_pretrained("SEGMENTATION_MODEL_NAME")
 if __name__ == "__main__":
@@ -104,8 +129,7 @@ if __name__ == "__main__":
     image = np.array(Image.open(image_path).convert("RGB"))
     roi = augmenter.detect_region_of_interest(image)
     centered_image = augmenter.center_image_on_background(image, roi)
-    bbox = generate_bbox(centered_image)
-    print(bbox)

 import torch
 from ultralytics import YOLO
+from transformers import SamModel, SamProcessor
 import numpy as np
+from PIL import Image
 from config import SEGMENTATION_MODEL_NAME
         str: The name of the device accelerator ('cuda', 'mps', or 'cpu').
     """
     if torch.cuda.is_available():
+        device = "cuda"
     elif torch.backends.mps.is_available():
+        device = "mps"
     else:
+        device = "cpu"
     return device
 class ImageAugmentation:
     """
     Class for centering an image on a white background using ROI.
         w, h = self.background_size
         bg = np.ones((h, w, 3), dtype=np.uint8) * 255  # White background
         x, y, roi_w, roi_h = roi
+        bg[
+            (h - roi_h) // 2 : (h - roi_h) // 2 + roi_h,
+            (w - roi_w) // 2 : (w - roi_w) // 2 + roi_w,
+        ] = image
         return bg
     def detect_region_of_interest(self, image):
         """
         # Convert image to grayscale
         grayscale_image = np.array(Image.fromarray(image).convert("L"))
         # Calculate bounding box of non-zero region
         bbox = Image.fromarray(grayscale_image).getbbox()
         return bbox
 def generate_bbox(image):
     """
     Generate bounding box for the input image.
         list: Bounding boxes, one [x_min, y_min, x_max, y_max] list of ints per detection.
     """
     # Load YOLOv8 model
+    model = YOLO("../models/yolov8s.pt")
     results = model(image)
     # Get bounding box coordinates
     bbox = results[0].boxes.xyxy.int().tolist()
     return bbox
+def generate_mask(image):
+    """
+    Generates masks for the given image using a segmentation model.
+    Args:
+        image: The input image for which masks need to be generated.
+    Returns:
+        masks: A tensor containing the generated masks.
+    Raises:
+        None
+    """
+    model = SamModel.from_pretrained(SEGMENTATION_MODEL_NAME).to(device=accelerator())
+    processor = SamProcessor.from_pretrained(SEGMENTATION_MODEL_NAME)
+    inputs = processor(
+        image, input_boxes=[generate_bbox(image)], return_tensors="pt"
+    ).to(torch.float)
+    inputs.to(device=accelerator())
+    outputs = model(**inputs)
+    mask = processor.image_processor.post_process_masks(
+        outputs.pred_masks.cpu(),
+        inputs["original_sizes"].cpu(),
+        inputs["reshaped_input_sizes"].cpu(),
+    )
+    return mask
 if __name__ == "__main__":
     image = np.array(Image.open(image_path).convert("RGB"))
     roi = augmenter.detect_region_of_interest(image)
     centered_image = augmenter.center_image_on_background(image, roi)
+    masks = generate_mask(Image.fromarray(centered_image))
+    masks = np.array(masks)
+    mask_image = Image.fromarray(masks[0])
+    mask_image.save("mask.jpg")