zdou0830 committed on
Commit 4798672
1 Parent(s): 535364e
app.py CHANGED
@@ -85,8 +85,10 @@ gr.Interface(
         ),
     ],
     examples=[
-        ["./1.jpg", "a train besides sidewalk", "train;sidewalk"],
-        ["./2.jpg", "Bumblebee, yellow with black accents.", "Bumblebee"],
+        ["./1.jpg", "A clown making a balloon animal for a pretty lady.", "clown"],
+        ["./1.jpg", "A clown kicking a soccer ball for a pretty lady.", "clown"],
+        ["./2.jpg", "A kind of tool, wooden handle with a round head.", "tool"],
+        ["./3.jpg", "Bumblebee, yellow with black accents.", "Bumblebee"],
     ],
     article=Path("docs/intro.md").read_text()
 ).launch()
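For context on this hunk: each row in `examples` is matched positionally against the interface's `inputs`, so the three elements of a row fill the image, caption, and grounding-entity fields in order. A minimal sketch of that wiring, with a hypothetical `predict` standing in for the Space's real GLIP inference function:

```python
import gradio as gr

def predict(image, caption, entities):
    # hypothetical stand-in for the Space's GLIP inference call
    return f"caption={caption!r}, entities={entities!r}"

gr.Interface(
    fn=predict,
    # one example-row element per input component, in the same order
    inputs=[
        gr.Image(type="filepath"),
        gr.Textbox(label="Caption"),
        gr.Textbox(label="Entities"),
    ],
    outputs=gr.Textbox(),
    examples=[
        ["./1.jpg", "A clown making a balloon animal for a pretty lady.", "clown"],
    ],
).launch()
```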
maskrcnn_benchmark/engine/predictor_glip.py CHANGED
@@ -16,6 +16,7 @@ from maskrcnn_benchmark.structures.bounding_box import BoxList
 from maskrcnn_benchmark import layers as L
 from maskrcnn_benchmark.modeling.roi_heads.mask_head.inference import Masker
 from maskrcnn_benchmark.utils import cv2_util
+from PIL import Image
 
 engine = inflect.engine()
 nltk.download("punkt")
@@ -146,6 +147,13 @@ class GLIPDemo(object):
         top_predictions = self._post_process(predictions, thresh)
 
         result = original_image.copy()
+        def resize_image_by_height(img, new_height=500):
+            width, height = img.size
+            aspect_ratio = width / height
+            new_width = int(new_height * aspect_ratio)
+            resized_img = img.resize((new_width, new_height), Image.LANCZOS)
+            return resized_img
+        result = resize_image_by_height(result)
         if self.show_mask_heatmaps:
             return self.create_mask_montage(result, top_predictions)
 
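One caveat worth flagging on this hunk: `resize_image_by_height` calls `.size` and `.resize`, which are `PIL.Image` methods, so it assumes `result` is a PIL image rather than the numpy BGR array that `cv2` produces. A hedged sketch of the equivalent helper for the array case (hypothetical name, assuming `cv2` is importable):

```python
import cv2

def resize_array_by_height(img, new_height=500):
    # numpy image arrays are indexed (rows, cols, channels), i.e. (height, width, ...)
    height, width = img.shape[:2]
    new_width = int(new_height * width / height)
    # INTER_AREA is a reasonable default filter when shrinking
    return cv2.resize(img, (new_width, new_height), interpolation=cv2.INTER_AREA)
```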
@@ -261,6 +269,7 @@ class GLIPDemo(object):
         for box, color in zip(boxes, colors):
             box = box.to(torch.int64)
             top_left, bottom_right = box[:2].tolist(), box[2:].tolist()
+            new_image = cv2.rectangle(new_image, tuple(top_left), tuple(bottom_right), (255, 255, 255), box_pixel + 3)
             new_image = cv2.rectangle(new_image, tuple(top_left), tuple(bottom_right), tuple(color) if override_color is None else tuple(override_color), box_pixel)
 
         image = cv2.addWeighted(new_image, box_alpha, image, 1 - box_alpha, 0)
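The draw order in this hunk is what produces the outline effect: the thicker white rectangle goes down first, and the thinner colored rectangle is painted over its middle, leaving a thin white rim on both sides of each box edge. A self-contained toy demo of the same trick:

```python
import numpy as np
import cv2

canvas = np.zeros((200, 200, 3), dtype=np.uint8)
top_left, bottom_right = (40, 40), (160, 160)
box_pixel = 2

# thicker white rectangle first...
cv2.rectangle(canvas, top_left, bottom_right, (255, 255, 255), box_pixel + 3)
# ...then the thinner colored one on top, leaving a white rim around it
cv2.rectangle(canvas, top_left, bottom_right, (0, 200, 0), box_pixel)
```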
@@ -328,6 +337,12 @@ class GLIPDemo(object):
 
             if int(y) - text_offset_original < 20:
                 y += 50
+            label_size = cv2.getTextSize(s, cv2.FONT_HERSHEY_SIMPLEX, text_size, text_pixel)[0]
+            position = (int(x), int(y) - text_offset_original)
+            bottom_left_corner_of_text = (position[0], position[1] + label_size[1])
+            top_right_corner = (position[0] + label_size[0], position[1])
+
+            image[position[1]:bottom_left_corner_of_text[1], position[0]:top_right_corner[0]] = (255, 255, 255)
             cv2.putText(
                 image, s, (int(x), int(y)-text_offset_original),
                 cv2.FONT_HERSHEY_SIMPLEX, text_size,
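A geometry note on this background strip: `cv2.putText` treats its origin as the bottom-left corner of the string, so the glyphs occupy roughly the `label_size[1]` pixels above `position`, while the slice above paints the strip below that point. A small standalone sketch (toy values, not the demo's) of a strip that lands behind the glyphs themselves:

```python
import numpy as np
import cv2

image = np.zeros((100, 300, 3), dtype=np.uint8)
s, font_scale, thickness = "clown", 0.8, 1
x, y = 10, 50  # (x, y) is the baseline-left corner used by cv2.putText

(w, h), baseline = cv2.getTextSize(s, cv2.FONT_HERSHEY_SIMPLEX, font_scale, thickness)
# paint the region the glyphs actually cover: h pixels above the baseline,
# plus `baseline` pixels below it for descenders
image[y - h:y + baseline, x:x + w] = (255, 255, 255)
cv2.putText(image, s, (x, y), cv2.FONT_HERSHEY_SIMPLEX, font_scale, (0, 0, 0), thickness)
```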
 