CBNetV2 / patch
hysts's picture
hysts HF staff
Add files
3fe1151
raw
history blame
35.6 kB
diff --git a/configs/cbnet/cascade_rcnn_cbv2d1_r2_101_mdconv_fpn_20e_fp16_ms400-1400_giou_4conv1f_coco.py b/configs/cbnet/cascade_rcnn_cbv2d1_r2_101_mdconv_fpn_20e_fp16_ms400-1400_giou_4conv1f_coco.py
index 167d4379..7c0bd239 100644
--- a/configs/cbnet/cascade_rcnn_cbv2d1_r2_101_mdconv_fpn_20e_fp16_ms400-1400_giou_4conv1f_coco.py
+++ b/configs/cbnet/cascade_rcnn_cbv2d1_r2_101_mdconv_fpn_20e_fp16_ms400-1400_giou_4conv1f_coco.py
@@ -2,9 +2,9 @@ _base_ = '../res2net/cascade_rcnn_r2_101_fpn_20e_coco.py'
model = dict(
backbone=dict(
- type='CBRes2Net',
+ type='CBRes2Net',
cb_del_stages=1,
- cb_inplanes=[64, 256, 512, 1024, 2048],
+ cb_inplanes=[64, 256, 512, 1024, 2048],
dcn=dict(type='DCNv2', deform_groups=1, fallback_on_stride=False),
stage_with_dcn=(False, True, True, True)
),
@@ -28,7 +28,7 @@ model = dict(
target_stds=[0.1, 0.1, 0.2, 0.2]),
reg_class_agnostic=False,
reg_decoded_bbox=True,
- norm_cfg=dict(type='SyncBN', requires_grad=True),
+ norm_cfg=dict(type='BN', requires_grad=True),
loss_cls=dict(
type='CrossEntropyLoss', use_sigmoid=False, loss_weight=1.0),
loss_bbox=dict(type='GIoULoss', loss_weight=10.0)),
@@ -47,7 +47,7 @@ model = dict(
target_stds=[0.05, 0.05, 0.1, 0.1]),
reg_class_agnostic=False,
reg_decoded_bbox=True,
- norm_cfg=dict(type='SyncBN', requires_grad=True),
+ norm_cfg=dict(type='BN', requires_grad=True),
loss_cls=dict(
type='CrossEntropyLoss', use_sigmoid=False, loss_weight=1.0),
loss_bbox=dict(type='GIoULoss', loss_weight=10.0)),
@@ -66,7 +66,7 @@ model = dict(
target_stds=[0.033, 0.033, 0.067, 0.067]),
reg_class_agnostic=False,
reg_decoded_bbox=True,
- norm_cfg=dict(type='SyncBN', requires_grad=True),
+ norm_cfg=dict(type='BN', requires_grad=True),
loss_cls=dict(
type='CrossEntropyLoss', use_sigmoid=False, loss_weight=1.0),
loss_bbox=dict(type='GIoULoss', loss_weight=10.0))
diff --git a/configs/cbnet/htc_cbv2_swin_base_patch4_window7_mstrain_400-1400_giou_4conv1f_adamw_20e_coco.py b/configs/cbnet/htc_cbv2_swin_base_patch4_window7_mstrain_400-1400_giou_4conv1f_adamw_20e_coco.py
index 51edfd62..a7434c5d 100644
--- a/configs/cbnet/htc_cbv2_swin_base_patch4_window7_mstrain_400-1400_giou_4conv1f_adamw_20e_coco.py
+++ b/configs/cbnet/htc_cbv2_swin_base_patch4_window7_mstrain_400-1400_giou_4conv1f_adamw_20e_coco.py
@@ -18,7 +18,7 @@ model = dict(
target_stds=[0.1, 0.1, 0.2, 0.2]),
reg_class_agnostic=True,
reg_decoded_bbox=True,
- norm_cfg=dict(type='SyncBN', requires_grad=True),
+ norm_cfg=dict(type='BN', requires_grad=True),
loss_cls=dict(
type='CrossEntropyLoss', use_sigmoid=False, loss_weight=1.0),
loss_bbox=dict(type='GIoULoss', loss_weight=10.0)),
@@ -37,7 +37,7 @@ model = dict(
target_stds=[0.05, 0.05, 0.1, 0.1]),
reg_class_agnostic=True,
reg_decoded_bbox=True,
- norm_cfg=dict(type='SyncBN', requires_grad=True),
+ norm_cfg=dict(type='BN', requires_grad=True),
loss_cls=dict(
type='CrossEntropyLoss', use_sigmoid=False, loss_weight=1.0),
loss_bbox=dict(type='GIoULoss', loss_weight=10.0)),
@@ -56,7 +56,7 @@ model = dict(
target_stds=[0.033, 0.033, 0.067, 0.067]),
reg_class_agnostic=True,
reg_decoded_bbox=True,
- norm_cfg=dict(type='SyncBN', requires_grad=True),
+ norm_cfg=dict(type='BN', requires_grad=True),
loss_cls=dict(
type='CrossEntropyLoss', use_sigmoid=False, loss_weight=1.0),
loss_bbox=dict(type='GIoULoss', loss_weight=10.0))
diff --git a/mmdet/__init__.py b/mmdet/__init__.py
index 646ee84e..9e846286 100644
--- a/mmdet/__init__.py
+++ b/mmdet/__init__.py
@@ -20,9 +20,9 @@ mmcv_maximum_version = '1.4.0'
mmcv_version = digit_version(mmcv.__version__)
-assert (mmcv_version >= digit_version(mmcv_minimum_version)
- and mmcv_version <= digit_version(mmcv_maximum_version)), \
- f'MMCV=={mmcv.__version__} is used but incompatible. ' \
- f'Please install mmcv>={mmcv_minimum_version}, <={mmcv_maximum_version}.'
+#assert (mmcv_version >= digit_version(mmcv_minimum_version)
+# and mmcv_version <= digit_version(mmcv_maximum_version)), \
+# f'MMCV=={mmcv.__version__} is used but incompatible. ' \
+# f'Please install mmcv>={mmcv_minimum_version}, <={mmcv_maximum_version}.'
__all__ = ['__version__', 'short_version']
diff --git a/mmdet/core/mask/structures.py b/mmdet/core/mask/structures.py
index 6f5a62ae..a9d0ebb4 100644
--- a/mmdet/core/mask/structures.py
+++ b/mmdet/core/mask/structures.py
@@ -1,3 +1,4 @@
+# Copyright (c) OpenMMLab. All rights reserved.
from abc import ABCMeta, abstractmethod
import cv2
@@ -528,6 +529,21 @@ class BitmapMasks(BaseInstanceMasks):
self = cls(masks, height=height, width=width)
return self
+ def get_bboxes(self):
+ num_masks = len(self)
+ boxes = np.zeros((num_masks, 4), dtype=np.float32)
+ x_any = self.masks.any(axis=1)
+ y_any = self.masks.any(axis=2)
+ for idx in range(num_masks):
+ x = np.where(x_any[idx, :])[0]
+ y = np.where(y_any[idx, :])[0]
+ if len(x) > 0 and len(y) > 0:
+ # use +1 for x_max and y_max so that the right and bottom
+ # boundary of instance masks are fully included by the box
+ boxes[idx, :] = np.array([x[0], y[0], x[-1] + 1, y[-1] + 1],
+ dtype=np.float32)
+ return boxes
+
class PolygonMasks(BaseInstanceMasks):
"""This class represents masks in the form of polygons.
@@ -637,8 +653,8 @@ class PolygonMasks(BaseInstanceMasks):
resized_poly = []
for p in poly_per_obj:
p = p.copy()
- p[0::2] *= w_scale
- p[1::2] *= h_scale
+ p[0::2] = p[0::2] * w_scale
+ p[1::2] = p[1::2] * h_scale
resized_poly.append(p)
resized_masks.append(resized_poly)
resized_masks = PolygonMasks(resized_masks, *out_shape)
@@ -690,8 +706,8 @@ class PolygonMasks(BaseInstanceMasks):
for p in poly_per_obj:
# pycocotools will clip the boundary
p = p.copy()
- p[0::2] -= bbox[0]
- p[1::2] -= bbox[1]
+ p[0::2] = p[0::2] - bbox[0]
+ p[1::2] = p[1::2] - bbox[1]
cropped_poly_per_obj.append(p)
cropped_masks.append(cropped_poly_per_obj)
cropped_masks = PolygonMasks(cropped_masks, h, w)
@@ -736,12 +752,12 @@ class PolygonMasks(BaseInstanceMasks):
p = p.copy()
# crop
# pycocotools will clip the boundary
- p[0::2] -= bbox[0]
- p[1::2] -= bbox[1]
+ p[0::2] = p[0::2] - bbox[0]
+ p[1::2] = p[1::2] - bbox[1]
# resize
- p[0::2] *= w_scale
- p[1::2] *= h_scale
+ p[0::2] = p[0::2] * w_scale
+ p[1::2] = p[1::2] * h_scale
resized_mask.append(p)
resized_masks.append(resized_mask)
return PolygonMasks(resized_masks, *out_shape)
@@ -944,6 +960,7 @@ class PolygonMasks(BaseInstanceMasks):
a list of vertices, in CCW order.
"""
from scipy.stats import truncnorm
+
# Generate around the unit circle
cx, cy = (0.0, 0.0)
radius = 1
@@ -1019,6 +1036,24 @@ class PolygonMasks(BaseInstanceMasks):
self = cls(masks, height, width)
return self
+ def get_bboxes(self):
+ num_masks = len(self)
+ boxes = np.zeros((num_masks, 4), dtype=np.float32)
+ for idx, poly_per_obj in enumerate(self.masks):
+ # simply use a number that is big enough for comparison with
+ # coordinates
+ xy_min = np.array([self.width * 2, self.height * 2],
+ dtype=np.float32)
+ xy_max = np.zeros(2, dtype=np.float32)
+ for p in poly_per_obj:
+ xy = np.array(p).reshape(-1, 2).astype(np.float32)
+ xy_min = np.minimum(xy_min, np.min(xy, axis=0))
+ xy_max = np.maximum(xy_max, np.max(xy, axis=0))
+ boxes[idx, :2] = xy_min
+ boxes[idx, 2:] = xy_max
+
+ return boxes
+
def polygon_to_bitmap(polygons, height, width):
"""Convert masks from the form of polygons to bitmaps.
@@ -1035,3 +1070,33 @@ def polygon_to_bitmap(polygons, height, width):
rle = maskUtils.merge(rles)
bitmap_mask = maskUtils.decode(rle).astype(np.bool)
return bitmap_mask
+
+
+def bitmap_to_polygon(bitmap):
+ """Convert masks from the form of bitmaps to polygons.
+
+ Args:
+ bitmap (ndarray): masks in bitmap representation.
+
+ Return:
+ list[ndarray]: the converted mask in polygon representation.
+ bool: whether the mask has holes.
+ """
+ bitmap = np.ascontiguousarray(bitmap).astype(np.uint8)
+ # cv2.RETR_CCOMP: retrieves all of the contours and organizes them
+ # into a two-level hierarchy. At the top level, there are external
+ # boundaries of the components. At the second level, there are
+ # boundaries of the holes. If there is another contour inside a hole
+ # of a connected component, it is still put at the top level.
+ # cv2.CHAIN_APPROX_NONE: stores absolutely all the contour points.
+ outs = cv2.findContours(bitmap, cv2.RETR_CCOMP, cv2.CHAIN_APPROX_NONE)
+ contours = outs[-2]
+ hierarchy = outs[-1]
+ if hierarchy is None:
+ return [], False
+ # hierarchy[i]: 4 elements, for the indexes of next, previous,
+ # parent, or nested contours. If there is no corresponding contour,
+ # it will be -1.
+ with_hole = (hierarchy.reshape(-1, 4)[:, 3] >= 0).any()
+ contours = [c.reshape(-1, 2) for c in contours]
+ return contours, with_hole
diff --git a/mmdet/core/visualization/image.py b/mmdet/core/visualization/image.py
index 5a148384..66f82a38 100644
--- a/mmdet/core/visualization/image.py
+++ b/mmdet/core/visualization/image.py
@@ -1,3 +1,5 @@
+# Copyright (c) OpenMMLab. All rights reserved.
+import cv2
import matplotlib.pyplot as plt
import mmcv
import numpy as np
@@ -5,17 +7,25 @@ import pycocotools.mask as mask_util
from matplotlib.collections import PatchCollection
from matplotlib.patches import Polygon
+#from mmdet.core.evaluation.panoptic_utils import INSTANCE_OFFSET
+from ..mask.structures import bitmap_to_polygon
from ..utils import mask2ndarray
+from .palette import get_palette, palette_val
+
+__all__ = [
+ 'color_val_matplotlib', 'draw_masks', 'draw_bboxes', 'draw_labels',
+ 'imshow_det_bboxes', 'imshow_gt_det_bboxes'
+]
EPS = 1e-2
def color_val_matplotlib(color):
"""Convert various input in BGR order to normalized RGB matplotlib color
- tuples,
+ tuples.
Args:
- color (:obj:`Color`/str/tuple/int/ndarray): Color inputs
+ color (:obj`Color` | str | tuple | int | ndarray): Color inputs.
Returns:
tuple[float]: A tuple of 3 normalized floats indicating RGB channels.
@@ -25,9 +35,177 @@ def color_val_matplotlib(color):
return tuple(color)
+def _get_adaptive_scales(areas, min_area=800, max_area=30000):
+ """Get adaptive scales according to areas.
+
+ The scale range is [0.5, 1.0]. When the area is less than
+ ``'min_area'``, the scale is 0.5 while the area is larger than
+ ``'max_area'``, the scale is 1.0.
+
+ Args:
+ areas (ndarray): The areas of bboxes or masks with the
+ shape of (n, ).
+ min_area (int): Lower bound areas for adaptive scales.
+ Default: 800.
+ max_area (int): Upper bound areas for adaptive scales.
+ Default: 30000.
+
+ Returns:
+ ndarray: The adaotive scales with the shape of (n, ).
+ """
+ scales = 0.5 + (areas - min_area) / (max_area - min_area)
+ scales = np.clip(scales, 0.5, 1.0)
+ return scales
+
+
+def _get_bias_color(base, max_dist=30):
+ """Get different colors for each masks.
+
+ Get different colors for each masks by adding a bias
+ color to the base category color.
+ Args:
+ base (ndarray): The base category color with the shape
+ of (3, ).
+ max_dist (int): The max distance of bias. Default: 30.
+
+ Returns:
+ ndarray: The new color for a mask with the shape of (3, ).
+ """
+ new_color = base + np.random.randint(
+ low=-max_dist, high=max_dist + 1, size=3)
+ return np.clip(new_color, 0, 255, new_color)
+
+
+def draw_bboxes(ax, bboxes, color='g', alpha=0.8, thickness=2):
+ """Draw bounding boxes on the axes.
+
+ Args:
+ ax (matplotlib.Axes): The input axes.
+ bboxes (ndarray): The input bounding boxes with the shape
+ of (n, 4).
+ color (list[tuple] | matplotlib.color): the colors for each
+ bounding boxes.
+ alpha (float): Transparency of bounding boxes. Default: 0.8.
+ thickness (int): Thickness of lines. Default: 2.
+
+ Returns:
+ matplotlib.Axes: The result axes.
+ """
+ polygons = []
+ for i, bbox in enumerate(bboxes):
+ bbox_int = bbox.astype(np.int32)
+ poly = [[bbox_int[0], bbox_int[1]], [bbox_int[0], bbox_int[3]],
+ [bbox_int[2], bbox_int[3]], [bbox_int[2], bbox_int[1]]]
+ np_poly = np.array(poly).reshape((4, 2))
+ polygons.append(Polygon(np_poly))
+ p = PatchCollection(
+ polygons,
+ facecolor='none',
+ edgecolors=color,
+ linewidths=thickness,
+ alpha=alpha)
+ ax.add_collection(p)
+
+ return ax
+
+
+def draw_labels(ax,
+ labels,
+ positions,
+ scores=None,
+ class_names=None,
+ color='w',
+ font_size=8,
+ scales=None,
+ horizontal_alignment='left'):
+ """Draw labels on the axes.
+
+ Args:
+ ax (matplotlib.Axes): The input axes.
+ labels (ndarray): The labels with the shape of (n, ).
+ positions (ndarray): The positions to draw each labels.
+ scores (ndarray): The scores for each labels.
+ class_names (list[str]): The class names.
+ color (list[tuple] | matplotlib.color): The colors for labels.
+ font_size (int): Font size of texts. Default: 8.
+ scales (list[float]): Scales of texts. Default: None.
+ horizontal_alignment (str): The horizontal alignment method of
+ texts. Default: 'left'.
+
+ Returns:
+ matplotlib.Axes: The result axes.
+ """
+ for i, (pos, label) in enumerate(zip(positions, labels)):
+ label_text = class_names[
+ label] if class_names is not None else f'class {label}'
+ if scores is not None:
+ label_text += f'|{scores[i]:.02f}'
+ text_color = color[i] if isinstance(color, list) else color
+
+ font_size_mask = font_size if scales is None else font_size * scales[i]
+ ax.text(
+ pos[0],
+ pos[1],
+ f'{label_text}',
+ bbox={
+ 'facecolor': 'black',
+ 'alpha': 0.8,
+ 'pad': 0.7,
+ 'edgecolor': 'none'
+ },
+ color=text_color,
+ fontsize=font_size_mask,
+ verticalalignment='top',
+ horizontalalignment=horizontal_alignment)
+
+ return ax
+
+
+def draw_masks(ax, img, masks, color=None, with_edge=True, alpha=0.8):
+ """Draw masks on the image and their edges on the axes.
+
+ Args:
+ ax (matplotlib.Axes): The input axes.
+ img (ndarray): The image with the shape of (3, h, w).
+ masks (ndarray): The masks with the shape of (n, h, w).
+ color (ndarray): The colors for each masks with the shape
+ of (n, 3).
+ with_edge (bool): Whether to draw edges. Default: True.
+ alpha (float): Transparency of bounding boxes. Default: 0.8.
+
+ Returns:
+ matplotlib.Axes: The result axes.
+ ndarray: The result image.
+ """
+ taken_colors = set([0, 0, 0])
+ if color is None:
+ random_colors = np.random.randint(0, 255, (masks.size(0), 3))
+ color = [tuple(c) for c in random_colors]
+ color = np.array(color, dtype=np.uint8)
+ polygons = []
+ for i, mask in enumerate(masks):
+ if with_edge:
+ contours, _ = bitmap_to_polygon(mask)
+ polygons += [Polygon(c) for c in contours]
+
+ color_mask = color[i]
+ while tuple(color_mask) in taken_colors:
+ color_mask = _get_bias_color(color_mask)
+ taken_colors.add(tuple(color_mask))
+
+ mask = mask.astype(bool)
+ img[mask] = img[mask] * (1 - alpha) + color_mask * alpha
+
+ p = PatchCollection(
+ polygons, facecolor='none', edgecolors='w', linewidths=1, alpha=0.8)
+ ax.add_collection(p)
+
+ return ax, img
+
+
def imshow_det_bboxes(img,
- bboxes,
- labels,
+ bboxes=None,
+ labels=None,
segms=None,
class_names=None,
score_thr=0,
@@ -35,7 +213,7 @@ def imshow_det_bboxes(img,
text_color='green',
mask_color=None,
thickness=2,
- font_size=13,
+ font_size=8,
win_name='',
show=True,
wait_time=0,
@@ -43,43 +221,51 @@ def imshow_det_bboxes(img,
"""Draw bboxes and class labels (with scores) on an image.
Args:
- img (str or ndarray): The image to be displayed.
+ img (str | ndarray): The image to be displayed.
bboxes (ndarray): Bounding boxes (with scores), shaped (n, 4) or
(n, 5).
labels (ndarray): Labels of bboxes.
- segms (ndarray or None): Masks, shaped (n,h,w) or None
+ segms (ndarray | None): Masks, shaped (n,h,w) or None.
class_names (list[str]): Names of each classes.
- score_thr (float): Minimum score of bboxes to be shown. Default: 0
- bbox_color (str or tuple(int) or :obj:`Color`):Color of bbox lines.
- The tuple of color should be in BGR order. Default: 'green'
- text_color (str or tuple(int) or :obj:`Color`):Color of texts.
- The tuple of color should be in BGR order. Default: 'green'
- mask_color (str or tuple(int) or :obj:`Color`, optional):
- Color of masks. The tuple of color should be in BGR order.
- Default: None
- thickness (int): Thickness of lines. Default: 2
- font_size (int): Font size of texts. Default: 13
- show (bool): Whether to show the image. Default: True
- win_name (str): The window name. Default: ''
+ score_thr (float): Minimum score of bboxes to be shown. Default: 0.
+ bbox_color (list[tuple] | tuple | str | None): Colors of bbox lines.
+ If a single color is given, it will be applied to all classes.
+ The tuple of color should be in RGB order. Default: 'green'.
+ text_color (list[tuple] | tuple | str | None): Colors of texts.
+ If a single color is given, it will be applied to all classes.
+ The tuple of color should be in RGB order. Default: 'green'.
+ mask_color (list[tuple] | tuple | str | None, optional): Colors of
+ masks. If a single color is given, it will be applied to all
+ classes. The tuple of color should be in RGB order.
+ Default: None.
+ thickness (int): Thickness of lines. Default: 2.
+ font_size (int): Font size of texts. Default: 13.
+ show (bool): Whether to show the image. Default: True.
+ win_name (str): The window name. Default: ''.
wait_time (float): Value of waitKey param. Default: 0.
out_file (str, optional): The filename to write the image.
- Default: None
+ Default: None.
Returns:
ndarray: The image with bboxes drawn on it.
"""
- assert bboxes.ndim == 2, \
+ assert bboxes is None or bboxes.ndim == 2, \
f' bboxes ndim should be 2, but its ndim is {bboxes.ndim}.'
assert labels.ndim == 1, \
f' labels ndim should be 1, but its ndim is {labels.ndim}.'
- assert bboxes.shape[0] == labels.shape[0], \
- 'bboxes.shape[0] and labels.shape[0] should have the same length.'
- assert bboxes.shape[1] == 4 or bboxes.shape[1] == 5, \
+ assert bboxes is None or bboxes.shape[1] == 4 or bboxes.shape[1] == 5, \
f' bboxes.shape[1] should be 4 or 5, but its {bboxes.shape[1]}.'
+ assert bboxes is None or bboxes.shape[0] <= labels.shape[0], \
+ 'labels.shape[0] should not be less than bboxes.shape[0].'
+ assert segms is None or segms.shape[0] == labels.shape[0], \
+ 'segms.shape[0] and labels.shape[0] should have the same length.'
+ assert segms is not None or bboxes is not None, \
+ 'segms and bboxes should not be None at the same time.'
+
img = mmcv.imread(img).astype(np.uint8)
if score_thr > 0:
- assert bboxes.shape[1] == 5
+ assert bboxes is not None and bboxes.shape[1] == 5
scores = bboxes[:, -1]
inds = scores > score_thr
bboxes = bboxes[inds, :]
@@ -87,25 +273,6 @@ def imshow_det_bboxes(img,
if segms is not None:
segms = segms[inds, ...]
- mask_colors = []
- if labels.shape[0] > 0:
- if mask_color is None:
- # random color
- np.random.seed(42)
- mask_colors = [
- np.random.randint(0, 256, (1, 3), dtype=np.uint8)
- for _ in range(max(labels) + 1)
- ]
- else:
- # specify color
- mask_colors = [
- np.array(mmcv.color_val(mask_color)[::-1], dtype=np.uint8)
- ] * (
- max(labels) + 1)
-
- bbox_color = color_val_matplotlib(bbox_color)
- text_color = color_val_matplotlib(text_color)
-
img = mmcv.bgr2rgb(img)
width, height = img.shape[1], img.shape[0]
img = np.ascontiguousarray(img)
@@ -123,44 +290,64 @@ def imshow_det_bboxes(img,
ax = plt.gca()
ax.axis('off')
- polygons = []
- color = []
- for i, (bbox, label) in enumerate(zip(bboxes, labels)):
- bbox_int = bbox.astype(np.int32)
- poly = [[bbox_int[0], bbox_int[1]], [bbox_int[0], bbox_int[3]],
- [bbox_int[2], bbox_int[3]], [bbox_int[2], bbox_int[1]]]
- np_poly = np.array(poly).reshape((4, 2))
- polygons.append(Polygon(np_poly))
- color.append(bbox_color)
- label_text = class_names[
- label] if class_names is not None else f'class {label}'
- if len(bbox) > 4:
- label_text += f'|{bbox[-1]:.02f}'
- ax.text(
- bbox_int[0],
- bbox_int[1],
- f'{label_text}',
- bbox={
- 'facecolor': 'black',
- 'alpha': 0.8,
- 'pad': 0.7,
- 'edgecolor': 'none'
- },
- color=text_color,
- fontsize=font_size,
- verticalalignment='top',
- horizontalalignment='left')
- if segms is not None:
- color_mask = mask_colors[labels[i]]
- mask = segms[i].astype(bool)
- img[mask] = img[mask] * 0.5 + color_mask * 0.5
+ max_label = int(max(labels) if len(labels) > 0 else 0)
+ text_palette = palette_val(get_palette(text_color, max_label + 1))
+ text_colors = [text_palette[label] for label in labels]
+
+ num_bboxes = 0
+ if bboxes is not None:
+ num_bboxes = bboxes.shape[0]
+ bbox_palette = palette_val(get_palette(bbox_color, max_label + 1))
+ colors = [bbox_palette[label] for label in labels[:num_bboxes]]
+ draw_bboxes(ax, bboxes, colors, alpha=0.8, thickness=thickness)
+
+ horizontal_alignment = 'left'
+ positions = bboxes[:, :2].astype(np.int32) + thickness
+ areas = (bboxes[:, 3] - bboxes[:, 1]) * (bboxes[:, 2] - bboxes[:, 0])
+ scales = _get_adaptive_scales(areas)
+ scores = bboxes[:, 4] if bboxes.shape[1] == 5 else None
+ draw_labels(
+ ax,
+ labels[:num_bboxes],
+ positions,
+ scores=scores,
+ class_names=class_names,
+ color=text_colors,
+ font_size=font_size,
+ scales=scales,
+ horizontal_alignment=horizontal_alignment)
+
+ if segms is not None:
+ mask_palette = get_palette(mask_color, max_label + 1)
+ colors = [mask_palette[label] for label in labels]
+ colors = np.array(colors, dtype=np.uint8)
+ draw_masks(ax, img, segms, colors, with_edge=True)
+
+ if num_bboxes < segms.shape[0]:
+ segms = segms[num_bboxes:]
+ horizontal_alignment = 'center'
+ areas = []
+ positions = []
+ for mask in segms:
+ _, _, stats, centroids = cv2.connectedComponentsWithStats(
+ mask.astype(np.uint8), connectivity=8)
+ largest_id = np.argmax(stats[1:, -1]) + 1
+ positions.append(centroids[largest_id])
+ areas.append(stats[largest_id, -1])
+ areas = np.stack(areas, axis=0)
+ scales = _get_adaptive_scales(areas)
+ draw_labels(
+ ax,
+ labels[num_bboxes:],
+ positions,
+ class_names=class_names,
+ color=text_colors,
+ font_size=font_size,
+ scales=scales,
+ horizontal_alignment=horizontal_alignment)
plt.imshow(img)
- p = PatchCollection(
- polygons, facecolor='none', edgecolors=color, linewidths=thickness)
- ax.add_collection(p)
-
stream, _ = canvas.print_to_buffer()
buffer = np.frombuffer(stream, dtype='uint8')
img_rgba = buffer.reshape(height, width, 4)
@@ -191,12 +378,12 @@ def imshow_gt_det_bboxes(img,
result,
class_names=None,
score_thr=0,
- gt_bbox_color=(255, 102, 61),
- gt_text_color=(255, 102, 61),
- gt_mask_color=(255, 102, 61),
- det_bbox_color=(72, 101, 241),
- det_text_color=(72, 101, 241),
- det_mask_color=(72, 101, 241),
+ gt_bbox_color=(61, 102, 255),
+ gt_text_color=(200, 200, 200),
+ gt_mask_color=(61, 102, 255),
+ det_bbox_color=(241, 101, 72),
+ det_text_color=(200, 200, 200),
+ det_mask_color=(241, 101, 72),
thickness=2,
font_size=13,
win_name='',
@@ -206,54 +393,75 @@ def imshow_gt_det_bboxes(img,
"""General visualization GT and result function.
Args:
- img (str or ndarray): The image to be displayed.)
+ img (str | ndarray): The image to be displayed.
annotation (dict): Ground truth annotations where contain keys of
- 'gt_bboxes' and 'gt_labels' or 'gt_masks'
- result (tuple[list] or list): The detection result, can be either
+ 'gt_bboxes' and 'gt_labels' or 'gt_masks'.
+ result (tuple[list] | list): The detection result, can be either
(bbox, segm) or just bbox.
class_names (list[str]): Names of each classes.
- score_thr (float): Minimum score of bboxes to be shown. Default: 0
- gt_bbox_color (str or tuple(int) or :obj:`Color`):Color of bbox lines.
- The tuple of color should be in BGR order. Default: (255, 102, 61)
- gt_text_color (str or tuple(int) or :obj:`Color`):Color of texts.
- The tuple of color should be in BGR order. Default: (255, 102, 61)
- gt_mask_color (str or tuple(int) or :obj:`Color`, optional):
- Color of masks. The tuple of color should be in BGR order.
- Default: (255, 102, 61)
- det_bbox_color (str or tuple(int) or :obj:`Color`):Color of bbox lines.
- The tuple of color should be in BGR order. Default: (72, 101, 241)
- det_text_color (str or tuple(int) or :obj:`Color`):Color of texts.
- The tuple of color should be in BGR order. Default: (72, 101, 241)
- det_mask_color (str or tuple(int) or :obj:`Color`, optional):
- Color of masks. The tuple of color should be in BGR order.
- Default: (72, 101, 241)
- thickness (int): Thickness of lines. Default: 2
- font_size (int): Font size of texts. Default: 13
- win_name (str): The window name. Default: ''
- show (bool): Whether to show the image. Default: True
+ score_thr (float): Minimum score of bboxes to be shown. Default: 0.
+ gt_bbox_color (list[tuple] | tuple | str | None): Colors of bbox lines.
+ If a single color is given, it will be applied to all classes.
+ The tuple of color should be in RGB order. Default: (61, 102, 255).
+ gt_text_color (list[tuple] | tuple | str | None): Colors of texts.
+ If a single color is given, it will be applied to all classes.
+ The tuple of color should be in RGB order. Default: (200, 200, 200).
+ gt_mask_color (list[tuple] | tuple | str | None, optional): Colors of
+ masks. If a single color is given, it will be applied to all classes.
+ The tuple of color should be in RGB order. Default: (61, 102, 255).
+ det_bbox_color (list[tuple] | tuple | str | None):Colors of bbox lines.
+ If a single color is given, it will be applied to all classes.
+ The tuple of color should be in RGB order. Default: (241, 101, 72).
+ det_text_color (list[tuple] | tuple | str | None):Colors of texts.
+ If a single color is given, it will be applied to all classes.
+ The tuple of color should be in RGB order. Default: (200, 200, 200).
+ det_mask_color (list[tuple] | tuple | str | None, optional): Color of
+ masks. If a single color is given, it will be applied to all classes.
+ The tuple of color should be in RGB order. Default: (241, 101, 72).
+ thickness (int): Thickness of lines. Default: 2.
+ font_size (int): Font size of texts. Default: 13.
+ win_name (str): The window name. Default: ''.
+ show (bool): Whether to show the image. Default: True.
wait_time (float): Value of waitKey param. Default: 0.
out_file (str, optional): The filename to write the image.
- Default: None
+ Default: None.
Returns:
ndarray: The image with bboxes or masks drawn on it.
"""
assert 'gt_bboxes' in annotation
assert 'gt_labels' in annotation
- assert isinstance(
- result,
- (tuple, list)), f'Expected tuple or list, but get {type(result)}'
+ assert isinstance(result, (tuple, list, dict)), 'Expected ' \
+ f'tuple or list or dict, but get {type(result)}'
+ gt_bboxes = annotation['gt_bboxes']
+ gt_labels = annotation['gt_labels']
gt_masks = annotation.get('gt_masks', None)
if gt_masks is not None:
gt_masks = mask2ndarray(gt_masks)
+ gt_seg = annotation.get('gt_semantic_seg', None)
+ if gt_seg is not None:
+ pad_value = 255 # the padding value of gt_seg
+ sem_labels = np.unique(gt_seg)
+ all_labels = np.concatenate((gt_labels, sem_labels), axis=0)
+ all_labels, counts = np.unique(all_labels, return_counts=True)
+ stuff_labels = all_labels[np.logical_and(counts < 2,
+ all_labels != pad_value)]
+ stuff_masks = gt_seg[None] == stuff_labels[:, None, None]
+ gt_labels = np.concatenate((gt_labels, stuff_labels), axis=0)
+ gt_masks = np.concatenate((gt_masks, stuff_masks.astype(np.uint8)),
+ axis=0)
+ # If you need to show the bounding boxes,
+ # please comment the following line
+ # gt_bboxes = None
+
img = mmcv.imread(img)
img = imshow_det_bboxes(
img,
- annotation['gt_bboxes'],
- annotation['gt_labels'],
+ gt_bboxes,
+ gt_labels,
gt_masks,
class_names=class_names,
bbox_color=gt_bbox_color,
@@ -264,25 +472,38 @@ def imshow_gt_det_bboxes(img,
win_name=win_name,
show=False)
- if isinstance(result, tuple):
- bbox_result, segm_result = result
- if isinstance(segm_result, tuple):
- segm_result = segm_result[0] # ms rcnn
+ if not isinstance(result, dict):
+ if isinstance(result, tuple):
+ bbox_result, segm_result = result
+ if isinstance(segm_result, tuple):
+ segm_result = segm_result[0] # ms rcnn
+ else:
+ bbox_result, segm_result = result, None
+
+ bboxes = np.vstack(bbox_result)
+ labels = [
+ np.full(bbox.shape[0], i, dtype=np.int32)
+ for i, bbox in enumerate(bbox_result)
+ ]
+ labels = np.concatenate(labels)
+
+ segms = None
+ if segm_result is not None and len(labels) > 0: # non empty
+ segms = mmcv.concat_list(segm_result)
+ segms = mask_util.decode(segms)
+ segms = segms.transpose(2, 0, 1)
else:
- bbox_result, segm_result = result, None
-
- bboxes = np.vstack(bbox_result)
- labels = [
- np.full(bbox.shape[0], i, dtype=np.int32)
- for i, bbox in enumerate(bbox_result)
- ]
- labels = np.concatenate(labels)
-
- segms = None
- if segm_result is not None and len(labels) > 0: # non empty
- segms = mmcv.concat_list(segm_result)
- segms = mask_util.decode(segms)
- segms = segms.transpose(2, 0, 1)
+ assert class_names is not None, 'We need to know the number ' \
+ 'of classes.'
+ VOID = len(class_names)
+ bboxes = None
+ pan_results = result['pan_results']
+ # keep objects ahead
+ ids = np.unique(pan_results)[::-1]
+ legal_indices = ids != VOID
+ ids = ids[legal_indices]
+ labels = np.array([id % INSTANCE_OFFSET for id in ids], dtype=np.int64)
+ segms = (pan_results[None] == ids[:, None, None])
img = imshow_det_bboxes(
img,