Spaces:

Gradio-Blocks
/

CBNetV2

Running

App Files Files Community

CBNetV2 / patch

hysts HF staff

Add files

3fe1151 almost 3 years ago

raw

history blame

35.6 kB

	diff --git a/configs/cbnet/cascade_rcnn_cbv2d1_r2_101_mdconv_fpn_20e_fp16_ms400-1400_giou_4conv1f_coco.py b/configs/cbnet/cascade_rcnn_cbv2d1_r2_101_mdconv_fpn_20e_fp16_ms400-1400_giou_4conv1f_coco.py
	index 167d4379..7c0bd239 100644
	--- a/configs/cbnet/cascade_rcnn_cbv2d1_r2_101_mdconv_fpn_20e_fp16_ms400-1400_giou_4conv1f_coco.py
	+++ b/configs/cbnet/cascade_rcnn_cbv2d1_r2_101_mdconv_fpn_20e_fp16_ms400-1400_giou_4conv1f_coco.py
	@@ -2,9 +2,9 @@ _base_ = '../res2net/cascade_rcnn_r2_101_fpn_20e_coco.py'

	model = dict(
	backbone=dict(
	- type='CBRes2Net',
	+ type='CBRes2Net',
	cb_del_stages=1,
	- cb_inplanes=[64, 256, 512, 1024, 2048],
	+ cb_inplanes=[64, 256, 512, 1024, 2048],
	dcn=dict(type='DCNv2', deform_groups=1, fallback_on_stride=False),
	stage_with_dcn=(False, True, True, True)
	),
	@@ -28,7 +28,7 @@ model = dict(
	target_stds=[0.1, 0.1, 0.2, 0.2]),
	reg_class_agnostic=False,
	reg_decoded_bbox=True,
	- norm_cfg=dict(type='SyncBN', requires_grad=True),
	+ norm_cfg=dict(type='BN', requires_grad=True),
	loss_cls=dict(
	type='CrossEntropyLoss', use_sigmoid=False, loss_weight=1.0),
	loss_bbox=dict(type='GIoULoss', loss_weight=10.0)),
	@@ -47,7 +47,7 @@ model = dict(
	target_stds=[0.05, 0.05, 0.1, 0.1]),
	reg_class_agnostic=False,
	reg_decoded_bbox=True,
	- norm_cfg=dict(type='SyncBN', requires_grad=True),
	+ norm_cfg=dict(type='BN', requires_grad=True),
	loss_cls=dict(
	type='CrossEntropyLoss', use_sigmoid=False, loss_weight=1.0),
	loss_bbox=dict(type='GIoULoss', loss_weight=10.0)),
	@@ -66,7 +66,7 @@ model = dict(
	target_stds=[0.033, 0.033, 0.067, 0.067]),
	reg_class_agnostic=False,
	reg_decoded_bbox=True,
	- norm_cfg=dict(type='SyncBN', requires_grad=True),
	+ norm_cfg=dict(type='BN', requires_grad=True),
	loss_cls=dict(
	type='CrossEntropyLoss', use_sigmoid=False, loss_weight=1.0),
	loss_bbox=dict(type='GIoULoss', loss_weight=10.0))
	diff --git a/configs/cbnet/htc_cbv2_swin_base_patch4_window7_mstrain_400-1400_giou_4conv1f_adamw_20e_coco.py b/configs/cbnet/htc_cbv2_swin_base_patch4_window7_mstrain_400-1400_giou_4conv1f_adamw_20e_coco.py
	index 51edfd62..a7434c5d 100644
	--- a/configs/cbnet/htc_cbv2_swin_base_patch4_window7_mstrain_400-1400_giou_4conv1f_adamw_20e_coco.py
	+++ b/configs/cbnet/htc_cbv2_swin_base_patch4_window7_mstrain_400-1400_giou_4conv1f_adamw_20e_coco.py
	@@ -18,7 +18,7 @@ model = dict(
	target_stds=[0.1, 0.1, 0.2, 0.2]),
	reg_class_agnostic=True,
	reg_decoded_bbox=True,
	- norm_cfg=dict(type='SyncBN', requires_grad=True),
	+ norm_cfg=dict(type='BN', requires_grad=True),
	loss_cls=dict(
	type='CrossEntropyLoss', use_sigmoid=False, loss_weight=1.0),
	loss_bbox=dict(type='GIoULoss', loss_weight=10.0)),
	@@ -37,7 +37,7 @@ model = dict(
	target_stds=[0.05, 0.05, 0.1, 0.1]),
	reg_class_agnostic=True,
	reg_decoded_bbox=True,
	- norm_cfg=dict(type='SyncBN', requires_grad=True),
	+ norm_cfg=dict(type='BN', requires_grad=True),
	loss_cls=dict(
	type='CrossEntropyLoss', use_sigmoid=False, loss_weight=1.0),
	loss_bbox=dict(type='GIoULoss', loss_weight=10.0)),
	@@ -56,7 +56,7 @@ model = dict(
	target_stds=[0.033, 0.033, 0.067, 0.067]),
	reg_class_agnostic=True,
	reg_decoded_bbox=True,
	- norm_cfg=dict(type='SyncBN', requires_grad=True),
	+ norm_cfg=dict(type='BN', requires_grad=True),
	loss_cls=dict(
	type='CrossEntropyLoss', use_sigmoid=False, loss_weight=1.0),
	loss_bbox=dict(type='GIoULoss', loss_weight=10.0))
	diff --git a/mmdet/__init__.py b/mmdet/__init__.py
	index 646ee84e..9e846286 100644
	--- a/mmdet/__init__.py
	+++ b/mmdet/__init__.py
	@@ -20,9 +20,9 @@ mmcv_maximum_version = '1.4.0'
	mmcv_version = digit_version(mmcv.__version__)


	-assert (mmcv_version >= digit_version(mmcv_minimum_version)
	- and mmcv_version <= digit_version(mmcv_maximum_version)), \
	- f'MMCV=={mmcv.__version__} is used but incompatible. ' \
	- f'Please install mmcv>={mmcv_minimum_version}, <={mmcv_maximum_version}.'
	+#assert (mmcv_version >= digit_version(mmcv_minimum_version)
	+# and mmcv_version <= digit_version(mmcv_maximum_version)), \
	+# f'MMCV=={mmcv.__version__} is used but incompatible. ' \
	+# f'Please install mmcv>={mmcv_minimum_version}, <={mmcv_maximum_version}.'

	__all__ = ['__version__', 'short_version']
	diff --git a/mmdet/core/mask/structures.py b/mmdet/core/mask/structures.py
	index 6f5a62ae..a9d0ebb4 100644
	--- a/mmdet/core/mask/structures.py
	+++ b/mmdet/core/mask/structures.py
	@@ -1,3 +1,4 @@
	+# Copyright (c) OpenMMLab. All rights reserved.
	from abc import ABCMeta, abstractmethod

	import cv2
	@@ -528,6 +529,21 @@ class BitmapMasks(BaseInstanceMasks):
	self = cls(masks, height=height, width=width)
	return self

	+ def get_bboxes(self):
	+ num_masks = len(self)
	+ boxes = np.zeros((num_masks, 4), dtype=np.float32)
	+ x_any = self.masks.any(axis=1)
	+ y_any = self.masks.any(axis=2)
	+ for idx in range(num_masks):
	+ x = np.where(x_any[idx, :])[0]
	+ y = np.where(y_any[idx, :])[0]
	+ if len(x) > 0 and len(y) > 0:
	+ # use +1 for x_max and y_max so that the right and bottom
	+ # boundary of instance masks are fully included by the box
	+ boxes[idx, :] = np.array([x[0], y[0], x[-1] + 1, y[-1] + 1],
	+ dtype=np.float32)
	+ return boxes
	+

	class PolygonMasks(BaseInstanceMasks):
	"""This class represents masks in the form of polygons.
	@@ -637,8 +653,8 @@ class PolygonMasks(BaseInstanceMasks):
	resized_poly = []
	for p in poly_per_obj:
	p = p.copy()
	- p[0::2] *= w_scale
	- p[1::2] *= h_scale
	+ p[0::2] = p[0::2] * w_scale
	+ p[1::2] = p[1::2] * h_scale
	resized_poly.append(p)
	resized_masks.append(resized_poly)
	resized_masks = PolygonMasks(resized_masks, *out_shape)
	@@ -690,8 +706,8 @@ class PolygonMasks(BaseInstanceMasks):
	for p in poly_per_obj:
	# pycocotools will clip the boundary
	p = p.copy()
	- p[0::2] -= bbox[0]
	- p[1::2] -= bbox[1]
	+ p[0::2] = p[0::2] - bbox[0]
	+ p[1::2] = p[1::2] - bbox[1]
	cropped_poly_per_obj.append(p)
	cropped_masks.append(cropped_poly_per_obj)
	cropped_masks = PolygonMasks(cropped_masks, h, w)
	@@ -736,12 +752,12 @@ class PolygonMasks(BaseInstanceMasks):
	p = p.copy()
	# crop
	# pycocotools will clip the boundary
	- p[0::2] -= bbox[0]
	- p[1::2] -= bbox[1]
	+ p[0::2] = p[0::2] - bbox[0]
	+ p[1::2] = p[1::2] - bbox[1]

	# resize
	- p[0::2] *= w_scale
	- p[1::2] *= h_scale
	+ p[0::2] = p[0::2] * w_scale
	+ p[1::2] = p[1::2] * h_scale
	resized_mask.append(p)
	resized_masks.append(resized_mask)
	return PolygonMasks(resized_masks, *out_shape)
	@@ -944,6 +960,7 @@ class PolygonMasks(BaseInstanceMasks):
	a list of vertices, in CCW order.
	"""
	from scipy.stats import truncnorm
	+
	# Generate around the unit circle
	cx, cy = (0.0, 0.0)
	radius = 1
	@@ -1019,6 +1036,24 @@ class PolygonMasks(BaseInstanceMasks):
	self = cls(masks, height, width)
	return self

	+ def get_bboxes(self):
	+ num_masks = len(self)
	+ boxes = np.zeros((num_masks, 4), dtype=np.float32)
	+ for idx, poly_per_obj in enumerate(self.masks):
	+ # simply use a number that is big enough for comparison with
	+ # coordinates
	+ xy_min = np.array([self.width * 2, self.height * 2],
	+ dtype=np.float32)
	+ xy_max = np.zeros(2, dtype=np.float32)
	+ for p in poly_per_obj:
	+ xy = np.array(p).reshape(-1, 2).astype(np.float32)
	+ xy_min = np.minimum(xy_min, np.min(xy, axis=0))
	+ xy_max = np.maximum(xy_max, np.max(xy, axis=0))
	+ boxes[idx, :2] = xy_min
	+ boxes[idx, 2:] = xy_max
	+
	+ return boxes
	+

	def polygon_to_bitmap(polygons, height, width):
	"""Convert masks from the form of polygons to bitmaps.
	@@ -1035,3 +1070,33 @@ def polygon_to_bitmap(polygons, height, width):
	rle = maskUtils.merge(rles)
	bitmap_mask = maskUtils.decode(rle).astype(np.bool)
	return bitmap_mask
	+
	+
	+def bitmap_to_polygon(bitmap):
	+ """Convert masks from the form of bitmaps to polygons.
	+
	+ Args:
	+ bitmap (ndarray): masks in bitmap representation.
	+
	+ Return:
	+ list[ndarray]: the converted mask in polygon representation.
	+ bool: whether the mask has holes.
	+ """
	+ bitmap = np.ascontiguousarray(bitmap).astype(np.uint8)
	+ # cv2.RETR_CCOMP: retrieves all of the contours and organizes them
	+ # into a two-level hierarchy. At the top level, there are external
	+ # boundaries of the components. At the second level, there are
	+ # boundaries of the holes. If there is another contour inside a hole
	+ # of a connected component, it is still put at the top level.
	+ # cv2.CHAIN_APPROX_NONE: stores absolutely all the contour points.
	+ outs = cv2.findContours(bitmap, cv2.RETR_CCOMP, cv2.CHAIN_APPROX_NONE)
	+ contours = outs[-2]
	+ hierarchy = outs[-1]
	+ if hierarchy is None:
	+ return [], False
	+ # hierarchy[i]: 4 elements, for the indexes of next, previous,
	+ # parent, or nested contours. If there is no corresponding contour,
	+ # it will be -1.
	+ with_hole = (hierarchy.reshape(-1, 4)[:, 3] >= 0).any()
	+ contours = [c.reshape(-1, 2) for c in contours]
	+ return contours, with_hole
	diff --git a/mmdet/core/visualization/image.py b/mmdet/core/visualization/image.py
	index 5a148384..66f82a38 100644
	--- a/mmdet/core/visualization/image.py
	+++ b/mmdet/core/visualization/image.py
	@@ -1,3 +1,5 @@
	+# Copyright (c) OpenMMLab. All rights reserved.
	+import cv2
	import matplotlib.pyplot as plt
	import mmcv
	import numpy as np
	@@ -5,17 +7,25 @@ import pycocotools.mask as mask_util
	from matplotlib.collections import PatchCollection
	from matplotlib.patches import Polygon

	+#from mmdet.core.evaluation.panoptic_utils import INSTANCE_OFFSET
	+from ..mask.structures import bitmap_to_polygon
	from ..utils import mask2ndarray
	+from .palette import get_palette, palette_val
	+
	+__all__ = [
	+ 'color_val_matplotlib', 'draw_masks', 'draw_bboxes', 'draw_labels',
	+ 'imshow_det_bboxes', 'imshow_gt_det_bboxes'
	+]

	EPS = 1e-2


	def color_val_matplotlib(color):
	"""Convert various input in BGR order to normalized RGB matplotlib color
	- tuples,
	+ tuples.

	Args:
	- color (:obj:`Color`/str/tuple/int/ndarray): Color inputs
	+ color (:obj`Color` \| str \| tuple \| int \| ndarray): Color inputs.

	Returns:
	tuple[float]: A tuple of 3 normalized floats indicating RGB channels.
	@@ -25,9 +35,177 @@ def color_val_matplotlib(color):
	return tuple(color)


	+def _get_adaptive_scales(areas, min_area=800, max_area=30000):
	+ """Get adaptive scales according to areas.
	+
	+ The scale range is [0.5, 1.0]. When the area is less than
	+ ``'min_area'``, the scale is 0.5 while the area is larger than
	+ ``'max_area'``, the scale is 1.0.
	+
	+ Args:
	+ areas (ndarray): The areas of bboxes or masks with the
	+ shape of (n, ).
	+ min_area (int): Lower bound areas for adaptive scales.
	+ Default: 800.
	+ max_area (int): Upper bound areas for adaptive scales.
	+ Default: 30000.
	+
	+ Returns:
	+ ndarray: The adaotive scales with the shape of (n, ).
	+ """
	+ scales = 0.5 + (areas - min_area) / (max_area - min_area)
	+ scales = np.clip(scales, 0.5, 1.0)
	+ return scales
	+
	+
	+def _get_bias_color(base, max_dist=30):
	+ """Get different colors for each masks.
	+
	+ Get different colors for each masks by adding a bias
	+ color to the base category color.
	+ Args:
	+ base (ndarray): The base category color with the shape
	+ of (3, ).
	+ max_dist (int): The max distance of bias. Default: 30.
	+
	+ Returns:
	+ ndarray: The new color for a mask with the shape of (3, ).
	+ """
	+ new_color = base + np.random.randint(
	+ low=-max_dist, high=max_dist + 1, size=3)
	+ return np.clip(new_color, 0, 255, new_color)
	+
	+
	+def draw_bboxes(ax, bboxes, color='g', alpha=0.8, thickness=2):
	+ """Draw bounding boxes on the axes.
	+
	+ Args:
	+ ax (matplotlib.Axes): The input axes.
	+ bboxes (ndarray): The input bounding boxes with the shape
	+ of (n, 4).
	+ color (list[tuple] \| matplotlib.color): the colors for each
	+ bounding boxes.
	+ alpha (float): Transparency of bounding boxes. Default: 0.8.
	+ thickness (int): Thickness of lines. Default: 2.
	+
	+ Returns:
	+ matplotlib.Axes: The result axes.
	+ """
	+ polygons = []
	+ for i, bbox in enumerate(bboxes):
	+ bbox_int = bbox.astype(np.int32)
	+ poly = [[bbox_int[0], bbox_int[1]], [bbox_int[0], bbox_int[3]],
	+ [bbox_int[2], bbox_int[3]], [bbox_int[2], bbox_int[1]]]
	+ np_poly = np.array(poly).reshape((4, 2))
	+ polygons.append(Polygon(np_poly))
	+ p = PatchCollection(
	+ polygons,
	+ facecolor='none',
	+ edgecolors=color,
	+ linewidths=thickness,
	+ alpha=alpha)
	+ ax.add_collection(p)
	+
	+ return ax
	+
	+
	+def draw_labels(ax,
	+ labels,
	+ positions,
	+ scores=None,
	+ class_names=None,
	+ color='w',
	+ font_size=8,
	+ scales=None,
	+ horizontal_alignment='left'):
	+ """Draw labels on the axes.
	+
	+ Args:
	+ ax (matplotlib.Axes): The input axes.
	+ labels (ndarray): The labels with the shape of (n, ).
	+ positions (ndarray): The positions to draw each labels.
	+ scores (ndarray): The scores for each labels.
	+ class_names (list[str]): The class names.
	+ color (list[tuple] \| matplotlib.color): The colors for labels.
	+ font_size (int): Font size of texts. Default: 8.
	+ scales (list[float]): Scales of texts. Default: None.
	+ horizontal_alignment (str): The horizontal alignment method of
	+ texts. Default: 'left'.
	+
	+ Returns:
	+ matplotlib.Axes: The result axes.
	+ """
	+ for i, (pos, label) in enumerate(zip(positions, labels)):
	+ label_text = class_names[
	+ label] if class_names is not None else f'class {label}'
	+ if scores is not None:
	+ label_text += f'\|{scores[i]:.02f}'
	+ text_color = color[i] if isinstance(color, list) else color
	+
	+ font_size_mask = font_size if scales is None else font_size * scales[i]
	+ ax.text(
	+ pos[0],
	+ pos[1],
	+ f'{label_text}',
	+ bbox={
	+ 'facecolor': 'black',
	+ 'alpha': 0.8,
	+ 'pad': 0.7,
	+ 'edgecolor': 'none'
	+ },
	+ color=text_color,
	+ fontsize=font_size_mask,
	+ verticalalignment='top',
	+ horizontalalignment=horizontal_alignment)
	+
	+ return ax
	+
	+
	+def draw_masks(ax, img, masks, color=None, with_edge=True, alpha=0.8):
	+ """Draw masks on the image and their edges on the axes.
	+
	+ Args:
	+ ax (matplotlib.Axes): The input axes.
	+ img (ndarray): The image with the shape of (3, h, w).
	+ masks (ndarray): The masks with the shape of (n, h, w).
	+ color (ndarray): The colors for each masks with the shape
	+ of (n, 3).
	+ with_edge (bool): Whether to draw edges. Default: True.
	+ alpha (float): Transparency of bounding boxes. Default: 0.8.
	+
	+ Returns:
	+ matplotlib.Axes: The result axes.
	+ ndarray: The result image.
	+ """
	+ taken_colors = set([0, 0, 0])
	+ if color is None:
	+ random_colors = np.random.randint(0, 255, (masks.size(0), 3))
	+ color = [tuple(c) for c in random_colors]
	+ color = np.array(color, dtype=np.uint8)
	+ polygons = []
	+ for i, mask in enumerate(masks):
	+ if with_edge:
	+ contours, _ = bitmap_to_polygon(mask)
	+ polygons += [Polygon(c) for c in contours]
	+
	+ color_mask = color[i]
	+ while tuple(color_mask) in taken_colors:
	+ color_mask = _get_bias_color(color_mask)
	+ taken_colors.add(tuple(color_mask))
	+
	+ mask = mask.astype(bool)
	+ img[mask] = img[mask] * (1 - alpha) + color_mask * alpha
	+
	+ p = PatchCollection(
	+ polygons, facecolor='none', edgecolors='w', linewidths=1, alpha=0.8)
	+ ax.add_collection(p)
	+
	+ return ax, img
	+
	+
	def imshow_det_bboxes(img,
	- bboxes,
	- labels,
	+ bboxes=None,
	+ labels=None,
	segms=None,
	class_names=None,
	score_thr=0,
	@@ -35,7 +213,7 @@ def imshow_det_bboxes(img,
	text_color='green',
	mask_color=None,
	thickness=2,
	- font_size=13,
	+ font_size=8,
	win_name='',
	show=True,
	wait_time=0,
	@@ -43,43 +221,51 @@ def imshow_det_bboxes(img,
	"""Draw bboxes and class labels (with scores) on an image.

	Args:
	- img (str or ndarray): The image to be displayed.
	+ img (str \| ndarray): The image to be displayed.
	bboxes (ndarray): Bounding boxes (with scores), shaped (n, 4) or
	(n, 5).
	labels (ndarray): Labels of bboxes.
	- segms (ndarray or None): Masks, shaped (n,h,w) or None
	+ segms (ndarray \| None): Masks, shaped (n,h,w) or None.
	class_names (list[str]): Names of each classes.
	- score_thr (float): Minimum score of bboxes to be shown. Default: 0
	- bbox_color (str or tuple(int) or :obj:`Color`):Color of bbox lines.
	- The tuple of color should be in BGR order. Default: 'green'
	- text_color (str or tuple(int) or :obj:`Color`):Color of texts.
	- The tuple of color should be in BGR order. Default: 'green'
	- mask_color (str or tuple(int) or :obj:`Color`, optional):
	- Color of masks. The tuple of color should be in BGR order.
	- Default: None
	- thickness (int): Thickness of lines. Default: 2
	- font_size (int): Font size of texts. Default: 13
	- show (bool): Whether to show the image. Default: True
	- win_name (str): The window name. Default: ''
	+ score_thr (float): Minimum score of bboxes to be shown. Default: 0.
	+ bbox_color (list[tuple] \| tuple \| str \| None): Colors of bbox lines.
	+ If a single color is given, it will be applied to all classes.
	+ The tuple of color should be in RGB order. Default: 'green'.
	+ text_color (list[tuple] \| tuple \| str \| None): Colors of texts.
	+ If a single color is given, it will be applied to all classes.
	+ The tuple of color should be in RGB order. Default: 'green'.
	+ mask_color (list[tuple] \| tuple \| str \| None, optional): Colors of
	+ masks. If a single color is given, it will be applied to all
	+ classes. The tuple of color should be in RGB order.
	+ Default: None.
	+ thickness (int): Thickness of lines. Default: 2.
	+ font_size (int): Font size of texts. Default: 13.
	+ show (bool): Whether to show the image. Default: True.
	+ win_name (str): The window name. Default: ''.
	wait_time (float): Value of waitKey param. Default: 0.
	out_file (str, optional): The filename to write the image.
	- Default: None
	+ Default: None.

	Returns:
	ndarray: The image with bboxes drawn on it.
	"""
	- assert bboxes.ndim == 2, \
	+ assert bboxes is None or bboxes.ndim == 2, \
	f' bboxes ndim should be 2, but its ndim is {bboxes.ndim}.'
	assert labels.ndim == 1, \
	f' labels ndim should be 1, but its ndim is {labels.ndim}.'
	- assert bboxes.shape[0] == labels.shape[0], \
	- 'bboxes.shape[0] and labels.shape[0] should have the same length.'
	- assert bboxes.shape[1] == 4 or bboxes.shape[1] == 5, \
	+ assert bboxes is None or bboxes.shape[1] == 4 or bboxes.shape[1] == 5, \
	f' bboxes.shape[1] should be 4 or 5, but its {bboxes.shape[1]}.'
	+ assert bboxes is None or bboxes.shape[0] <= labels.shape[0], \
	+ 'labels.shape[0] should not be less than bboxes.shape[0].'
	+ assert segms is None or segms.shape[0] == labels.shape[0], \
	+ 'segms.shape[0] and labels.shape[0] should have the same length.'
	+ assert segms is not None or bboxes is not None, \
	+ 'segms and bboxes should not be None at the same time.'
	+
	img = mmcv.imread(img).astype(np.uint8)

	if score_thr > 0:
	- assert bboxes.shape[1] == 5
	+ assert bboxes is not None and bboxes.shape[1] == 5
	scores = bboxes[:, -1]
	inds = scores > score_thr
	bboxes = bboxes[inds, :]
	@@ -87,25 +273,6 @@ def imshow_det_bboxes(img,
	if segms is not None:
	segms = segms[inds, ...]

	- mask_colors = []
	- if labels.shape[0] > 0:
	- if mask_color is None:
	- # random color
	- np.random.seed(42)
	- mask_colors = [
	- np.random.randint(0, 256, (1, 3), dtype=np.uint8)
	- for _ in range(max(labels) + 1)
	- ]
	- else:
	- # specify color
	- mask_colors = [
	- np.array(mmcv.color_val(mask_color)[::-1], dtype=np.uint8)
	- ] * (
	- max(labels) + 1)
	-
	- bbox_color = color_val_matplotlib(bbox_color)
	- text_color = color_val_matplotlib(text_color)
	-
	img = mmcv.bgr2rgb(img)
	width, height = img.shape[1], img.shape[0]
	img = np.ascontiguousarray(img)
	@@ -123,44 +290,64 @@ def imshow_det_bboxes(img,
	ax = plt.gca()
	ax.axis('off')

	- polygons = []
	- color = []
	- for i, (bbox, label) in enumerate(zip(bboxes, labels)):
	- bbox_int = bbox.astype(np.int32)
	- poly = [[bbox_int[0], bbox_int[1]], [bbox_int[0], bbox_int[3]],
	- [bbox_int[2], bbox_int[3]], [bbox_int[2], bbox_int[1]]]
	- np_poly = np.array(poly).reshape((4, 2))
	- polygons.append(Polygon(np_poly))
	- color.append(bbox_color)
	- label_text = class_names[
	- label] if class_names is not None else f'class {label}'
	- if len(bbox) > 4:
	- label_text += f'\|{bbox[-1]:.02f}'
	- ax.text(
	- bbox_int[0],
	- bbox_int[1],
	- f'{label_text}',
	- bbox={
	- 'facecolor': 'black',
	- 'alpha': 0.8,
	- 'pad': 0.7,
	- 'edgecolor': 'none'
	- },
	- color=text_color,
	- fontsize=font_size,
	- verticalalignment='top',
	- horizontalalignment='left')
	- if segms is not None:
	- color_mask = mask_colors[labels[i]]
	- mask = segms[i].astype(bool)
	- img[mask] = img[mask] * 0.5 + color_mask * 0.5
	+ max_label = int(max(labels) if len(labels) > 0 else 0)
	+ text_palette = palette_val(get_palette(text_color, max_label + 1))
	+ text_colors = [text_palette[label] for label in labels]
	+
	+ num_bboxes = 0
	+ if bboxes is not None:
	+ num_bboxes = bboxes.shape[0]
	+ bbox_palette = palette_val(get_palette(bbox_color, max_label + 1))
	+ colors = [bbox_palette[label] for label in labels[:num_bboxes]]
	+ draw_bboxes(ax, bboxes, colors, alpha=0.8, thickness=thickness)
	+
	+ horizontal_alignment = 'left'
	+ positions = bboxes[:, :2].astype(np.int32) + thickness
	+ areas = (bboxes[:, 3] - bboxes[:, 1]) * (bboxes[:, 2] - bboxes[:, 0])
	+ scales = _get_adaptive_scales(areas)
	+ scores = bboxes[:, 4] if bboxes.shape[1] == 5 else None
	+ draw_labels(
	+ ax,
	+ labels[:num_bboxes],
	+ positions,
	+ scores=scores,
	+ class_names=class_names,
	+ color=text_colors,
	+ font_size=font_size,
	+ scales=scales,
	+ horizontal_alignment=horizontal_alignment)
	+
	+ if segms is not None:
	+ mask_palette = get_palette(mask_color, max_label + 1)
	+ colors = [mask_palette[label] for label in labels]
	+ colors = np.array(colors, dtype=np.uint8)
	+ draw_masks(ax, img, segms, colors, with_edge=True)
	+
	+ if num_bboxes < segms.shape[0]:
	+ segms = segms[num_bboxes:]
	+ horizontal_alignment = 'center'
	+ areas = []
	+ positions = []
	+ for mask in segms:
	+ _, _, stats, centroids = cv2.connectedComponentsWithStats(
	+ mask.astype(np.uint8), connectivity=8)
	+ largest_id = np.argmax(stats[1:, -1]) + 1
	+ positions.append(centroids[largest_id])
	+ areas.append(stats[largest_id, -1])
	+ areas = np.stack(areas, axis=0)
	+ scales = _get_adaptive_scales(areas)
	+ draw_labels(
	+ ax,
	+ labels[num_bboxes:],
	+ positions,
	+ class_names=class_names,
	+ color=text_colors,
	+ font_size=font_size,
	+ scales=scales,
	+ horizontal_alignment=horizontal_alignment)

	plt.imshow(img)

	- p = PatchCollection(
	- polygons, facecolor='none', edgecolors=color, linewidths=thickness)
	- ax.add_collection(p)
	-
	stream, _ = canvas.print_to_buffer()
	buffer = np.frombuffer(stream, dtype='uint8')
	img_rgba = buffer.reshape(height, width, 4)
	@@ -191,12 +378,12 @@ def imshow_gt_det_bboxes(img,
	result,
	class_names=None,
	score_thr=0,
	- gt_bbox_color=(255, 102, 61),
	- gt_text_color=(255, 102, 61),
	- gt_mask_color=(255, 102, 61),
	- det_bbox_color=(72, 101, 241),
	- det_text_color=(72, 101, 241),
	- det_mask_color=(72, 101, 241),
	+ gt_bbox_color=(61, 102, 255),
	+ gt_text_color=(200, 200, 200),
	+ gt_mask_color=(61, 102, 255),
	+ det_bbox_color=(241, 101, 72),
	+ det_text_color=(200, 200, 200),
	+ det_mask_color=(241, 101, 72),
	thickness=2,
	font_size=13,
	win_name='',
	@@ -206,54 +393,75 @@ def imshow_gt_det_bboxes(img,
	"""General visualization GT and result function.

	Args:
	- img (str or ndarray): The image to be displayed.)
	+ img (str \| ndarray): The image to be displayed.
	annotation (dict): Ground truth annotations where contain keys of
	- 'gt_bboxes' and 'gt_labels' or 'gt_masks'
	- result (tuple[list] or list): The detection result, can be either
	+ 'gt_bboxes' and 'gt_labels' or 'gt_masks'.
	+ result (tuple[list] \| list): The detection result, can be either
	(bbox, segm) or just bbox.
	class_names (list[str]): Names of each classes.
	- score_thr (float): Minimum score of bboxes to be shown. Default: 0
	- gt_bbox_color (str or tuple(int) or :obj:`Color`):Color of bbox lines.
	- The tuple of color should be in BGR order. Default: (255, 102, 61)
	- gt_text_color (str or tuple(int) or :obj:`Color`):Color of texts.
	- The tuple of color should be in BGR order. Default: (255, 102, 61)
	- gt_mask_color (str or tuple(int) or :obj:`Color`, optional):
	- Color of masks. The tuple of color should be in BGR order.
	- Default: (255, 102, 61)
	- det_bbox_color (str or tuple(int) or :obj:`Color`):Color of bbox lines.
	- The tuple of color should be in BGR order. Default: (72, 101, 241)
	- det_text_color (str or tuple(int) or :obj:`Color`):Color of texts.
	- The tuple of color should be in BGR order. Default: (72, 101, 241)
	- det_mask_color (str or tuple(int) or :obj:`Color`, optional):
	- Color of masks. The tuple of color should be in BGR order.
	- Default: (72, 101, 241)
	- thickness (int): Thickness of lines. Default: 2
	- font_size (int): Font size of texts. Default: 13
	- win_name (str): The window name. Default: ''
	- show (bool): Whether to show the image. Default: True
	+ score_thr (float): Minimum score of bboxes to be shown. Default: 0.
	+ gt_bbox_color (list[tuple] \| tuple \| str \| None): Colors of bbox lines.
	+ If a single color is given, it will be applied to all classes.
	+ The tuple of color should be in RGB order. Default: (61, 102, 255).
	+ gt_text_color (list[tuple] \| tuple \| str \| None): Colors of texts.
	+ If a single color is given, it will be applied to all classes.
	+ The tuple of color should be in RGB order. Default: (200, 200, 200).
	+ gt_mask_color (list[tuple] \| tuple \| str \| None, optional): Colors of
	+ masks. If a single color is given, it will be applied to all classes.
	+ The tuple of color should be in RGB order. Default: (61, 102, 255).
	+ det_bbox_color (list[tuple] \| tuple \| str \| None):Colors of bbox lines.
	+ If a single color is given, it will be applied to all classes.
	+ The tuple of color should be in RGB order. Default: (241, 101, 72).
	+ det_text_color (list[tuple] \| tuple \| str \| None):Colors of texts.
	+ If a single color is given, it will be applied to all classes.
	+ The tuple of color should be in RGB order. Default: (200, 200, 200).
	+ det_mask_color (list[tuple] \| tuple \| str \| None, optional): Color of
	+ masks. If a single color is given, it will be applied to all classes.
	+ The tuple of color should be in RGB order. Default: (241, 101, 72).
	+ thickness (int): Thickness of lines. Default: 2.
	+ font_size (int): Font size of texts. Default: 13.
	+ win_name (str): The window name. Default: ''.
	+ show (bool): Whether to show the image. Default: True.
	wait_time (float): Value of waitKey param. Default: 0.
	out_file (str, optional): The filename to write the image.
	- Default: None
	+ Default: None.

	Returns:
	ndarray: The image with bboxes or masks drawn on it.
	"""
	assert 'gt_bboxes' in annotation
	assert 'gt_labels' in annotation
	- assert isinstance(
	- result,
	- (tuple, list)), f'Expected tuple or list, but get {type(result)}'
	+ assert isinstance(result, (tuple, list, dict)), 'Expected ' \
	+ f'tuple or list or dict, but get {type(result)}'

	+ gt_bboxes = annotation['gt_bboxes']
	+ gt_labels = annotation['gt_labels']
	gt_masks = annotation.get('gt_masks', None)
	if gt_masks is not None:
	gt_masks = mask2ndarray(gt_masks)

	+ gt_seg = annotation.get('gt_semantic_seg', None)
	+ if gt_seg is not None:
	+ pad_value = 255 # the padding value of gt_seg
	+ sem_labels = np.unique(gt_seg)
	+ all_labels = np.concatenate((gt_labels, sem_labels), axis=0)
	+ all_labels, counts = np.unique(all_labels, return_counts=True)
	+ stuff_labels = all_labels[np.logical_and(counts < 2,
	+ all_labels != pad_value)]
	+ stuff_masks = gt_seg[None] == stuff_labels[:, None, None]
	+ gt_labels = np.concatenate((gt_labels, stuff_labels), axis=0)
	+ gt_masks = np.concatenate((gt_masks, stuff_masks.astype(np.uint8)),
	+ axis=0)
	+ # If you need to show the bounding boxes,
	+ # please comment the following line
	+ # gt_bboxes = None
	+
	img = mmcv.imread(img)

	img = imshow_det_bboxes(
	img,
	- annotation['gt_bboxes'],
	- annotation['gt_labels'],
	+ gt_bboxes,
	+ gt_labels,
	gt_masks,
	class_names=class_names,
	bbox_color=gt_bbox_color,
	@@ -264,25 +472,38 @@ def imshow_gt_det_bboxes(img,
	win_name=win_name,
	show=False)

	- if isinstance(result, tuple):
	- bbox_result, segm_result = result
	- if isinstance(segm_result, tuple):
	- segm_result = segm_result[0] # ms rcnn
	+ if not isinstance(result, dict):
	+ if isinstance(result, tuple):
	+ bbox_result, segm_result = result
	+ if isinstance(segm_result, tuple):
	+ segm_result = segm_result[0] # ms rcnn
	+ else:
	+ bbox_result, segm_result = result, None
	+
	+ bboxes = np.vstack(bbox_result)
	+ labels = [
	+ np.full(bbox.shape[0], i, dtype=np.int32)
	+ for i, bbox in enumerate(bbox_result)
	+ ]
	+ labels = np.concatenate(labels)
	+
	+ segms = None
	+ if segm_result is not None and len(labels) > 0: # non empty
	+ segms = mmcv.concat_list(segm_result)
	+ segms = mask_util.decode(segms)
	+ segms = segms.transpose(2, 0, 1)
	else:
	- bbox_result, segm_result = result, None
	-
	- bboxes = np.vstack(bbox_result)
	- labels = [
	- np.full(bbox.shape[0], i, dtype=np.int32)
	- for i, bbox in enumerate(bbox_result)
	- ]
	- labels = np.concatenate(labels)
	-
	- segms = None
	- if segm_result is not None and len(labels) > 0: # non empty
	- segms = mmcv.concat_list(segm_result)
	- segms = mask_util.decode(segms)
	- segms = segms.transpose(2, 0, 1)
	+ assert class_names is not None, 'We need to know the number ' \
	+ 'of classes.'
	+ VOID = len(class_names)
	+ bboxes = None
	+ pan_results = result['pan_results']
	+ # keep objects ahead
	+ ids = np.unique(pan_results)[::-1]
	+ legal_indices = ids != VOID
	+ ids = ids[legal_indices]
	+ labels = np.array([id % INSTANCE_OFFSET for id in ids], dtype=np.int64)
	+ segms = (pan_results[None] == ids[:, None, None])

	img = imshow_det_bboxes(
	img,