show / mmdetection-2.26.0 /mmdet /core /utils /misc.py

thanks to show ❤

3bbb319 over 2 years ago

7.15 kB

	# Copyright (c) OpenMMLab. All rights reserved.
	from functools import partial

	import numpy as np
	import torch
	from six.moves import map, zip

	from ..mask.structures import BitmapMasks, PolygonMasks


	def multi_apply(func, *args, **kwargs):
	    """Apply function to a list of arguments.

	    Note:
	        This function applies the ``func`` to multiple inputs and
	        maps the multiple outputs of the ``func`` into different
	        lists. Each list contains the same type of outputs corresponding
	        to different inputs.

	    Args:
	        func (Function): A function that will be applied to a list of
	            arguments. It must return an iterable (e.g. a tuple) with the
	            same number of items on every call.
	        *args: One iterable per positional parameter of ``func``. They are
	            consumed in lockstep: the i-th call receives the i-th element
	            of every iterable.
	        **kwargs: Keyword arguments that are bound once and passed
	            unchanged to every call of ``func``.

	    Returns:
	        tuple(list): A tuple containing multiple lists, each list contains
	            a kind of returned results by the function. An empty tuple is
	            returned when the inputs yield no calls.
	    """
	    # Bind the shared keyword arguments once instead of on every call.
	    pfunc = partial(func, **kwargs) if kwargs else func
	    map_results = map(pfunc, *args)
	    # Transpose: [(a0, b0), (a1, b1), ...] -> ([a0, a1, ...], [b0, b1, ...])
	    return tuple(map(list, zip(*map_results)))


	def unmap(data, count, inds, fill=0):
	    """Scatter a subset of items back into a container of ``count`` items.

	    A new tensor with ``count`` entries along the first dimension is created
	    from ``data`` (via ``new_full``) and filled with ``fill``. The rows
	    selected by ``inds`` (interpreted as a boolean mask) are then overwritten
	    with ``data``.

	    Args:
	        data (Tensor): The subset of items to place back.
	        count (int): Size of the first dimension of the result.
	        inds (Tensor): Mask over the ``count`` positions; it is converted to
	            ``torch.bool`` before indexing.
	        fill (int | float): Value used for the unselected positions.
	            Default 0.

	    Returns:
	        Tensor: The filled tensor; trailing dimensions match ``data``.
	    """
	    selector = inds.type(torch.bool)

	    if data.dim() == 1:
	        restored = data.new_full((count, ), fill)
	        restored[selector] = data
	        return restored

	    # Keep every trailing dimension of ``data``; only the first one grows.
	    full_shape = (count, ) + data.size()[1:]
	    restored = data.new_full(full_shape, fill)
	    restored[selector, :] = data
	    return restored


	def mask2ndarray(mask):
	    """Convert a mask to a numpy ndarray.

	    Args:
	        mask (:obj:`BitmapMasks` or :obj:`PolygonMasks` or
	            torch.Tensor or np.ndarray): The mask to be converted.

	    Returns:
	        np.ndarray: The converted mask. Mask structures are converted with
	            their ``to_ndarray()`` method, tensors are detached and moved to
	            the CPU, and ndarrays are returned unchanged. The result is
	            expected to have shape (n, h, w); tensors and arrays are not
	            reshaped here.

	    Raises:
	        TypeError: If ``mask`` is none of the supported types.
	    """
	    if isinstance(mask, (BitmapMasks, PolygonMasks)):
	        return mask.to_ndarray()
	    if isinstance(mask, torch.Tensor):
	        return mask.detach().cpu().numpy()
	    if isinstance(mask, np.ndarray):
	        return mask
	    raise TypeError(f'Unsupported {type(mask)} data type')


	def flip_tensor(src_tensor, flip_direction):
	    """Flip a 4D tensor according to ``flip_direction``.

	    Args:
	        src_tensor (Tensor): Input feature map, shape (B, C, H, W).
	        flip_direction (str): The flipping direction. Options are
	            'horizontal' (reverse dim 3), 'vertical' (reverse dim 2) and
	            'diagonal' (reverse dims 2 and 3).

	    Returns:
	        out_tensor (Tensor): Flipped tensor.
	    """
	    assert src_tensor.ndim == 4
	    assert flip_direction in ['horizontal', 'vertical', 'diagonal']

	    # Choose the axes to reverse, then flip once.
	    if flip_direction == 'horizontal':
	        flip_dims = [3]
	    elif flip_direction == 'vertical':
	        flip_dims = [2]
	    else:
	        flip_dims = [2, 3]
	    return torch.flip(src_tensor, flip_dims)


	def select_single_mlvl(mlvl_tensors, batch_id, detach=True):
	    """Pick one image's tensors out of a multi-level batch of tensors.

	    Note: The default value of detach is True, because the proposal gradient
	    needs to be detached during the training of the two-stage model. E.g
	    Cascade Mask R-CNN.

	    Args:
	        mlvl_tensors (list[Tensor]): Batch tensor for all scale levels,
	            each is a 4D-tensor.
	        batch_id (int): Batch index.
	        detach (bool): Whether detach gradient. Default True.

	    Returns:
	        list[Tensor]: Multi-scale single image tensor, one entry per level
	            in the same order as ``mlvl_tensors``.
	    """
	    assert isinstance(mlvl_tensors, (list, tuple))

	    # Index every level at the requested batch position.
	    per_level = [level[batch_id] for level in mlvl_tensors]
	    if detach:
	        per_level = [tensor.detach() for tensor in per_level]
	    return per_level


	def filter_scores_and_topk(scores, score_thr, topk, results=None):
	    """Keep the highest-scoring candidates that exceed a score threshold.

	    Args:
	        scores (Tensor): The scores, shape (num_bboxes, K).
	        score_thr (float): The score filter threshold. Only scores strictly
	            greater than it are kept.
	        topk (int): The maximum number of candidates to keep.
	        results (dict or list or Tensor, Optional): The results to
	            which the filtering rule is to be applied. The shape
	            of each item is (num_bboxes, N).

	    Returns:
	        tuple: Filtered results

	            - scores (Tensor): The scores after being filtered, sorted in
	              descending order, shape (num_bboxes_filtered, ).
	            - labels (Tensor): The class labels (column index of each kept
	              score), shape (num_bboxes_filtered, ).
	            - anchor_idxs (Tensor): The anchor indexes (row index of each
	              kept score), shape (num_bboxes_filtered, ).
	            - filtered_results (dict or list or Tensor, Optional):
	              The filtered results. The shape of each item is
	              (num_bboxes_filtered, N). ``None`` when ``results`` is None.

	    Raises:
	        NotImplementedError: If ``results`` is given but is not a dict,
	            list or Tensor.
	    """
	    above_thr = scores > score_thr
	    candidate_scores = scores[above_thr]
	    # Each row is the (row, column) position of one surviving score.
	    candidate_idxs = torch.nonzero(above_thr)

	    limit = min(topk, candidate_idxs.size(0))
	    # torch.sort is actually faster than .topk (at least on GPUs)
	    ranked_scores, order = candidate_scores.sort(descending=True)
	    top_scores = ranked_scores[:limit]
	    keep_idxs, labels = candidate_idxs[order[:limit]].unbind(dim=1)

	    if results is None:
	        filtered_results = None
	    elif isinstance(results, dict):
	        filtered_results = {
	            key: value[keep_idxs] for key, value in results.items()
	        }
	    elif isinstance(results, list):
	        filtered_results = [item[keep_idxs] for item in results]
	    elif isinstance(results, torch.Tensor):
	        filtered_results = results[keep_idxs]
	    else:
	        raise NotImplementedError(f'Only supports dict or list or Tensor, '
	                                  f'but get {type(results)}.')
	    return top_scores, labels, keep_idxs, filtered_results


	def center_of_mass(mask, esp=1e-6):
	    """Compute the centroid of a 2D mask.

	    Each coordinate is the mask-weighted sum of the row (or column) indices
	    divided by the total mask mass.

	    Args:
	        mask (Tensor): The mask to be calculated, shape (h, w).
	        esp (float): Lower bound applied to the mask sum to avoid dividing
	            by zero. Default: 1e-6.

	    Returns:
	        tuple[Tensor]: the coordinates of the center point of the mask.

	            - center_h (Tensor): the center point of the height.
	            - center_w (Tensor): the center point of the width.
	    """
	    height, width = mask.shape
	    # Column vector of row indices, broadcast across the mask's columns.
	    row_index = torch.arange(height, device=mask.device).unsqueeze(1)
	    # Row vector of column indices, broadcast across the mask's rows.
	    col_index = torch.arange(width, device=mask.device)

	    total_mass = mask.sum().float().clamp(min=esp)
	    center_h = (mask * row_index).sum() / total_mass
	    center_w = (mask * col_index).sum() / total_mass
	    return center_h, center_w


	def generate_coordinate(featmap_sizes, device='cuda'):
	    """Generate a normalized coordinate feature map.

	    Args:
	        featmap_sizes (tuple): The size of the feature map the coordinates
	            are generated for. Only the first entry (batch size) and the
	            last two entries (spatial sizes) are read.
	        device (str): The device where the feature will be put on.
	            Default 'cuda'.

	    Returns:
	        coord_feat (Tensor): The coordinate feature, of shape
	            (featmap_sizes[0], 2, featmap_sizes[-2], featmap_sizes[-1]).
	            Channel 0 runs linearly from -1 to 1 along the last dimension
	            and channel 1 runs from -1 to 1 along the second-to-last one.
	    """
	    batch_size = featmap_sizes[0]
	    last_axis = torch.linspace(-1, 1, featmap_sizes[-1], device=device)
	    second_last_axis = torch.linspace(
	        -1, 1, featmap_sizes[-2], device=device)

	    grid_y, grid_x = torch.meshgrid(second_last_axis, last_axis)

	    # Prepend batch and channel dimensions; -1 keeps the grid's own sizes.
	    target_shape = [batch_size, 1, -1, -1]
	    grid_y = grid_y.expand(target_shape)
	    grid_x = grid_x.expand(target_shape)
	    return torch.cat([grid_x, grid_y], 1)