# Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved. import unittest import torch import detectron2.model_zoo as model_zoo from detectron2.config import get_cfg from detectron2.modeling import build_model from detectron2.structures import BitMasks, Boxes, ImageList, Instances from detectron2.utils.events import EventStorage def get_model_zoo(config_path): """ Like model_zoo.get, but do not load any weights (even pretrained) """ cfg_file = model_zoo.get_config_file(config_path) cfg = get_cfg() cfg.merge_from_file(cfg_file) if not torch.cuda.is_available(): cfg.MODEL.DEVICE = "cpu" return build_model(cfg) def create_model_input(img, inst=None): if inst is not None: return {"image": img, "instances": inst} else: return {"image": img} def get_empty_instance(h, w): inst = Instances((h, w)) inst.gt_boxes = Boxes(torch.rand(0, 4)) inst.gt_classes = torch.tensor([]).to(dtype=torch.int64) inst.gt_masks = BitMasks(torch.rand(0, h, w)) return inst def get_regular_bitmask_instances(h, w): inst = Instances((h, w)) inst.gt_boxes = Boxes(torch.rand(3, 4)) inst.gt_boxes.tensor[:, 2:] += inst.gt_boxes.tensor[:, :2] inst.gt_classes = torch.tensor([3, 4, 5]).to(dtype=torch.int64) inst.gt_masks = BitMasks((torch.rand(3, h, w) > 0.5)) return inst class ModelE2ETest: def setUp(self): torch.manual_seed(43) self.model = get_model_zoo(self.CONFIG_PATH) def _test_eval(self, input_sizes): inputs = [create_model_input(torch.rand(3, s[0], s[1])) for s in input_sizes] self.model.eval() self.model(inputs) def _test_train(self, input_sizes, instances): assert len(input_sizes) == len(instances) inputs = [ create_model_input(torch.rand(3, s[0], s[1]), inst) for s, inst in zip(input_sizes, instances) ] self.model.train() with EventStorage(): losses = self.model(inputs) sum(losses.values()).backward() del losses def _inf_tensor(self, *shape): return 1.0 / torch.zeros(*shape, device=self.model.device) def _nan_tensor(self, *shape): return torch.zeros(*shape, device=self.model.device).fill_(float("nan")) def test_empty_data(self): instances = [get_empty_instance(200, 250), get_empty_instance(200, 249)] self._test_eval([(200, 250), (200, 249)]) self._test_train([(200, 250), (200, 249)], instances) @unittest.skipIf(not torch.cuda.is_available(), "CUDA unavailable") def test_eval_tocpu(self): model = get_model_zoo(self.CONFIG_PATH).cpu() model.eval() input_sizes = [(200, 250), (200, 249)] inputs = [create_model_input(torch.rand(3, s[0], s[1])) for s in input_sizes] model(inputs) class MaskRCNNE2ETest(ModelE2ETest, unittest.TestCase): CONFIG_PATH = "COCO-InstanceSegmentation/mask_rcnn_R_50_FPN_1x.yaml" def test_half_empty_data(self): instances = [get_empty_instance(200, 250), get_regular_bitmask_instances(200, 249)] self._test_train([(200, 250), (200, 249)], instances) # This test is flaky because in some environment the output features are zero due to relu # def test_rpn_inf_nan_data(self): # self.model.eval() # for tensor in [self._inf_tensor, self._nan_tensor]: # images = ImageList(tensor(1, 3, 512, 512), [(510, 510)]) # features = { # "p2": tensor(1, 256, 256, 256), # "p3": tensor(1, 256, 128, 128), # "p4": tensor(1, 256, 64, 64), # "p5": tensor(1, 256, 32, 32), # "p6": tensor(1, 256, 16, 16), # } # props, _ = self.model.proposal_generator(images, features) # self.assertEqual(len(props[0]), 0) def test_roiheads_inf_nan_data(self): self.model.eval() for tensor in [self._inf_tensor, self._nan_tensor]: images = ImageList(tensor(1, 3, 512, 512), [(510, 510)]) features = { "p2": tensor(1, 256, 256, 256), "p3": tensor(1, 256, 128, 128), "p4": tensor(1, 256, 64, 64), "p5": tensor(1, 256, 32, 32), "p6": tensor(1, 256, 16, 16), } props = [Instances((510, 510))] props[0].proposal_boxes = Boxes([[10, 10, 20, 20]]).to(device=self.model.device) props[0].objectness_logits = torch.tensor([1.0]).reshape(1, 1) det, _ = self.model.roi_heads(images, features, props) self.assertEqual(len(det[0]), 0) class RetinaNetE2ETest(ModelE2ETest, unittest.TestCase): CONFIG_PATH = "COCO-Detection/retinanet_R_50_FPN_1x.yaml" def test_inf_nan_data(self): self.model.eval() self.model.score_threshold = -999999999 for tensor in [self._inf_tensor, self._nan_tensor]: images = ImageList(tensor(1, 3, 512, 512), [(510, 510)]) features = [ tensor(1, 256, 128, 128), tensor(1, 256, 64, 64), tensor(1, 256, 32, 32), tensor(1, 256, 16, 16), tensor(1, 256, 8, 8), ] anchors = self.model.anchor_generator(features) box_cls, box_delta = self.model.head(features) box_cls = [tensor(*k.shape) for k in box_cls] box_delta = [tensor(*k.shape) for k in box_delta] det = self.model.inference(box_cls, box_delta, anchors, images.image_sizes) # all predictions (if any) are infinite or nan if len(det[0]): self.assertTrue(torch.isfinite(det[0].pred_boxes.tensor).sum() == 0)