# MaskFormer configuration using the "D2SwinTransformer" backbone.
# Only the keys listed here are set in this file; `_BASE_` names the parent
# config this file builds on (how the two are merged is up to the consuming
# config loader).
_BASE_: ../maskformer_R50_bs16_160k.yaml

MODEL:
  BACKBONE:
    NAME: "D2SwinTransformer"
  SWIN:
    EMBED_DIM: 128
    DEPTHS: [2, 2, 18, 2]
    NUM_HEADS: [4, 8, 16, 32]
    WINDOW_SIZE: 12
    APE: False
    DROP_PATH_RATE: 0.3
    PATCH_NORM: True
    PRETRAIN_IMG_SIZE: 384
  # Relative path to the pretrained checkpoint.
  WEIGHTS: "pretrained_weights/swin_base_patch4_window12_384_22k.pkl"
  PIXEL_MEAN: [123.675, 116.280, 103.530]
  PIXEL_STD: [58.395, 57.120, 57.375]

SOLVER:
  BASE_LR: 0.00006
  WARMUP_FACTOR: 1e-6
  WARMUP_ITERS: 1500
  WEIGHT_DECAY: 0.01
  WEIGHT_DECAY_NORM: 0.0
  WEIGHT_DECAY_EMBED: 0.0
  BACKBONE_MULTIPLIER: 1.0

INPUT:
  # Literal form of [int(x * 0.1 * 640) for x in range(5, 21)], i.e. 320 to
  # 1280 in steps of 64. Written out as plain YAML instead of a
  # `!!python/object/apply:eval` tag so the file loads with a safe loader and
  # no code is executed at parse time.
  MIN_SIZE_TRAIN: [320, 384, 448, 512, 576, 640, 704, 768,
                   832, 896, 960, 1024, 1088, 1152, 1216, 1280]
  MIN_SIZE_TRAIN_SAMPLING: "choice"
  MIN_SIZE_TEST: 640
  MAX_SIZE_TRAIN: 2560
  MAX_SIZE_TEST: 2560
  CROP:
    ENABLED: True
    TYPE: "absolute"
    # NOTE(review): to YAML this is a plain string, not a sequence; presumably
    # the config loader converts it to a tuple - confirm before changing it.
    SIZE: (640, 640)
    SINGLE_CATEGORY_MAX_AREA: 1.0
  COLOR_AUG_SSD: True
  SIZE_DIVISIBILITY: 640  # used in dataset mapper
  FORMAT: "RGB"

TEST:
  EVAL_PERIOD: 5000
  AUG:
    ENABLED: False
    MIN_SIZES: [320, 480, 640, 800, 960, 1120]
    MAX_SIZE: 4480
    FLIP: True