# Overrides applied on top of the base config named in _BASE_:
# selects the D2DiNAT backbone with the dinat_large 11x11 checkpoint,
# 250 object queries, and 640-pixel training crops.
_BASE_: oneformer_R50_bs16_160k.yaml

MODEL:
  BACKBONE:
    NAME: "D2DiNAT"
  DiNAT:
    EMBED_DIM: 192
    MLP_RATIO: 2.0
    DEPTHS: [3, 4, 18, 5]
    NUM_HEADS: [6, 12, 24, 48]
    KERNEL_SIZE: 11
    DROP_PATH_RATE: 0.3
    # Four lists whose lengths (3, 4, 18, 5) match the DEPTHS entries;
    # presumably one dilation value per block of each stage -- TODO confirm.
    DILATIONS:
      - [1, 20, 1]
      - [1, 5, 1, 10]
      - [1, 2, 1, 3, 1, 4, 1, 5, 1, 2, 1, 3, 1, 4, 1, 5, 1, 5]
      - [1, 2, 1, 2, 1]
  WEIGHTS: "dinat_large_in22k_in1k_384_11x11.pkl"
  PIXEL_MEAN: [123.675, 116.280, 103.530]
  PIXEL_STD: [58.395, 57.120, 57.375]
  ONE_FORMER:
    NUM_OBJECT_QUERIES: 250

SOLVER:
  AMP:
    ENABLED: False

INPUT:
  # NOTE(review): this Python-specific tag runs eval() at load time, so the
  # file cannot be read by a safe YAML loader and must only be loaded from a
  # trusted source. The expression yields 320, 384, ..., 1280 (steps of 64).
  MIN_SIZE_TRAIN: !!python/object/apply:eval ["[int(x * 0.1 * 640) for x in range(5, 21)]"]
  MIN_SIZE_TRAIN_SAMPLING: "choice"
  MIN_SIZE_TEST: 640
  MAX_SIZE_TRAIN: 2560
  MAX_SIZE_TEST: 2560
  CROP:
    ENABLED: True
    TYPE: "absolute"
    # Plain scalar: YAML reads this as the string "(640, 640)"; the consuming
    # config system is expected to convert it -- verify against the loader.
    SIZE: (640, 640)
    SINGLE_CATEGORY_MAX_AREA: 1.0
  COLOR_AUG_SSD: True
  SIZE_DIVISIBILITY: 640  # used in dataset mapper
  FORMAT: "RGB"

TEST:
  DETECTIONS_PER_IMAGE: 250
  EVAL_PERIOD: 5000
  # Test-time augmentation settings; switched off by ENABLED below.
  AUG:
    ENABLED: False
    MIN_SIZES: [320, 480, 640, 800, 960, 1120]
    MAX_SIZE: 4480
    FLIP: True