MODEL: META_ARCHITECTURE: "DeformableDetr" WEIGHTS: "detectron2://ImageNetPretrained/torchvision/R-50.pkl" PIXEL_MEAN: [123.675, 116.280, 103.530] PIXEL_STD: [58.395, 57.120, 57.375] MASK_ON: False RESNETS: DEPTH: 50 STRIDE_IN_1X1: False OUT_FEATURES: ["res3", "res4", "res5"] DETR: CLS_WEIGHT: 2.0 GIOU_WEIGHT: 2.0 L1_WEIGHT: 5.0 NUM_OBJECT_QUERIES: 300 DIM_FEEDFORWARD: 1024 WITH_BOX_REFINE: True TWO_STAGE: True NUM_CLASSES: 1203 USE_FED_LOSS: True DATASETS: TRAIN: ("lvis_v1_train",) TEST: ("lvis_v1_val",) SOLVER: CHECKPOINT_PERIOD: 10000000 USE_CUSTOM_SOLVER: True IMS_PER_BATCH: 32 BASE_LR: 0.0002 STEPS: (150000,) MAX_ITER: 180000 WARMUP_FACTOR: 1.0 WARMUP_ITERS: 10 WEIGHT_DECAY: 0.0001 OPTIMIZER: "ADAMW" BACKBONE_MULTIPLIER: 0.1 CLIP_GRADIENTS: ENABLED: True CLIP_TYPE: "full_model" CLIP_VALUE: 0.01 NORM_TYPE: 2.0 CUSTOM_MULTIPLIER: 0.1 CUSTOM_MULTIPLIER_NAME: ['reference_points', 'sampling_offsets'] INPUT: FORMAT: "RGB" MIN_SIZE_TRAIN: (480, 512, 544, 576, 608, 640, 672, 704, 736, 768, 800) CROP: ENABLED: True TYPE: "absolute_range" SIZE: (384, 600) CUSTOM_AUG: "DETR" TEST: DETECTIONS_PER_IMAGE: 300 DATALOADER: FILTER_EMPTY_ANNOTATIONS: False NUM_WORKERS: 4 SAMPLER_TRAIN: "RepeatFactorTrainingSampler" REPEAT_THRESHOLD: 0.001 OUTPUT_DIR: "output/Detic/auto" VERSION: 2