{
  "_name_or_path": "rafaelpadilla/porting_rt_detr",
  "act_encoder": "silu",
  "architectures": [
    "RTDetrModel"
  ],
  "backbone_config": {
    "backbone": "resnet50d",
    "freeze_batch_norm_2d": true,
    "model_type": "timm_backbone",
    "out_indices": [
      2,
      3,
      4
    ]
  },
  "batch_norm_eps": 1e-05,
  "box_noise_scale": 1.0,
  "dim_feedforward": 1024,
  "dropout": 0.0,
  "encode_proj_layers": [
    2
  ],
  "encoder_attention_heads": 8,
  "eos_coefficient": 0.1,
  "eval_idx": -1,
  "eval_size": null,
  "eval_spatial_size": [
    640,
    640
  ],
  "feat_channels": [
    256,
    256,
    256
  ],
  "feat_strides": [
    8,
    16,
    32
  ],
  "focal_loss_alpha": 0.75,
  "focal_loss_gamma": 2.0,
  "hidden_dim": 256,
  "id2label": {
    "0": "person",
    "1": "bicycle",
    "2": "car",
    "3": "motorcycle",
    "4": "airplane",
    "5": "bus",
    "6": "train",
    "7": "truck",
    "8": "boat",
    "9": "traffic light",
    "10": "fire hydrant",
    "11": "stop sign",
    "12": "parking meter",
    "13": "bench",
    "14": "bird",
    "15": "cat",
    "16": "dog",
    "17": "horse",
    "18": "sheep",
    "19": "cow",
    "20": "elephant",
    "21": "bear",
    "22": "zebra",
    "23": "giraffe",
    "24": "backpack",
    "25": "umbrella",
    "26": "handbag",
    "27": "tie",
    "28": "suitcase",
    "29": "frisbee",
    "30": "skis",
    "31": "snowboard",
    "32": "sports ball",
    "33": "kite",
    "34": "baseball bat",
    "35": "baseball glove",
    "36": "skateboard",
    "37": "surfboard",
    "38": "tennis racket",
    "39": "bottle",
    "40": "wine glass",
    "41": "cup",
    "42": "fork",
    "43": "knife",
    "44": "spoon",
    "45": "bowl",
    "46": "banana",
    "47": "apple",
    "48": "sandwich",
    "49": "orange",
    "50": "broccoli",
    "51": "carrot",
    "52": "hot dog",
    "53": "pizza",
    "54": "donut",
    "55": "cake",
    "56": "chair",
    "57": "couch",
    "58": "potted plant",
    "59": "bed",
    "60": "dining table",
    "61": "toilet",
    "62": "tv",
    "63": "laptop",
    "64": "mouse",
    "65": "remote",
    "66": "keyboard",
    "67": "cell phone",
    "68": "microwave",
    "69": "oven",
    "70": "toaster",
    "71": "sink",
    "72": "refrigerator",
    "73": "book",
    "74": "clock",
    "75": "vase",
    "76": "scissors",
    "77": "teddy bear",
    "78": "hair drier",
    "79": "toothbrush"
  },
  "image_size": [
    640,
    640
  ],
  "initializer_range": 0.02,
  "label2id": {
    "airplane": 4,
    "apple": 47,
    "backpack": 24,
    "banana": 46,
    "baseball bat": 34,
    "baseball glove": 35,
    "bear": 21,
    "bed": 59,
    "bench": 13,
    "bicycle": 1,
    "bird": 14,
    "boat": 8,
    "book": 73,
    "bottle": 39,
    "bowl": 45,
    "broccoli": 50,
    "bus": 5,
    "cake": 55,
    "car": 2,
    "carrot": 51,
    "cat": 15,
    "cell phone": 67,
    "chair": 56,
    "clock": 74,
    "couch": 57,
    "cow": 19,
    "cup": 41,
    "dining table": 60,
    "dog": 16,
    "donut": 54,
    "elephant": 20,
    "fire hydrant": 10,
    "fork": 42,
    "frisbee": 29,
    "giraffe": 23,
    "hair drier": 78,
    "handbag": 26,
    "horse": 17,
    "hot dog": 52,
    "keyboard": 66,
    "kite": 33,
    "knife": 43,
    "laptop": 63,
    "microwave": 68,
    "motorcycle": 3,
    "mouse": 64,
    "orange": 49,
    "oven": 69,
    "parking meter": 12,
    "person": 0,
    "pizza": 53,
    "potted plant": 58,
    "refrigerator": 72,
    "remote": 65,
    "sandwich": 48,
    "scissors": 76,
    "sheep": 18,
    "sink": 71,
    "skateboard": 36,
    "skis": 30,
    "snowboard": 31,
    "spoon": 44,
    "sports ball": 32,
    "stop sign": 11,
    "suitcase": 28,
    "surfboard": 37,
    "teddy bear": 77,
    "tennis racket": 38,
    "tie": 27,
    "toaster": 70,
    "toilet": 61,
    "toothbrush": 79,
    "traffic light": 9,
    "train": 6,
    "truck": 7,
    "tv": 62,
    "umbrella": 25,
    "vase": 75,
    "wine glass": 40,
    "zebra": 22
  },
  "label_noise_ratio": 0.5,
  "layer_norm_eps": 1e-05,
  "learnt_init_query": false,
  "matcher_alpha": 0.25,
  "matcher_bbox_cost": 5.0,
  "matcher_class_cost": 2.0,
  "matcher_gamma": 2.0,
  "matcher_giou_cost": 2.0,
  "model_type": "rt_detr",
  "normalize_before": false,
  "num_classes": 80,
  "num_decoder_layers": 6,
  "num_decoder_points": 4,
  "num_denoising": 100,
  "num_encoder_layers": 1,
  "num_levels": 3,
  "num_queries": 300,
  "pe_temperature": 10000,
  "torch_dtype": "float32",
  "transformers_version": "4.36.0.dev0",
  "use_aux_loss": true,
  "use_encoder_idx": [
    2
  ],
  "use_focal_loss": true,
  "weight_loss_bbox": 5.0,
  "weight_loss_giou": 2.0,
  "weight_loss_vfl": 1.0
}