{ "_name_or_path": "microsoft/conditional-detr-resnet-50", "activation_dropout": 0.0, "activation_function": "relu", "architectures": [ "ConditionalDetrForObjectDetection" ], "attention_dropout": 0.0, "auxiliary_loss": false, "backbone": "resnet50", "backbone_config": null, "bbox_cost": 5, "bbox_loss_coefficient": 5, "class_cost": 2, "cls_loss_coefficient": 2, "d_model": 256, "decoder_attention_heads": 8, "decoder_ffn_dim": 2048, "decoder_layerdrop": 0.0, "decoder_layers": 6, "dice_loss_coefficient": 1, "dilation": false, "dropout": 0.1, "encoder_attention_heads": 8, "encoder_ffn_dim": 2048, "encoder_layerdrop": 0.0, "encoder_layers": 6, "focal_alpha": 0.25, "giou_cost": 2, "giou_loss_coefficient": 2, "id2label": { "0": "price", "1": "title", "2": "image" }, "init_std": 0.02, "init_xavier_std": 1.0, "is_encoder_decoder": true, "label2id": { "image": 2, "price": 0, "title": 1 }, "mask_loss_coefficient": 1, "max_position_embeddings": 1024, "model_type": "conditional_detr", "num_channels": 3, "num_hidden_layers": 6, "num_queries": 20, "position_embedding_type": "sine", "scale_embedding": false, "torch_dtype": "float32", "transformers_version": "4.30.0.dev0", "use_pretrained_backbone": true, "use_timm_backbone": true }