{
  "_name_or_path": "google/owlvit-base-patch32",
  "architectures": [
    "OwlViTForObjectDetection"
  ],
  "id2label": {
    "0": "6",
    "1": "7",
    "2": "8",
    "3": "9",
    "4": "10",
    "5": "11",
    "6": "12",
    "7": "13",
    "8": "14",
    "9": "15",
    "10": "16",
    "11": "17",
    "12": "18",
    "13": "19",
    "14": "20",
    "15": "21",
    "16": "22",
    "17": "23",
    "18": "24",
    "19": "25",
    "20": "26",
    "21": "27",
    "22": "28",
    "23": "29",
    "24": "30",
    "25": "31",
    "26": "32",
    "27": "33",
    "28": "34",
    "29": "37",
    "30": "38",
    "31": "40",
    "32": "41",
    "33": "42",
    "34": "43",
    "35": "44",
    "36": "45",
    "37": "46",
    "38": "47",
    "39": "48"
  },
  "initializer_factor": 1.0,
  "label2id": {
    "6": 0,
    "7": 1,
    "8": 2,
    "9": 3,
    "10": 4,
    "11": 5,
    "12": 6,
    "13": 7,
    "14": 8,
    "15": 9,
    "16": 10,
    "17": 11,
    "18": 12,
    "19": 13,
    "20": 14,
    "21": 15,
    "22": 16,
    "23": 17,
    "24": 18,
    "25": 19,
    "26": 20,
    "27": 21,
    "28": 22,
    "29": 23,
    "30": 24,
    "31": 25,
    "32": 26,
    "33": 27,
    "34": 28,
    "37": 29,
    "38": 30,
    "40": 31,
    "41": 32,
    "42": 33,
    "43": 34,
    "44": 35,
    "45": 36,
    "46": 37,
    "47": 38,
    "48": 39
  },
  "logit_scale_init_value": 2.6592,
  "model_type": "owlvit",
  "projection_dim": 512,
  "text_config": {
    "bos_token_id": 0,
    "dropout": 0.0,
    "eos_token_id": 2,
    "max_length": 16,
    "model_type": "owlvit_text_model",
    "pad_token_id": 1
  },
  "text_config_dict": null,
  "torch_dtype": "float32",
  "transformers_version": "4.38.2",
  "vision_config": {
    "dropout": 0.0,
    "model_type": "owlvit_vision_model"
  },
  "vision_config_dict": null
}