{ "_name_or_path": "google/owlvit-base-patch32", "architectures": [ "OwlViTForObjectDetection" ], "id2label": { "0": 1, "1": 3, "10": 21, "11": 22, "12": 23, "13": 24, "14": 25, "15": 26, "16": 28, "17": 29, "18": 30, "19": 31, "2": 7, "20": 32, "21": 33, "22": 34, "23": 35, "24": 36, "25": 37, "26": 38, "27": 39, "28": 40, "29": 41, "3": 9, "30": 42, "31": 43, "32": 44, "33": 45, "34": 46, "35": 47, "36": 48, "37": 50, "38": 51, "39": 52, "4": 11, "40": 53, "41": 57, "42": 58, "43": 59, "44": 60, "45": 61, "46": 62, "47": 63, "48": 66, "49": 67, "5": 13, "50": 68, "51": 70, "52": 72, "53": 73, "54": 74, "55": 75, "56": 76, "57": 77, "58": 78, "59": 80, "6": 14, "60": 81, "61": 82, "62": 83, "63": 84, "64": 85, "65": 86, "66": 87, "67": 88, "68": 89, "69": 90, "7": 16, "70": 91, "71": 92, "72": 93, "73": 94, "74": 95, "75": 96, "76": 97, "77": 98, "78": 99, "79": 100, "8": 19, "80": 101, "81": 102, "82": 103, "83": 104, "84": 105, "9": 20 }, "initializer_factor": 1.0, "label2id": { "1": "0", "3": "1", "7": "2", "9": "3", "11": "4", "13": "5", "14": "6", "16": "7", "19": "8", "20": "9", "21": "10", "22": "11", "23": "12", "24": "13", "25": "14", "26": "15", "28": "16", "29": "17", "30": "18", "31": "19", "32": "20", "33": "21", "34": "22", "35": "23", "36": "24", "37": "25", "38": "26", "39": "27", "40": "28", "41": "29", "42": "30", "43": "31", "44": "32", "45": "33", "46": "34", "47": "35", "48": "36", "50": "37", "51": "38", "52": "39", "53": "40", "57": "41", "58": "42", "59": "43", "60": "44", "61": "45", "62": "46", "63": "47", "66": "48", "67": "49", "68": "50", "70": "51", "72": "52", "73": "53", "74": "54", "75": "55", "76": "56", "77": "57", "78": "58", "80": "59", "81": "60", "82": "61", "83": "62", "84": "63", "85": "64", "86": "65", "87": "66", "88": "67", "89": "68", "90": "69", "91": "70", "92": "71", "93": "72", "94": "73", "95": "74", "96": "75", "97": "76", "98": "77", "99": "78", "100": "79", "101": "80", "102": "81", "103": "82", "104": "83", "105": "84" }, "logit_scale_init_value": 2.6592, "model_type": "owlvit", "projection_dim": 512, "text_config": { "bos_token_id": 0, "dropout": 0.0, "eos_token_id": 2, "max_length": 16, "model_type": "owlvit_text_model", "pad_token_id": 1 }, "text_config_dict": null, "torch_dtype": "float32", "transformers_version": "4.41.2", "vision_config": { "dropout": 0.0, "model_type": "owlvit_vision_model" }, "vision_config_dict": null }