File size: 1,818 Bytes
f57daf4 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 |
{
  "_name_or_path": "google/owlvit-base-patch32",
  "architectures": [
    "OwlViTForObjectDetection"
  ],
  "id2label": {
    "0": 6,
    "1": 7,
    "10": 16,
    "11": 17,
    "12": 18,
    "13": 19,
    "14": 20,
    "15": 21,
    "16": 22,
    "17": 23,
    "18": 24,
    "19": 25,
    "2": 8,
    "20": 26,
    "21": 27,
    "22": 28,
    "23": 29,
    "24": 30,
    "25": 31,
    "26": 32,
    "27": 33,
    "28": 34,
    "29": 37,
    "3": 9,
    "30": 38,
    "31": 40,
    "32": 41,
    "33": 42,
    "34": 43,
    "35": 44,
    "36": 45,
    "37": 46,
    "38": 47,
    "39": 48,
    "4": 10,
    "5": 11,
    "6": 12,
    "7": 13,
    "8": 14,
    "9": 15
  },
  "initializer_factor": 1.0,
  "label2id": {
    "6": 0,
    "7": 1,
    "8": 2,
    "9": 3,
    "10": 4,
    "11": 5,
    "12": 6,
    "13": 7,
    "14": 8,
    "15": 9,
    "16": 10,
    "17": 11,
    "18": 12,
    "19": 13,
    "20": 14,
    "21": 15,
    "22": 16,
    "23": 17,
    "24": 18,
    "25": 19,
    "26": 20,
    "27": 21,
    "28": 22,
    "29": 23,
    "30": 24,
    "31": 25,
    "32": 26,
    "33": 27,
    "34": 28,
    "37": 29,
    "38": 30,
    "40": 31,
    "41": 32,
    "42": 33,
    "43": 34,
    "44": 35,
    "45": 36,
    "46": 37,
    "47": 38,
    "48": 39
  },
  "logit_scale_init_value": 2.6592,
  "model_type": "owlvit",
  "projection_dim": 512,
  "text_config": {
    "bos_token_id": 0,
    "dropout": 0.0,
    "eos_token_id": 2,
    "max_length": 16,
    "model_type": "owlvit_text_model",
    "pad_token_id": 1
  },
  "text_config_dict": null,
  "torch_dtype": "float32",
  "transformers_version": "4.38.2",
  "vision_config": {
    "dropout": 0.0,
    "model_type": "owlvit_vision_model"
  },
  "vision_config_dict": null
}
|