{ "_name_or_path": "microsoft/beit-base-patch16-224-pt22k-ft22k", "architectures": [ "BeitForImageClassification" ], "attention_probs_dropout_prob": 0.0, "auxiliary_channels": 256, "auxiliary_concat_input": false, "auxiliary_loss_weight": 0.4, "auxiliary_num_convs": 1, "drop_path_rate": 0.1, "hidden_act": "gelu", "hidden_dropout_prob": 0.0, "hidden_size": 768, "id2label": { "0": "The Eiffel Tower", "1": "The Great Wall of China", "2": "The Mona Lisa", "3": "aircraft carrier", "4": "airplane", "5": "alarm clock", "6": "ambulance", "7": "angel", "8": "animal migration", "9": "ant", "10": "anvil", "11": "apple", "12": "arm", "13": "asparagus", "14": "axe", "15": "backpack", "16": "banana", "17": "bandage", "18": "barn", "19": "baseball", "20": "baseball bat", "21": "basket", "22": "basketball", "23": "bat", "24": "bathtub", "25": "beach", "26": "bear", "27": "beard", "28": "bed", "29": "bee", "30": "belt", "31": "bench", "32": "bicycle", "33": "binoculars", "34": "bird", "35": "birthday cake", "36": "blackberry", "37": "blueberry", "38": "book", "39": "boomerang", "40": "bottlecap", "41": "bowtie", "42": "bracelet", "43": "brain", "44": "bread", "45": "bridge", "46": "broccoli", "47": "broom", "48": "bucket", "49": "bulldozer", "50": "bus", "51": "bush", "52": "butterfly", "53": "cactus", "54": "cake", "55": "calculator", "56": "calendar", "57": "camel", "58": "camera", "59": "camouflage", "60": "campfire", "61": "candle", "62": "cannon", "63": "canoe", "64": "car", "65": "carrot", "66": "castle", "67": "cat", "68": "ceiling fan", "69": "cell phone", "70": "cello", "71": "chair", "72": "chandelier", "73": "church", "74": "circle", "75": "clarinet", "76": "clock", "77": "cloud", "78": "coffee cup", "79": "compass", "80": "computer", "81": "cookie", "82": "cooler", "83": "couch", "84": "cow", "85": "crab", "86": "crayon", "87": "crocodile", "88": "crown", "89": "cruise ship", "90": "cup", "91": "diamond", "92": "dishwasher", "93": "diving board", "94": "dog", "95": "dolphin", "96": "donut", "97": "door", "98": "dragon", "99": "dresser", "100": "drill", "101": "drums", "102": "duck", "103": "dumbbell", "104": "ear", "105": "elbow", "106": "elephant", "107": "envelope", "108": "eraser", "109": "eye", "110": "eyeglasses", "111": "face", "112": "fan", "113": "feather", "114": "fence", "115": "finger", "116": "fire hydrant", "117": "fireplace", "118": "firetruck", "119": "fish", "120": "flamingo", "121": "flashlight", "122": "flip flops", "123": "floor lamp", "124": "flower", "125": "flying saucer", "126": "foot", "127": "fork", "128": "frog", "129": "frying pan", "130": "garden", "131": "garden hose", "132": "giraffe", "133": "goatee", "134": "golf club", "135": "grapes", "136": "grass", "137": "guitar", "138": "hamburger", "139": "hammer", "140": "hand", "141": "harp", "142": "hat", "143": "headphones", "144": "hedgehog", "145": "helicopter", "146": "helmet", "147": "hexagon", "148": "hockey puck", "149": "hockey stick", "150": "horse", "151": "hospital", "152": "hot air balloon", "153": "hot dog", "154": "hot tub", "155": "hourglass", "156": "house", "157": "house plant", "158": "hurricane", "159": "ice cream", "160": "jacket", "161": "jail", "162": "kangaroo", "163": "key", "164": "keyboard", "165": "knee", "166": "knife", "167": "ladder", "168": "lantern", "169": "laptop", "170": "leaf", "171": "leg", "172": "light bulb", "173": "lighter", "174": "lighthouse", "175": "lightning", "176": "line", "177": "lion", "178": "lipstick", "179": "lobster", "180": "lollipop", "181": "mailbox", "182": "map", "183": "marker", "184": "matches", "185": "megaphone", "186": "mermaid", "187": "microphone", "188": "microwave", "189": "monkey", "190": "moon", "191": "mosquito", "192": "motorbike", "193": "mountain", "194": "mouse", "195": "moustache", "196": "mouth", "197": "mug", "198": "mushroom", "199": "nail", "200": "necklace", "201": "nose", "202": "ocean", "203": "octagon", "204": "octopus", "205": "onion", "206": "oven", "207": "owl", "208": "paint can", "209": "paintbrush", "210": "palm tree", "211": "panda", "212": "pants", "213": "paper clip", "214": "parachute", "215": "parrot", "216": "passport", "217": "peanut", "218": "pear", "219": "peas", "220": "pencil", "221": "penguin", "222": "piano", "223": "pickup truck", "224": "picture frame", "225": "pig", "226": "pillow", "227": "pineapple", "228": "pizza", "229": "pliers", "230": "police car", "231": "pond", "232": "pool", "233": "popsicle", "234": "postcard", "235": "potato", "236": "power outlet", "237": "purse", "238": "rabbit", "239": "raccoon", "240": "radio", "241": "rain", "242": "rainbow", "243": "rake", "244": "remote control", "245": "rhinoceros", "246": "rifle", "247": "river", "248": "roller coaster", "249": "rollerskates", "250": "sailboat", "251": "sandwich", "252": "saw", "253": "saxophone", "254": "school bus", "255": "scissors", "256": "scorpion", "257": "screwdriver", "258": "sea turtle", "259": "see saw", "260": "shark", "261": "sheep", "262": "shoe", "263": "shorts", "264": "shovel", "265": "sink", "266": "skateboard", "267": "skull", "268": "skyscraper", "269": "sleeping bag", "270": "smiley face", "271": "snail", "272": "snake", "273": "snorkel", "274": "snowflake", "275": "snowman", "276": "soccer ball", "277": "sock", "278": "speedboat", "279": "spider", "280": "spoon", "281": "spreadsheet", "282": "square", "283": "squiggle", "284": "squirrel", "285": "stairs", "286": "star", "287": "steak", "288": "stereo", "289": "stethoscope", "290": "stitches", "291": "stop sign", "292": "stove", "293": "strawberry", "294": "streetlight", "295": "string bean", "296": "submarine", "297": "suitcase", "298": "sun", "299": "swan", "300": "sweater", "301": "swing set", "302": "sword", "303": "syringe", "304": "t-shirt", "305": "table", "306": "teapot", "307": "teddy-bear", "308": "telephone", "309": "television", "310": "tennis racquet", "311": "tent", "312": "tiger", "313": "toaster", "314": "toe", "315": "toilet", "316": "tooth", "317": "toothbrush", "318": "toothpaste", "319": "tornado", "320": "tractor", "321": "traffic light", "322": "train", "323": "tree", "324": "triangle", "325": "trombone", "326": "truck", "327": "trumpet", "328": "umbrella", "329": "underwear", "330": "van", "331": "vase", "332": "violin", "333": "washing machine", "334": "watermelon", "335": "waterslide", "336": "whale", "337": "wheel", "338": "windmill", "339": "wine bottle", "340": "wine glass", "341": "wristwatch", "342": "yoga", "343": "zebra", "344": "zigzag" }, "image_size": 224, "initializer_range": 0.02, "intermediate_size": 3072, "label2id": { "The Eiffel Tower": 0, "The Great Wall of China": 1, "The Mona Lisa": 2, "aircraft carrier": 3, "airplane": 4, "alarm clock": 5, "ambulance": 6, "angel": 7, "animal migration": 8, "ant": 9, "anvil": 10, "apple": 11, "arm": 12, "asparagus": 13, "axe": 14, "backpack": 15, "banana": 16, "bandage": 17, "barn": 18, "baseball": 19, "baseball bat": 20, "basket": 21, "basketball": 22, "bat": 23, "bathtub": 24, "beach": 25, "bear": 26, "beard": 27, "bed": 28, "bee": 29, "belt": 30, "bench": 31, "bicycle": 32, "binoculars": 33, "bird": 34, "birthday cake": 35, "blackberry": 36, "blueberry": 37, "book": 38, "boomerang": 39, "bottlecap": 40, "bowtie": 41, "bracelet": 42, "brain": 43, "bread": 44, "bridge": 45, "broccoli": 46, "broom": 47, "bucket": 48, "bulldozer": 49, "bus": 50, "bush": 51, "butterfly": 52, "cactus": 53, "cake": 54, "calculator": 55, "calendar": 56, "camel": 57, "camera": 58, "camouflage": 59, "campfire": 60, "candle": 61, "cannon": 62, "canoe": 63, "car": 64, "carrot": 65, "castle": 66, "cat": 67, "ceiling fan": 68, "cell phone": 69, "cello": 70, "chair": 71, "chandelier": 72, "church": 73, "circle": 74, "clarinet": 75, "clock": 76, "cloud": 77, "coffee cup": 78, "compass": 79, "computer": 80, "cookie": 81, "cooler": 82, "couch": 83, "cow": 84, "crab": 85, "crayon": 86, "crocodile": 87, "crown": 88, "cruise ship": 89, "cup": 90, "diamond": 91, "dishwasher": 92, "diving board": 93, "dog": 94, "dolphin": 95, "donut": 96, "door": 97, "dragon": 98, "dresser": 99, "drill": 100, "drums": 101, "duck": 102, "dumbbell": 103, "ear": 104, "elbow": 105, "elephant": 106, "envelope": 107, "eraser": 108, "eye": 109, "eyeglasses": 110, "face": 111, "fan": 112, "feather": 113, "fence": 114, "finger": 115, "fire hydrant": 116, "fireplace": 117, "firetruck": 118, "fish": 119, "flamingo": 120, "flashlight": 121, "flip flops": 122, "floor lamp": 123, "flower": 124, "flying saucer": 125, "foot": 126, "fork": 127, "frog": 128, "frying pan": 129, "garden": 130, "garden hose": 131, "giraffe": 132, "goatee": 133, "golf club": 134, "grapes": 135, "grass": 136, "guitar": 137, "hamburger": 138, "hammer": 139, "hand": 140, "harp": 141, "hat": 142, "headphones": 143, "hedgehog": 144, "helicopter": 145, "helmet": 146, "hexagon": 147, "hockey puck": 148, "hockey stick": 149, "horse": 150, "hospital": 151, "hot air balloon": 152, "hot dog": 153, "hot tub": 154, "hourglass": 155, "house": 156, "house plant": 157, "hurricane": 158, "ice cream": 159, "jacket": 160, "jail": 161, "kangaroo": 162, "key": 163, "keyboard": 164, "knee": 165, "knife": 166, "ladder": 167, "lantern": 168, "laptop": 169, "leaf": 170, "leg": 171, "light bulb": 172, "lighter": 173, "lighthouse": 174, "lightning": 175, "line": 176, "lion": 177, "lipstick": 178, "lobster": 179, "lollipop": 180, "mailbox": 181, "map": 182, "marker": 183, "matches": 184, "megaphone": 185, "mermaid": 186, "microphone": 187, "microwave": 188, "monkey": 189, "moon": 190, "mosquito": 191, "motorbike": 192, "mountain": 193, "mouse": 194, "moustache": 195, "mouth": 196, "mug": 197, "mushroom": 198, "nail": 199, "necklace": 200, "nose": 201, "ocean": 202, "octagon": 203, "octopus": 204, "onion": 205, "oven": 206, "owl": 207, "paint can": 208, "paintbrush": 209, "palm tree": 210, "panda": 211, "pants": 212, "paper clip": 213, "parachute": 214, "parrot": 215, "passport": 216, "peanut": 217, "pear": 218, "peas": 219, "pencil": 220, "penguin": 221, "piano": 222, "pickup truck": 223, "picture frame": 224, "pig": 225, "pillow": 226, "pineapple": 227, "pizza": 228, "pliers": 229, "police car": 230, "pond": 231, "pool": 232, "popsicle": 233, "postcard": 234, "potato": 235, "power outlet": 236, "purse": 237, "rabbit": 238, "raccoon": 239, "radio": 240, "rain": 241, "rainbow": 242, "rake": 243, "remote control": 244, "rhinoceros": 245, "rifle": 246, "river": 247, "roller coaster": 248, "rollerskates": 249, "sailboat": 250, "sandwich": 251, "saw": 252, "saxophone": 253, "school bus": 254, "scissors": 255, "scorpion": 256, "screwdriver": 257, "sea turtle": 258, "see saw": 259, "shark": 260, "sheep": 261, "shoe": 262, "shorts": 263, "shovel": 264, "sink": 265, "skateboard": 266, "skull": 267, "skyscraper": 268, "sleeping bag": 269, "smiley face": 270, "snail": 271, "snake": 272, "snorkel": 273, "snowflake": 274, "snowman": 275, "soccer ball": 276, "sock": 277, "speedboat": 278, "spider": 279, "spoon": 280, "spreadsheet": 281, "square": 282, "squiggle": 283, "squirrel": 284, "stairs": 285, "star": 286, "steak": 287, "stereo": 288, "stethoscope": 289, "stitches": 290, "stop sign": 291, "stove": 292, "strawberry": 293, "streetlight": 294, "string bean": 295, "submarine": 296, "suitcase": 297, "sun": 298, "swan": 299, "sweater": 300, "swing set": 301, "sword": 302, "syringe": 303, "t-shirt": 304, "table": 305, "teapot": 306, "teddy-bear": 307, "telephone": 308, "television": 309, "tennis racquet": 310, "tent": 311, "tiger": 312, "toaster": 313, "toe": 314, "toilet": 315, "tooth": 316, "toothbrush": 317, "toothpaste": 318, "tornado": 319, "tractor": 320, "traffic light": 321, "train": 322, "tree": 323, "triangle": 324, "trombone": 325, "truck": 326, "trumpet": 327, "umbrella": 328, "underwear": 329, "van": 330, "vase": 331, "violin": 332, "washing machine": 333, "watermelon": 334, "waterslide": 335, "whale": 336, "wheel": 337, "windmill": 338, "wine bottle": 339, "wine glass": 340, "wristwatch": 341, "yoga": 342, "zebra": 343, "zigzag": 344 }, "layer_norm_eps": 1e-12, "layer_scale_init_value": 0.1, "model_type": "beit", "num_attention_heads": 12, "num_channels": 3, "num_hidden_layers": 12, "out_indices": [ 3, 5, 7, 11 ], "patch_size": 16, "pool_scales": [ 1, 2, 3, 6 ], "problem_type": "single_label_classification", "semantic_loss_ignore_index": 255, "torch_dtype": "float32", "transformers_version": "4.25.1", "use_absolute_position_embeddings": false, "use_auxiliary_head": true, "use_mask_token": false, "use_mean_pooling": true, "use_relative_position_bias": true, "use_shared_relative_position_bias": false, "vocab_size": 8192 }