beit-sketch-classifier / config.json
kmewhort's picture
Training in progress, epoch 0
d4cb7ed
{
"_name_or_path": "microsoft/beit-base-patch16-224-pt22k-ft22k",
"architectures": [
"BeitForImageClassification"
],
"attention_probs_dropout_prob": 0.0,
"auxiliary_channels": 256,
"auxiliary_concat_input": false,
"auxiliary_loss_weight": 0.4,
"auxiliary_num_convs": 1,
"drop_path_rate": 0.1,
"hidden_act": "gelu",
"hidden_dropout_prob": 0.0,
"hidden_size": 768,
"id2label": {
"0": "The Eiffel Tower",
"1": "The Great Wall of China",
"2": "The Mona Lisa",
"3": "aircraft carrier",
"4": "airplane",
"5": "alarm clock",
"6": "ambulance",
"7": "angel",
"8": "animal migration",
"9": "ant",
"10": "anvil",
"11": "apple",
"12": "arm",
"13": "asparagus",
"14": "axe",
"15": "backpack",
"16": "banana",
"17": "bandage",
"18": "barn",
"19": "baseball",
"20": "baseball bat",
"21": "basket",
"22": "basketball",
"23": "bat",
"24": "bathtub",
"25": "beach",
"26": "bear",
"27": "beard",
"28": "bed",
"29": "bee",
"30": "belt",
"31": "bench",
"32": "bicycle",
"33": "binoculars",
"34": "bird",
"35": "birthday cake",
"36": "blackberry",
"37": "blueberry",
"38": "book",
"39": "boomerang",
"40": "bottlecap",
"41": "bowtie",
"42": "bracelet",
"43": "brain",
"44": "bread",
"45": "bridge",
"46": "broccoli",
"47": "broom",
"48": "bucket",
"49": "bulldozer",
"50": "bus",
"51": "bush",
"52": "butterfly",
"53": "cactus",
"54": "cake",
"55": "calculator",
"56": "calendar",
"57": "camel",
"58": "camera",
"59": "camouflage",
"60": "campfire",
"61": "candle",
"62": "cannon",
"63": "canoe",
"64": "car",
"65": "carrot",
"66": "castle",
"67": "cat",
"68": "ceiling fan",
"69": "cell phone",
"70": "cello",
"71": "chair",
"72": "chandelier",
"73": "church",
"74": "circle",
"75": "clarinet",
"76": "clock",
"77": "cloud",
"78": "coffee cup",
"79": "compass",
"80": "computer",
"81": "cookie",
"82": "cooler",
"83": "couch",
"84": "cow",
"85": "crab",
"86": "crayon",
"87": "crocodile",
"88": "crown",
"89": "cruise ship",
"90": "cup",
"91": "diamond",
"92": "dishwasher",
"93": "diving board",
"94": "dog",
"95": "dolphin",
"96": "donut",
"97": "door",
"98": "dragon",
"99": "dresser",
"100": "drill",
"101": "drums",
"102": "duck",
"103": "dumbbell",
"104": "ear",
"105": "elbow",
"106": "elephant",
"107": "envelope",
"108": "eraser",
"109": "eye",
"110": "eyeglasses",
"111": "face",
"112": "fan",
"113": "feather",
"114": "fence",
"115": "finger",
"116": "fire hydrant",
"117": "fireplace",
"118": "firetruck",
"119": "fish",
"120": "flamingo",
"121": "flashlight",
"122": "flip flops",
"123": "floor lamp",
"124": "flower",
"125": "flying saucer",
"126": "foot",
"127": "fork",
"128": "frog",
"129": "frying pan",
"130": "garden",
"131": "garden hose",
"132": "giraffe",
"133": "goatee",
"134": "golf club",
"135": "grapes",
"136": "grass",
"137": "guitar",
"138": "hamburger",
"139": "hammer",
"140": "hand",
"141": "harp",
"142": "hat",
"143": "headphones",
"144": "hedgehog",
"145": "helicopter",
"146": "helmet",
"147": "hexagon",
"148": "hockey puck",
"149": "hockey stick",
"150": "horse",
"151": "hospital",
"152": "hot air balloon",
"153": "hot dog",
"154": "hot tub",
"155": "hourglass",
"156": "house",
"157": "house plant",
"158": "hurricane",
"159": "ice cream",
"160": "jacket",
"161": "jail",
"162": "kangaroo",
"163": "key",
"164": "keyboard",
"165": "knee",
"166": "knife",
"167": "ladder",
"168": "lantern",
"169": "laptop",
"170": "leaf",
"171": "leg",
"172": "light bulb",
"173": "lighter",
"174": "lighthouse",
"175": "lightning",
"176": "line",
"177": "lion",
"178": "lipstick",
"179": "lobster",
"180": "lollipop",
"181": "mailbox",
"182": "map",
"183": "marker",
"184": "matches",
"185": "megaphone",
"186": "mermaid",
"187": "microphone",
"188": "microwave",
"189": "monkey",
"190": "moon",
"191": "mosquito",
"192": "motorbike",
"193": "mountain",
"194": "mouse",
"195": "moustache",
"196": "mouth",
"197": "mug",
"198": "mushroom",
"199": "nail",
"200": "necklace",
"201": "nose",
"202": "ocean",
"203": "octagon",
"204": "octopus",
"205": "onion",
"206": "oven",
"207": "owl",
"208": "paint can",
"209": "paintbrush",
"210": "palm tree",
"211": "panda",
"212": "pants",
"213": "paper clip",
"214": "parachute",
"215": "parrot",
"216": "passport",
"217": "peanut",
"218": "pear",
"219": "peas",
"220": "pencil",
"221": "penguin",
"222": "piano",
"223": "pickup truck",
"224": "picture frame",
"225": "pig",
"226": "pillow",
"227": "pineapple",
"228": "pizza",
"229": "pliers",
"230": "police car",
"231": "pond",
"232": "pool",
"233": "popsicle",
"234": "postcard",
"235": "potato",
"236": "power outlet",
"237": "purse",
"238": "rabbit",
"239": "raccoon",
"240": "radio",
"241": "rain",
"242": "rainbow",
"243": "rake",
"244": "remote control",
"245": "rhinoceros",
"246": "rifle",
"247": "river",
"248": "roller coaster",
"249": "rollerskates",
"250": "sailboat",
"251": "sandwich",
"252": "saw",
"253": "saxophone",
"254": "school bus",
"255": "scissors",
"256": "scorpion",
"257": "screwdriver",
"258": "sea turtle",
"259": "see saw",
"260": "shark",
"261": "sheep",
"262": "shoe",
"263": "shorts",
"264": "shovel",
"265": "sink",
"266": "skateboard",
"267": "skull",
"268": "skyscraper",
"269": "sleeping bag",
"270": "smiley face",
"271": "snail",
"272": "snake",
"273": "snorkel",
"274": "snowflake",
"275": "snowman",
"276": "soccer ball",
"277": "sock",
"278": "speedboat",
"279": "spider",
"280": "spoon",
"281": "spreadsheet",
"282": "square",
"283": "squiggle",
"284": "squirrel",
"285": "stairs",
"286": "star",
"287": "steak",
"288": "stereo",
"289": "stethoscope",
"290": "stitches",
"291": "stop sign",
"292": "stove",
"293": "strawberry",
"294": "streetlight",
"295": "string bean",
"296": "submarine",
"297": "suitcase",
"298": "sun",
"299": "swan",
"300": "sweater",
"301": "swing set",
"302": "sword",
"303": "syringe",
"304": "t-shirt",
"305": "table",
"306": "teapot",
"307": "teddy-bear",
"308": "telephone",
"309": "television",
"310": "tennis racquet",
"311": "tent",
"312": "tiger",
"313": "toaster",
"314": "toe",
"315": "toilet",
"316": "tooth",
"317": "toothbrush",
"318": "toothpaste",
"319": "tornado",
"320": "tractor",
"321": "traffic light",
"322": "train",
"323": "tree",
"324": "triangle",
"325": "trombone",
"326": "truck",
"327": "trumpet",
"328": "umbrella",
"329": "underwear",
"330": "van",
"331": "vase",
"332": "violin",
"333": "washing machine",
"334": "watermelon",
"335": "waterslide",
"336": "whale",
"337": "wheel",
"338": "windmill",
"339": "wine bottle",
"340": "wine glass",
"341": "wristwatch",
"342": "yoga",
"343": "zebra",
"344": "zigzag"
},
"image_size": 224,
"initializer_range": 0.02,
"intermediate_size": 3072,
"label2id": {
"The Eiffel Tower": 0,
"The Great Wall of China": 1,
"The Mona Lisa": 2,
"aircraft carrier": 3,
"airplane": 4,
"alarm clock": 5,
"ambulance": 6,
"angel": 7,
"animal migration": 8,
"ant": 9,
"anvil": 10,
"apple": 11,
"arm": 12,
"asparagus": 13,
"axe": 14,
"backpack": 15,
"banana": 16,
"bandage": 17,
"barn": 18,
"baseball": 19,
"baseball bat": 20,
"basket": 21,
"basketball": 22,
"bat": 23,
"bathtub": 24,
"beach": 25,
"bear": 26,
"beard": 27,
"bed": 28,
"bee": 29,
"belt": 30,
"bench": 31,
"bicycle": 32,
"binoculars": 33,
"bird": 34,
"birthday cake": 35,
"blackberry": 36,
"blueberry": 37,
"book": 38,
"boomerang": 39,
"bottlecap": 40,
"bowtie": 41,
"bracelet": 42,
"brain": 43,
"bread": 44,
"bridge": 45,
"broccoli": 46,
"broom": 47,
"bucket": 48,
"bulldozer": 49,
"bus": 50,
"bush": 51,
"butterfly": 52,
"cactus": 53,
"cake": 54,
"calculator": 55,
"calendar": 56,
"camel": 57,
"camera": 58,
"camouflage": 59,
"campfire": 60,
"candle": 61,
"cannon": 62,
"canoe": 63,
"car": 64,
"carrot": 65,
"castle": 66,
"cat": 67,
"ceiling fan": 68,
"cell phone": 69,
"cello": 70,
"chair": 71,
"chandelier": 72,
"church": 73,
"circle": 74,
"clarinet": 75,
"clock": 76,
"cloud": 77,
"coffee cup": 78,
"compass": 79,
"computer": 80,
"cookie": 81,
"cooler": 82,
"couch": 83,
"cow": 84,
"crab": 85,
"crayon": 86,
"crocodile": 87,
"crown": 88,
"cruise ship": 89,
"cup": 90,
"diamond": 91,
"dishwasher": 92,
"diving board": 93,
"dog": 94,
"dolphin": 95,
"donut": 96,
"door": 97,
"dragon": 98,
"dresser": 99,
"drill": 100,
"drums": 101,
"duck": 102,
"dumbbell": 103,
"ear": 104,
"elbow": 105,
"elephant": 106,
"envelope": 107,
"eraser": 108,
"eye": 109,
"eyeglasses": 110,
"face": 111,
"fan": 112,
"feather": 113,
"fence": 114,
"finger": 115,
"fire hydrant": 116,
"fireplace": 117,
"firetruck": 118,
"fish": 119,
"flamingo": 120,
"flashlight": 121,
"flip flops": 122,
"floor lamp": 123,
"flower": 124,
"flying saucer": 125,
"foot": 126,
"fork": 127,
"frog": 128,
"frying pan": 129,
"garden": 130,
"garden hose": 131,
"giraffe": 132,
"goatee": 133,
"golf club": 134,
"grapes": 135,
"grass": 136,
"guitar": 137,
"hamburger": 138,
"hammer": 139,
"hand": 140,
"harp": 141,
"hat": 142,
"headphones": 143,
"hedgehog": 144,
"helicopter": 145,
"helmet": 146,
"hexagon": 147,
"hockey puck": 148,
"hockey stick": 149,
"horse": 150,
"hospital": 151,
"hot air balloon": 152,
"hot dog": 153,
"hot tub": 154,
"hourglass": 155,
"house": 156,
"house plant": 157,
"hurricane": 158,
"ice cream": 159,
"jacket": 160,
"jail": 161,
"kangaroo": 162,
"key": 163,
"keyboard": 164,
"knee": 165,
"knife": 166,
"ladder": 167,
"lantern": 168,
"laptop": 169,
"leaf": 170,
"leg": 171,
"light bulb": 172,
"lighter": 173,
"lighthouse": 174,
"lightning": 175,
"line": 176,
"lion": 177,
"lipstick": 178,
"lobster": 179,
"lollipop": 180,
"mailbox": 181,
"map": 182,
"marker": 183,
"matches": 184,
"megaphone": 185,
"mermaid": 186,
"microphone": 187,
"microwave": 188,
"monkey": 189,
"moon": 190,
"mosquito": 191,
"motorbike": 192,
"mountain": 193,
"mouse": 194,
"moustache": 195,
"mouth": 196,
"mug": 197,
"mushroom": 198,
"nail": 199,
"necklace": 200,
"nose": 201,
"ocean": 202,
"octagon": 203,
"octopus": 204,
"onion": 205,
"oven": 206,
"owl": 207,
"paint can": 208,
"paintbrush": 209,
"palm tree": 210,
"panda": 211,
"pants": 212,
"paper clip": 213,
"parachute": 214,
"parrot": 215,
"passport": 216,
"peanut": 217,
"pear": 218,
"peas": 219,
"pencil": 220,
"penguin": 221,
"piano": 222,
"pickup truck": 223,
"picture frame": 224,
"pig": 225,
"pillow": 226,
"pineapple": 227,
"pizza": 228,
"pliers": 229,
"police car": 230,
"pond": 231,
"pool": 232,
"popsicle": 233,
"postcard": 234,
"potato": 235,
"power outlet": 236,
"purse": 237,
"rabbit": 238,
"raccoon": 239,
"radio": 240,
"rain": 241,
"rainbow": 242,
"rake": 243,
"remote control": 244,
"rhinoceros": 245,
"rifle": 246,
"river": 247,
"roller coaster": 248,
"rollerskates": 249,
"sailboat": 250,
"sandwich": 251,
"saw": 252,
"saxophone": 253,
"school bus": 254,
"scissors": 255,
"scorpion": 256,
"screwdriver": 257,
"sea turtle": 258,
"see saw": 259,
"shark": 260,
"sheep": 261,
"shoe": 262,
"shorts": 263,
"shovel": 264,
"sink": 265,
"skateboard": 266,
"skull": 267,
"skyscraper": 268,
"sleeping bag": 269,
"smiley face": 270,
"snail": 271,
"snake": 272,
"snorkel": 273,
"snowflake": 274,
"snowman": 275,
"soccer ball": 276,
"sock": 277,
"speedboat": 278,
"spider": 279,
"spoon": 280,
"spreadsheet": 281,
"square": 282,
"squiggle": 283,
"squirrel": 284,
"stairs": 285,
"star": 286,
"steak": 287,
"stereo": 288,
"stethoscope": 289,
"stitches": 290,
"stop sign": 291,
"stove": 292,
"strawberry": 293,
"streetlight": 294,
"string bean": 295,
"submarine": 296,
"suitcase": 297,
"sun": 298,
"swan": 299,
"sweater": 300,
"swing set": 301,
"sword": 302,
"syringe": 303,
"t-shirt": 304,
"table": 305,
"teapot": 306,
"teddy-bear": 307,
"telephone": 308,
"television": 309,
"tennis racquet": 310,
"tent": 311,
"tiger": 312,
"toaster": 313,
"toe": 314,
"toilet": 315,
"tooth": 316,
"toothbrush": 317,
"toothpaste": 318,
"tornado": 319,
"tractor": 320,
"traffic light": 321,
"train": 322,
"tree": 323,
"triangle": 324,
"trombone": 325,
"truck": 326,
"trumpet": 327,
"umbrella": 328,
"underwear": 329,
"van": 330,
"vase": 331,
"violin": 332,
"washing machine": 333,
"watermelon": 334,
"waterslide": 335,
"whale": 336,
"wheel": 337,
"windmill": 338,
"wine bottle": 339,
"wine glass": 340,
"wristwatch": 341,
"yoga": 342,
"zebra": 343,
"zigzag": 344
},
"layer_norm_eps": 1e-12,
"layer_scale_init_value": 0.1,
"model_type": "beit",
"num_attention_heads": 12,
"num_channels": 3,
"num_hidden_layers": 12,
"out_indices": [
3,
5,
7,
11
],
"patch_size": 16,
"pool_scales": [
1,
2,
3,
6
],
"problem_type": "single_label_classification",
"semantic_loss_ignore_index": 255,
"torch_dtype": "float32",
"transformers_version": "4.25.1",
"use_absolute_position_embeddings": false,
"use_auxiliary_head": true,
"use_mask_token": false,
"use_mean_pooling": true,
"use_relative_position_bias": true,
"use_shared_relative_position_bias": false,
"vocab_size": 8192
}