{ "_name_or_path": "dandelin/vilt-b32-mlm", "architectures": [ "ViltForQuestionAnswering" ], "attention_probs_dropout_prob": 0.0, "hidden_act": "gelu", "hidden_dropout_prob": 0.0, "hidden_size": 768, "id2label": { "0": "mouse", "1": "british", "2": "freezer", "3": "yes", "4": "nowhere", "5": "england", "6": "car", "7": "uk", "8": "cows", "9": "dog", "10": "room", "11": "us", "12": "on sidewalk", "13": "indoors", "14": "nothing", "15": "airport", "16": "usa", "17": "park", "18": "hallway", "19": "australia", "20": "windows", "21": "refrigerator", "22": "buildings", "23": "sun", "24": "living room", "25": "bus", "26": "in car", "27": "home", "28": "woods", "29": "inside", "30": "hotel", "31": "united states", "32": "fridge", "33": "smile", "34": "ground", "35": "america" }, "image_size": 384, "initializer_range": 0.02, "intermediate_size": 3072, "label2id": { "airport": 15, "america": 35, "australia": 19, "british": 1, "buildings": 22, "bus": 25, "car": 6, "cows": 8, "dog": 9, "england": 5, "freezer": 2, "fridge": 32, "ground": 34, "hallway": 18, "home": 27, "hotel": 30, "in car": 26, "indoors": 13, "inside": 29, "living room": 24, "mouse": 0, "nothing": 14, "nowhere": 4, "on sidewalk": 12, "park": 17, "refrigerator": 21, "room": 10, "smile": 33, "sun": 23, "uk": 7, "united states": 31, "us": 11, "usa": 16, "windows": 20, "woods": 28, "yes": 3 }, "layer_norm_eps": 1e-12, "max_image_length": -1, "max_position_embeddings": 40, "modality_type_vocab_size": 2, "model_type": "vilt", "num_attention_heads": 12, "num_channels": 3, "num_hidden_layers": 12, "num_images": -1, "patch_size": 32, "qkv_bias": true, "tie_word_embeddings": false, "torch_dtype": "float32", "transformers_version": "4.40.2", "type_vocab_size": 2, "vocab_size": 30522 }