{ "_name_or_path": "dandelin/vilt-b32-mlm", "architectures": [ "ViltForQuestionAnswering" ], "attention_probs_dropout_prob": 0.0, "hidden_act": "gelu", "hidden_dropout_prob": 0.0, "hidden_size": 768, "id2label": { "0": "hotel _gulmohar_grand", "1": "yes", "2": "paradise_grand", "3": "20-250_rupees", "4": "agnigarh_hill", "5": "1229", "6": "jorhat", "7": "dhekiakhowa_bormamghar", "8": "1897", "9": "1653", "10": "hajo_powa_mecca", "11": "6:00-21:00", "12": "shanti_ashram", "13": "30_rupees", "14": "1319", "15": "1725", "16": "1528", "17": "sonitpur", "18": "mayflower_hotel", "19": "1765", "20": "6:00-17:30", "21": "anytime", "22": "6:00-22:00", "23": "50", "24": "06:00-18:00", "25": "tirupati_balaji_temple ", "26": "free", "27": "hotel_kalita_palace", "28": "7:00-19:00", "29": "auniati_satra", "30": "garamur_satra", "31": "bordowa_than", "32": "mist_blew_hotel", "33": "hotel_krc", "34": "1998", "35": "1794", "36": "sivasagar", "37": "negheriting_shiva_dol", "38": "guwahati", "39": "samaguri_sattra", "40": "siva_dol", "41": "1468", "42": "day_time", "43": "majuli" }, "image_size": 384, "initializer_range": 0.02, "intermediate_size": 3072, "label2id": { "06:00-18:00": 24, "1229": 5, "1319": 14, "1468": 41, "1528": 16, "1653": 9, "1725": 15, "1765": 19, "1794": 35, "1897": 8, "1998": 34, "20-250_rupees": 3, "30_rupees": 13, "50": 23, "6:00-17:30": 20, "6:00-21:00": 11, "6:00-22:00": 22, "7:00-19:00": 28, "agnigarh_hill": 4, "anytime": 21, "auniati_satra": 29, "bordowa_than": 31, "day_time": 42, "dhekiakhowa_bormamghar": 7, "free": 26, "garamur_satra": 30, "guwahati": 38, "hajo_powa_mecca": 10, "hotel _gulmohar_grand": 0, "hotel_kalita_palace": 27, "hotel_krc": 33, "jorhat": 6, "majuli": 43, "mayflower_hotel": 18, "mist_blew_hotel": 32, "negheriting_shiva_dol": 37, "paradise_grand": 2, "samaguri_sattra": 39, "shanti_ashram": 12, "siva_dol": 40, "sivasagar": 36, "sonitpur": 17, "tirupati_balaji_temple ": 25, "yes": 1 }, "layer_norm_eps": 1e-12, "max_image_length": -1, "max_position_embeddings": 40, "modality_type_vocab_size": 2, "model_type": "vilt", "num_attention_heads": 12, "num_channels": 3, "num_hidden_layers": 12, "num_images": -1, "patch_size": 32, "qkv_bias": true, "tie_word_embeddings": false, "torch_dtype": "float32", "transformers_version": "4.35.0", "type_vocab_size": 2, "vocab_size": 30522 }