{
  "_name_or_path": "deepset/gelectra-large",
  "architectures": [
    "ElectraForTokenClassification"
  ],
  "attention_probs_dropout_prob": 0.1,
  "classifier_dropout": null,
  "embedding_size": 1024,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 1024,
  "id2label": {
    "0": "O",
    "1": "B-LOC",
    "10": "I-ORGderiv",
    "11": "B-ORGpart",
    "12": "I-ORGpart",
    "13": "B-OTH",
    "14": "I-OTH",
    "15": "B-OTHderiv",
    "16": "I-OTHderiv",
    "17": "B-OTHpart",
    "18": "I-OTHpart",
    "19": "B-PER",
    "2": "I-LOC",
    "20": "I-PER",
    "21": "B-PERderiv",
    "22": "I-PERderiv",
    "23": "B-PERpart",
    "24": "I-PERpart",
    "3": "B-LOCderiv",
    "4": "I-LOCderiv",
    "5": "B-LOCpart",
    "6": "I-LOCpart",
    "7": "B-ORG",
    "8": "I-ORG",
    "9": "B-ORGderiv"
  },
  "initializer_range": 0.02,
  "intermediate_size": 4096,
  "label2id": {
    "B-LOC": 1,
    "B-LOCderiv": 3,
    "B-LOCpart": 5,
    "B-ORG": 7,
    "B-ORGderiv": 9,
    "B-ORGpart": 11,
    "B-OTH": 13,
    "B-OTHderiv": 15,
    "B-OTHpart": 17,
    "B-PER": 19,
    "B-PERderiv": 21,
    "B-PERpart": 23,
    "I-LOC": 2,
    "I-LOCderiv": 4,
    "I-LOCpart": 6,
    "I-ORG": 8,
    "I-ORGderiv": 10,
    "I-ORGpart": 12,
    "I-OTH": 14,
    "I-OTHderiv": 16,
    "I-OTHpart": 18,
    "I-PER": 20,
    "I-PERderiv": 22,
    "I-PERpart": 24,
    "O": 0
  },
  "layer_norm_eps": 1e-12,
  "max_position_embeddings": 512,
  "model_type": "electra",
  "num_attention_heads": 16,
  "num_hidden_layers": 24,
  "pad_token_id": 0,
  "position_embedding_type": "absolute",
  "summary_activation": "gelu",
  "summary_last_dropout": 0.1,
  "summary_type": "first",
  "summary_use_proj": true,
  "transformers_version": "4.18.0",
  "type_vocab_size": 2,
  "use_cache": true,
  "vocab_size": 31102
}