{ "_name_or_path": "MikeGreen2710/model_3_to_train_on_duc_ner", "architectures": [ "RobertaForTokenClassification" ], "attention_probs_dropout_prob": 0.1, "bos_token_id": 0, "classifier_dropout": null, "eos_token_id": 2, "gradient_checkpointing": false, "hidden_act": "gelu", "hidden_dropout_prob": 0.1, "hidden_size": 768, "id2label": { "0": "OTHER", "1": "B_NOF", "2": "I_NOF", "3": "B_RPI", "4": "I_RPI", "5": "B_PRI", "6": "I_PRI", "7": "B_NOBR", "8": "I_NOBR", "9": "B_NOBA", "10": "B_STU", "11": "B_YCT", "12": "B_COR", "13": "I_COR", "14": "I_STU", "15": "I_NOBA", "16": "I_YCT", "17": "O" }, "initializer_range": 0.02, "intermediate_size": 3072, "label2id": { "B_COR": 12, "B_NOBA": 9, "B_NOBR": 7, "B_NOF": 1, "B_PRI": 5, "B_RPI": 3, "B_STU": 10, "B_YCT": 11, "I_COR": 13, "I_NOBA": 15, "I_NOBR": 8, "I_NOF": 2, "I_PRI": 6, "I_RPI": 4, "I_STU": 14, "I_YCT": 16, "O": 17, "OTHER": 0 }, "layer_norm_eps": 1e-05, "max_position_embeddings": 258, "model_type": "roberta", "num_attention_heads": 12, "num_hidden_layers": 12, "pad_token_id": 1, "position_embedding_type": "absolute", "tokenizer_class": "PhobertTokenizer", "torch_dtype": "float32", "transformers_version": "4.39.3", "type_vocab_size": 1, "use_cache": true, "vocab_size": 64001 }