{ "_name_or_path": "/home/egil/gits_wsl/SANT_FinalStage/models/01191518_tsa-bin_NorBERT_3_large_final/best_model", "architectures": [ "NorbertForTokenClassification" ], "attention_probs_dropout_prob": 0.1, "auto_map": { "AutoConfig": "configuration_norbert.NorbertConfig", "AutoModel": "ltg/norbert3-large--modeling_norbert.NorbertModel", "AutoModelForMaskedLM": "ltg/norbert3-large--modeling_norbert.NorbertForMaskedLM", "AutoModelForMultipleChoice": "ltg/norbert3-large--modeling_norbert.NorbertForMultipleChoice", "AutoModelForQuestionAnswering": "ltg/norbert3-large--modeling_norbert.NorbertForQuestionAnswering", "AutoModelForSequenceClassification": "ltg/norbert3-large--modeling_norbert.NorbertForSequenceClassification", "AutoModelForTokenClassification": "modeling_norbert.NorbertForTokenClassification" }, "finetuning_task": "01191518_tsa-bin_norbert_3_large", "hidden_dropout_prob": 0.1, "hidden_size": 1024, "id2label": { "0": "O", "1": "B-targ-Negative", "2": "I-targ-Negative", "3": "B-targ-Positive", "4": "I-targ-Positive" }, "intermediate_size": 2730, "label2id": { "B-targ-Negative": 1, "B-targ-Positive": 3, "I-targ-Negative": 2, "I-targ-Positive": 4, "O": 0 }, "layer_norm_eps": 1e-07, "max_position_embeddings": 512, "num_attention_heads": 16, "num_hidden_layers": 24, "output_all_encoded_layers": true, "position_bucket_size": 32, "torch_dtype": "float32", "transformers_version": "4.36.2", "vocab_size": 50000 }