roberta-large-second / config.json
eliza-dukim's picture
ckpt 3045 second model
e9f4609
{
"_name_or_path": "klue/roberta-large",
"architectures": [
"RobertaForSequenceClassification"
],
"attention_probs_dropout_prob": 0.1,
"bos_token_id": 0,
"classifier_dropout": null,
"eos_token_id": 2,
"gradient_checkpointing": false,
"hidden_act": "gelu",
"hidden_dropout_prob": 0.1,
"hidden_size": 1024,
"id2label": {
"0": "no_relation",
"1": "org:top_members/employees",
"2": "org:members",
"3": "org:product",
"4": "per:title",
"5": "org:alternate_names",
"6": "per:employee_of",
"7": "org:place_of_headquarters",
"8": "per:product",
"9": "org:number_of_employees/members",
"10": "per:children",
"11": "per:place_of_residence",
"12": "per:alternate_names",
"13": "per:other_family",
"14": "per:colleagues",
"15": "per:origin",
"16": "per:siblings",
"17": "per:spouse",
"18": "org:founded",
"19": "org:political/religious_affiliation",
"20": "org:member_of",
"21": "per:parents",
"22": "org:dissolved",
"23": "per:schools_attended",
"24": "per:date_of_death",
"25": "per:date_of_birth",
"26": "per:place_of_birth",
"27": "per:place_of_death",
"28": "org:founded_by",
"29": "per:religion"
},
"initializer_range": 0.02,
"intermediate_size": 4096,
"label2id": {
"no_relation": 0,
"org:alternate_names": 5,
"org:dissolved": 22,
"org:founded": 18,
"org:founded_by": 28,
"org:member_of": 20,
"org:members": 2,
"org:number_of_employees/members": 9,
"org:place_of_headquarters": 7,
"org:political/religious_affiliation": 19,
"org:product": 3,
"org:top_members/employees": 1,
"per:alternate_names": 12,
"per:children": 10,
"per:colleagues": 14,
"per:date_of_birth": 25,
"per:date_of_death": 24,
"per:employee_of": 6,
"per:origin": 15,
"per:other_family": 13,
"per:parents": 21,
"per:place_of_birth": 26,
"per:place_of_death": 27,
"per:place_of_residence": 11,
"per:product": 8,
"per:religion": 29,
"per:schools_attended": 23,
"per:siblings": 16,
"per:spouse": 17,
"per:title": 4
},
"layer_norm_eps": 1e-05,
"max_position_embeddings": 514,
"model_type": "roberta",
"num_attention_heads": 16,
"num_hidden_layers": 24,
"pad_token_id": 1,
"position_embedding_type": "absolute",
"problem_type": "single_label_classification",
"tokenizer_class": "BertTokenizer",
"torch_dtype": "float32",
"transformers_version": "4.11.0.dev0",
"type_vocab_size": 1,
"use_cache": true,
"vocab_size": 32004
}