KoichiYasuoka's picture
model improved
5821aad
raw
history blame
2.85 kB
{
"architectures": [
"DebertaV2ForTokenClassification"
],
"attention_probs_dropout_prob": 0.1,
"bos_token_id": 0,
"eos_token_id": 2,
"hidden_act": "gelu",
"hidden_dropout_prob": 0.1,
"hidden_size": 1024,
"id2label": {
"0": "B-acl",
"1": "B-advcl",
"2": "B-advmod",
"3": "B-amod",
"4": "B-aux",
"5": "B-case",
"6": "B-cc",
"7": "B-ccomp",
"8": "B-compound",
"9": "B-cop",
"10": "B-csubj",
"11": "B-csubj:outer",
"12": "B-dep",
"13": "B-det",
"14": "B-discourse",
"15": "B-fixed",
"16": "B-mark",
"17": "B-nmod",
"18": "B-nsubj",
"19": "B-nsubj:outer",
"20": "B-nummod",
"21": "B-obj",
"22": "B-obl",
"23": "B-punct",
"24": "B-root",
"25": "I-acl",
"26": "I-advcl",
"27": "I-advmod",
"28": "I-amod",
"29": "I-aux",
"30": "I-case",
"31": "I-cc",
"32": "I-ccomp",
"33": "I-compound",
"34": "I-cop",
"35": "I-csubj",
"36": "I-csubj:outer",
"37": "I-dep",
"38": "I-det",
"39": "I-discourse",
"40": "I-fixed",
"41": "I-mark",
"42": "I-nmod",
"43": "I-nsubj",
"44": "I-nsubj:outer",
"45": "I-nummod",
"46": "I-obj",
"47": "I-obl",
"48": "I-punct",
"49": "I-root"
},
"initializer_range": 0.02,
"intermediate_size": 4096,
"label2id": {
"B-acl": 0,
"B-advcl": 1,
"B-advmod": 2,
"B-amod": 3,
"B-aux": 4,
"B-case": 5,
"B-cc": 6,
"B-ccomp": 7,
"B-compound": 8,
"B-cop": 9,
"B-csubj": 10,
"B-csubj:outer": 11,
"B-dep": 12,
"B-det": 13,
"B-discourse": 14,
"B-fixed": 15,
"B-mark": 16,
"B-nmod": 17,
"B-nsubj": 18,
"B-nsubj:outer": 19,
"B-nummod": 20,
"B-obj": 21,
"B-obl": 22,
"B-punct": 23,
"B-root": 24,
"I-acl": 25,
"I-advcl": 26,
"I-advmod": 27,
"I-amod": 28,
"I-aux": 29,
"I-case": 30,
"I-cc": 31,
"I-ccomp": 32,
"I-compound": 33,
"I-cop": 34,
"I-csubj": 35,
"I-csubj:outer": 36,
"I-dep": 37,
"I-det": 38,
"I-discourse": 39,
"I-fixed": 40,
"I-mark": 41,
"I-nmod": 42,
"I-nsubj": 43,
"I-nsubj:outer": 44,
"I-nummod": 45,
"I-obj": 46,
"I-obl": 47,
"I-punct": 48,
"I-root": 49
},
"layer_norm_eps": 1e-07,
"max_position_embeddings": 512,
"max_relative_positions": -1,
"model_type": "deberta-v2",
"num_attention_heads": 16,
"num_hidden_layers": 24,
"pad_token_id": 1,
"pooler_dropout": 0,
"pooler_hidden_act": "gelu",
"pooler_hidden_size": 1024,
"pos_att_type": [
"p2c",
"c2p"
],
"position_biased_input": false,
"relative_attention": true,
"tokenizer_class": "DebertaV2TokenizerFast",
"torch_dtype": "float32",
"transformers_version": "4.22.1",
"type_vocab_size": 0,
"vocab_size": 32000
}