DeBERTaSSCCVspanTagger / config.json
RJ3vans's picture
add model
29d96ff
{
"_name_or_path": "/tmp/test-richard_bert_base_cased",
"architectures": [
"DebertaV2ForTokenClassification"
],
"attention_probs_dropout_prob": 0.1,
"finetuning_task": "ner",
"hidden_act": "gelu",
"hidden_dropout_prob": 0.1,
"hidden_size": 768,
"id2label": {
"0": "AFTER_ADJECTIVAL",
"1": "AFTER_ADVERBIAL",
"2": "AFTER_CLEFT_CLAUSE",
"3": "AFTER_COGNITIVE_COMMUNICATIVE_VP",
"4": "AFTER_COMPLEX_NP",
"5": "AFTER_COMPLEX_PHRASE",
"6": "AFTER_FREE_RELATIVE_CLAUSE",
"7": "AFTER_INTENSIFYING_CLAUSE",
"8": "AFTER_REPORTING_CLAUSE",
"9": "AFTER_RESTRICTIVE_CLAUSE_GENERIC_HEAD",
"10": "AFTER_WH_PHRASE",
"11": "BEFORE_ADJECTIVAL",
"12": "BEFORE_ADVERBIAL",
"13": "BEFORE_CLEFT_CLAUSE",
"14": "BEFORE_COGNITIVE_COMMUNICATIVE_VP",
"15": "BEFORE_COMPLEX_NP",
"16": "BEFORE_COMPLEX_PHRASE",
"17": "BEFORE_FREE_RELATIVE_CLAUSE",
"18": "BEFORE_INTENSIFYING_CLAUSE",
"19": "BEFORE_REPORTING_CLAUSE",
"20": "BEFORE_RESTRICTIVE_CLAUSE_GENERIC_HEAD",
"21": "BEFORE_WH_PHRASE",
"22": "ERROR",
"23": "IN_ADJECTIVAL",
"24": "IN_ADJECTIVAL_AFTERSIGN",
"25": "IN_ADJECTIVAL_BEFORESIGN",
"26": "IN_ADVERBIAL",
"27": "IN_ADVERBIAL_AFTERSIGN",
"28": "IN_ADVERBIAL_BEFORESIGN",
"29": "IN_CLEFT_CLAUSE",
"30": "IN_CLEFT_CLAUSE_AFTERSIGN",
"31": "IN_CLEFT_CLAUSE_BEFORESIGN",
"32": "IN_COGNITIVE_COMMUNICATIVE_VP",
"33": "IN_COGNITIVE_COMMUNICATIVE_VP_AFTERSIGN",
"34": "IN_COGNITIVE_COMMUNICATIVE_VP_BEFORESIGN",
"35": "IN_COMPLEX_NP",
"36": "IN_COMPLEX_NP_AFTERSIGN",
"37": "IN_COMPLEX_NP_BEFORESIGN",
"38": "IN_COMPLEX_PHRASE",
"39": "IN_COMPLEX_PHRASE_AFTERSIGN",
"40": "IN_COMPLEX_PHRASE_BEFORESIGN",
"41": "IN_FREE_RELATIVE_CLAUSE",
"42": "IN_FREE_RELATIVE_CLAUSE_AFTERSIGN",
"43": "IN_FREE_RELATIVE_CLAUSE_BEFORESIGN",
"44": "IN_INTENSIFYING_CLAUSE",
"45": "IN_INTENSIFYING_CLAUSE_AFTERSIGN",
"46": "IN_INTENSIFYING_CLAUSE_BEFORESIGN",
"47": "IN_REPORTING_CLAUSE_AFTERSIGN",
"48": "IN_REPORTING_CLAUSE_BEFORESIGN",
"49": "IN_RESTRICTIVE_CLAUSE_GENERIC_HEAD",
"50": "IN_RESTRICTIVE_CLAUSE_GENERIC_HEAD_AFTERSIGN",
"51": "IN_RESTRICTIVE_CLAUSE_GENERIC_HEAD_BEFORESIGN",
"52": "IN_WH_PHRASE",
"53": "IN_WH_PHRASE_AFTERSIGN",
"54": "IN_WH_PHRASE_BEFORESIGN",
"55": "UNKNOWN"
},
"initializer_range": 0.02,
"intermediate_size": 3072,
"label2id": {
"AFTER_ADJECTIVAL": 0,
"AFTER_ADVERBIAL": 1,
"AFTER_CLEFT_CLAUSE": 2,
"AFTER_COGNITIVE_COMMUNICATIVE_VP": 3,
"AFTER_COMPLEX_NP": 4,
"AFTER_COMPLEX_PHRASE": 5,
"AFTER_FREE_RELATIVE_CLAUSE": 6,
"AFTER_INTENSIFYING_CLAUSE": 7,
"AFTER_REPORTING_CLAUSE": 8,
"AFTER_RESTRICTIVE_CLAUSE_GENERIC_HEAD": 9,
"AFTER_WH_PHRASE": 10,
"BEFORE_ADJECTIVAL": 11,
"BEFORE_ADVERBIAL": 12,
"BEFORE_CLEFT_CLAUSE": 13,
"BEFORE_COGNITIVE_COMMUNICATIVE_VP": 14,
"BEFORE_COMPLEX_NP": 15,
"BEFORE_COMPLEX_PHRASE": 16,
"BEFORE_FREE_RELATIVE_CLAUSE": 17,
"BEFORE_INTENSIFYING_CLAUSE": 18,
"BEFORE_REPORTING_CLAUSE": 19,
"BEFORE_RESTRICTIVE_CLAUSE_GENERIC_HEAD": 20,
"BEFORE_WH_PHRASE": 21,
"ERROR": 22,
"IN_ADJECTIVAL": 23,
"IN_ADJECTIVAL_AFTERSIGN": 24,
"IN_ADJECTIVAL_BEFORESIGN": 25,
"IN_ADVERBIAL": 26,
"IN_ADVERBIAL_AFTERSIGN": 27,
"IN_ADVERBIAL_BEFORESIGN": 28,
"IN_CLEFT_CLAUSE": 29,
"IN_CLEFT_CLAUSE_AFTERSIGN": 30,
"IN_CLEFT_CLAUSE_BEFORESIGN": 31,
"IN_COGNITIVE_COMMUNICATIVE_VP": 32,
"IN_COGNITIVE_COMMUNICATIVE_VP_AFTERSIGN": 33,
"IN_COGNITIVE_COMMUNICATIVE_VP_BEFORESIGN": 34,
"IN_COMPLEX_NP": 35,
"IN_COMPLEX_NP_AFTERSIGN": 36,
"IN_COMPLEX_NP_BEFORESIGN": 37,
"IN_COMPLEX_PHRASE": 38,
"IN_COMPLEX_PHRASE_AFTERSIGN": 39,
"IN_COMPLEX_PHRASE_BEFORESIGN": 40,
"IN_FREE_RELATIVE_CLAUSE": 41,
"IN_FREE_RELATIVE_CLAUSE_AFTERSIGN": 42,
"IN_FREE_RELATIVE_CLAUSE_BEFORESIGN": 43,
"IN_INTENSIFYING_CLAUSE": 44,
"IN_INTENSIFYING_CLAUSE_AFTERSIGN": 45,
"IN_INTENSIFYING_CLAUSE_BEFORESIGN": 46,
"IN_REPORTING_CLAUSE_AFTERSIGN": 47,
"IN_REPORTING_CLAUSE_BEFORESIGN": 48,
"IN_RESTRICTIVE_CLAUSE_GENERIC_HEAD": 49,
"IN_RESTRICTIVE_CLAUSE_GENERIC_HEAD_AFTERSIGN": 50,
"IN_RESTRICTIVE_CLAUSE_GENERIC_HEAD_BEFORESIGN": 51,
"IN_WH_PHRASE": 52,
"IN_WH_PHRASE_AFTERSIGN": 53,
"IN_WH_PHRASE_BEFORESIGN": 54,
"UNKNOWN": 55
},
"layer_norm_eps": 1e-07,
"max_position_embeddings": 512,
"max_relative_positions": -1,
"model_type": "deberta-v2",
"norm_rel_ebd": "layer_norm",
"num_attention_heads": 12,
"num_hidden_layers": 12,
"pad_token_id": 0,
"pooler_dropout": 0,
"pooler_hidden_act": "gelu",
"pooler_hidden_size": 768,
"pos_att_type": [
"p2c",
"c2p"
],
"position_biased_input": false,
"position_buckets": 256,
"relative_attention": true,
"share_att_key": true,
"torch_dtype": "float32",
"transformers_version": "4.20.1",
"type_vocab_size": 0,
"vocab_size": 128100
}