{
  "activation_function": "gelu_new",
  "architectures": [
    "GPT2ForTokenClassification"
  ],
  "attn_pdrop": 0.1,
  "bos_token_id": 2,
  "custom_pipelines": {
    "upos": {
      "impl": "ud.BellmanFordTokenClassificationPipeline",
      "pt": "AutoModelForTokenClassification"
    },
    "universal-dependencies": {
      "impl": "ud.UniversalDependenciesCausalPipeline",
      "pt": "AutoModelForTokenClassification"
    }
  },
  "embd_pdrop": 0.1,
  "eos_token_id": 2,
  "id2label": {
    "0": "ADJ",
    "1": "ADJ|l-acl",
    "2": "ADJ|l-advcl",
    "3": "ADJ|l-amod",
    "4": "ADJ|l-ccomp",
    "5": "ADJ|l-csubj",
    "6": "ADJ|l-csubj:outer",
    "7": "ADJ|l-nmod",
    "8": "ADJ|l-nsubj",
    "9": "ADJ|l-obj",
    "10": "ADJ|l-obl",
    "11": "ADJ|r-acl",
    "12": "ADJ|r-amod",
    "13": "ADJ|r-dep",
    "14": "ADJ|root",
    "15": "ADP",
    "16": "ADP|l-case",
    "17": "ADP|r-case",
    "18": "ADP|r-fixed",
    "19": "ADV",
    "20": "ADV|l-advcl",
    "21": "ADV|l-advmod",
    "22": "ADV|l-obj",
    "23": "ADV|r-dep",
    "24": "ADV|root",
    "25": "AUX",
    "26": "AUX|Polarity=Neg",
    "27": "AUX|Polarity=Neg|r-aux",
    "28": "AUX|Polarity=Neg|r-fixed",
    "29": "AUX|r-aux",
    "30": "AUX|r-cop",
    "31": "AUX|r-fixed",
    "32": "AUX|root",
    "33": "B-ADJ",
    "34": "B-ADP",
    "35": "B-ADV",
    "36": "B-AUX",
    "37": "B-AUX|Polarity=Neg",
    "38": "B-CCONJ",
    "39": "B-DET",
    "40": "B-INTJ",
    "41": "B-NOUN",
    "42": "B-NOUN|Polarity=Neg",
    "43": "B-NUM",
    "44": "B-PART",
    "45": "B-PRON",
    "46": "B-PROPN",
    "47": "B-PUNCT",
    "48": "B-SCONJ",
    "49": "B-SYM",
    "50": "B-VERB",
    "51": "B-X",
    "52": "CCONJ",
    "53": "CCONJ|l-cc",
    "54": "CCONJ|r-cc",
    "55": "DET",
    "56": "DET|l-det",
    "57": "I-ADJ",
    "58": "I-ADP",
    "59": "I-ADV",
    "60": "I-AUX",
    "61": "I-AUX|Polarity=Neg",
    "62": "I-CCONJ",
    "63": "I-DET",
    "64": "I-INTJ",
    "65": "I-NOUN",
    "66": "I-NOUN|Polarity=Neg",
    "67": "I-NUM",
    "68": "I-PART",
    "69": "I-PRON",
    "70": "I-PROPN",
    "71": "I-PUNCT",
    "72": "I-SCONJ",
    "73": "I-SYM",
    "74": "I-VERB",
    "75": "I-X",
    "76": "INTJ",
    "77": "INTJ|l-discourse",
    "78": "INTJ|r-discourse",
    "79": "INTJ|root",
    "80": "NOUN",
    "81": "NOUN|Polarity=Neg",
    "82": "NOUN|Polarity=Neg|l-obl",
    "83": "NOUN|Polarity=Neg|root",
    "84": "NOUN|l-acl",
    "85": "NOUN|l-advcl",
    "86": "NOUN|l-ccomp",
    "87": "NOUN|l-compound",
    "88": "NOUN|l-csubj",
    "89": "NOUN|l-csubj:outer",
    "90": "NOUN|l-nmod",
    "91": "NOUN|l-nsubj",
    "92": "NOUN|l-nsubj:outer",
    "93": "NOUN|l-obj",
    "94": "NOUN|l-obl",
    "95": "NOUN|r-compound",
    "96": "NOUN|r-nmod",
    "97": "NOUN|r-nsubj",
    "98": "NOUN|root",
    "99": "NUM",
    "100": "NUM|l-advcl",
    "101": "NUM|l-compound",
    "102": "NUM|l-nmod",
    "103": "NUM|l-nsubj",
    "104": "NUM|l-nsubj:outer",
    "105": "NUM|l-nummod",
    "106": "NUM|l-obj",
    "107": "NUM|l-obl",
    "108": "NUM|r-compound",
    "109": "NUM|root",
    "110": "PART",
    "111": "PART|l-mark",
    "112": "PART|r-mark",
    "113": "PRON",
    "114": "PRON|l-acl",
    "115": "PRON|l-advcl",
    "116": "PRON|l-nmod",
    "117": "PRON|l-nsubj",
    "118": "PRON|l-nsubj:outer",
    "119": "PRON|l-obj",
    "120": "PRON|l-obl",
    "121": "PRON|root",
    "122": "PROPN",
    "123": "PROPN|l-acl",
    "124": "PROPN|l-advcl",
    "125": "PROPN|l-compound",
    "126": "PROPN|l-nmod",
    "127": "PROPN|l-nsubj",
    "128": "PROPN|l-nsubj:outer",
    "129": "PROPN|l-obj",
    "130": "PROPN|l-obl",
    "131": "PROPN|r-compound",
    "132": "PROPN|r-nmod",
    "133": "PROPN|root",
    "134": "PUNCT",
    "135": "PUNCT|l-punct",
    "136": "PUNCT|r-punct",
    "137": "SCONJ",
    "138": "SCONJ|l-dep",
    "139": "SCONJ|r-fixed",
    "140": "SCONJ|r-mark",
    "141": "SYM",
    "142": "SYM|l-compound",
    "143": "SYM|l-dep",
    "144": "SYM|l-nmod",
    "145": "SYM|l-obl",
    "146": "SYM|r-compound",
    "147": "SYM|r-dep",
    "148": "VERB",
    "149": "VERB|l-acl",
    "150": "VERB|l-advcl",
    "151": "VERB|l-ccomp",
    "152": "VERB|l-compound",
    "153": "VERB|l-csubj",
    "154": "VERB|l-csubj:outer",
    "155": "VERB|l-nmod",
    "156": "VERB|l-obj",
    "157": "VERB|l-obl",
    "158": "VERB|r-acl",
    "159": "VERB|r-advcl",
    "160": "VERB|r-compound",
    "161": "VERB|root",
    "162": "X",
    "163": "X|l-nmod",
    "164": "X|r-dep"
  },
  "initializer_range": 0.02,
  "label2id": {
    "ADJ": 0,
    "ADJ|l-acl": 1,
    "ADJ|l-advcl": 2,
    "ADJ|l-amod": 3,
    "ADJ|l-ccomp": 4,
    "ADJ|l-csubj": 5,
    "ADJ|l-csubj:outer": 6,
    "ADJ|l-nmod": 7,
    "ADJ|l-nsubj": 8,
    "ADJ|l-obj": 9,
    "ADJ|l-obl": 10,
    "ADJ|r-acl": 11,
    "ADJ|r-amod": 12,
    "ADJ|r-dep": 13,
    "ADJ|root": 14,
    "ADP": 15,
    "ADP|l-case": 16,
    "ADP|r-case": 17,
    "ADP|r-fixed": 18,
    "ADV": 19,
    "ADV|l-advcl": 20,
    "ADV|l-advmod": 21,
    "ADV|l-obj": 22,
    "ADV|r-dep": 23,
    "ADV|root": 24,
    "AUX": 25,
    "AUX|Polarity=Neg": 26,
    "AUX|Polarity=Neg|r-aux": 27,
    "AUX|Polarity=Neg|r-fixed": 28,
    "AUX|r-aux": 29,
    "AUX|r-cop": 30,
    "AUX|r-fixed": 31,
    "AUX|root": 32,
    "B-ADJ": 33,
    "B-ADP": 34,
    "B-ADV": 35,
    "B-AUX": 36,
    "B-AUX|Polarity=Neg": 37,
    "B-CCONJ": 38,
    "B-DET": 39,
    "B-INTJ": 40,
    "B-NOUN": 41,
    "B-NOUN|Polarity=Neg": 42,
    "B-NUM": 43,
    "B-PART": 44,
    "B-PRON": 45,
    "B-PROPN": 46,
    "B-PUNCT": 47,
    "B-SCONJ": 48,
    "B-SYM": 49,
    "B-VERB": 50,
    "B-X": 51,
    "CCONJ": 52,
    "CCONJ|l-cc": 53,
    "CCONJ|r-cc": 54,
    "DET": 55,
    "DET|l-det": 56,
    "I-ADJ": 57,
    "I-ADP": 58,
    "I-ADV": 59,
    "I-AUX": 60,
    "I-AUX|Polarity=Neg": 61,
    "I-CCONJ": 62,
    "I-DET": 63,
    "I-INTJ": 64,
    "I-NOUN": 65,
    "I-NOUN|Polarity=Neg": 66,
    "I-NUM": 67,
    "I-PART": 68,
    "I-PRON": 69,
    "I-PROPN": 70,
    "I-PUNCT": 71,
    "I-SCONJ": 72,
    "I-SYM": 73,
    "I-VERB": 74,
    "I-X": 75,
    "INTJ": 76,
    "INTJ|l-discourse": 77,
    "INTJ|r-discourse": 78,
    "INTJ|root": 79,
    "NOUN": 80,
    "NOUN|Polarity=Neg": 81,
    "NOUN|Polarity=Neg|l-obl": 82,
    "NOUN|Polarity=Neg|root": 83,
    "NOUN|l-acl": 84,
    "NOUN|l-advcl": 85,
    "NOUN|l-ccomp": 86,
    "NOUN|l-compound": 87,
    "NOUN|l-csubj": 88,
    "NOUN|l-csubj:outer": 89,
    "NOUN|l-nmod": 90,
    "NOUN|l-nsubj": 91,
    "NOUN|l-nsubj:outer": 92,
    "NOUN|l-obj": 93,
    "NOUN|l-obl": 94,
    "NOUN|r-compound": 95,
    "NOUN|r-nmod": 96,
    "NOUN|r-nsubj": 97,
    "NOUN|root": 98,
    "NUM": 99,
    "NUM|l-advcl": 100,
    "NUM|l-compound": 101,
    "NUM|l-nmod": 102,
    "NUM|l-nsubj": 103,
    "NUM|l-nsubj:outer": 104,
    "NUM|l-nummod": 105,
    "NUM|l-obj": 106,
    "NUM|l-obl": 107,
    "NUM|r-compound": 108,
    "NUM|root": 109,
    "PART": 110,
    "PART|l-mark": 111,
    "PART|r-mark": 112,
    "PRON": 113,
    "PRON|l-acl": 114,
    "PRON|l-advcl": 115,
    "PRON|l-nmod": 116,
    "PRON|l-nsubj": 117,
    "PRON|l-nsubj:outer": 118,
    "PRON|l-obj": 119,
    "PRON|l-obl": 120,
    "PRON|root": 121,
    "PROPN": 122,
    "PROPN|l-acl": 123,
    "PROPN|l-advcl": 124,
    "PROPN|l-compound": 125,
    "PROPN|l-nmod": 126,
    "PROPN|l-nsubj": 127,
    "PROPN|l-nsubj:outer": 128,
    "PROPN|l-obj": 129,
    "PROPN|l-obl": 130,
    "PROPN|r-compound": 131,
    "PROPN|r-nmod": 132,
    "PROPN|root": 133,
    "PUNCT": 134,
    "PUNCT|l-punct": 135,
    "PUNCT|r-punct": 136,
    "SCONJ": 137,
    "SCONJ|l-dep": 138,
    "SCONJ|r-fixed": 139,
    "SCONJ|r-mark": 140,
    "SYM": 141,
    "SYM|l-compound": 142,
    "SYM|l-dep": 143,
    "SYM|l-nmod": 144,
    "SYM|l-obl": 145,
    "SYM|r-compound": 146,
    "SYM|r-dep": 147,
    "VERB": 148,
    "VERB|l-acl": 149,
    "VERB|l-advcl": 150,
    "VERB|l-ccomp": 151,
    "VERB|l-compound": 152,
    "VERB|l-csubj": 153,
    "VERB|l-csubj:outer": 154,
    "VERB|l-nmod": 155,
    "VERB|l-obj": 156,
    "VERB|l-obl": 157,
    "VERB|r-acl": 158,
    "VERB|r-advcl": 159,
    "VERB|r-compound": 160,
    "VERB|root": 161,
    "X": 162,
    "X|l-nmod": 163,
    "X|r-dep": 164
  },
  "layer_norm_epsilon": 1e-05,
  "model_type": "gpt2",
  "n_embd": 768,
  "n_head": 12,
  "n_inner": null,
  "n_layer": 12,
  "n_positions": 1024,
  "reorder_and_upcast_attn": false,
  "resid_pdrop": 0.1,
  "scale_attn_by_inverse_layer_idx": false,
  "scale_attn_weights": true,
  "summary_activation": null,
  "summary_first_dropout": 0.1,
  "summary_proj_to_labels": true,
  "summary_type": "cls_index",
  "summary_use_proj": true,
  "tokenizer_class": "JumanReformerTokenizerFast",
  "torch_dtype": "float32",
  "transformers_version": "4.44.0",
  "use_cache": true,
  "vocab_size": 32000
}
|