mjr27's picture
Update spaCy pipeline
3cd85be
{
"lang":"en",
"name":"egw_entity_extractor",
"version":"1.0.0",
"description":"",
"author":"",
"email":"",
"url":"",
"license":"",
"spacy_version":">=3.7.2,<3.8.0",
"spacy_git_version":"a89eae928",
"vectors":{
"width":300,
"vectors":514157,
"keys":514157,
"name":"en_vectors"
},
"labels":{
"transformer":[
],
"tagger":[
"$",
"''",
",",
"-LRB-",
"-RRB-",
".",
":",
"ADD",
"AFX",
"CC",
"CD",
"DT",
"EX",
"FW",
"HYPH",
"IN",
"JJ",
"JJR",
"JJS",
"LS",
"MD",
"NFP",
"NN",
"NNP",
"NNPS",
"NNS",
"PDT",
"POS",
"PRP",
"PRP$",
"RB",
"RBR",
"RBS",
"RP",
"SYM",
"TO",
"UH",
"VB",
"VBD",
"VBG",
"VBN",
"VBP",
"VBZ",
"WDT",
"WP",
"WP$",
"WRB",
"XX",
"_SP",
"``"
],
"parser":[
"ROOT",
"acl",
"acomp",
"advcl",
"advmod",
"agent",
"amod",
"appos",
"attr",
"aux",
"auxpass",
"case",
"cc",
"ccomp",
"compound",
"conj",
"csubj",
"csubjpass",
"dative",
"dep",
"det",
"dobj",
"expl",
"intj",
"mark",
"meta",
"neg",
"nmod",
"npadvmod",
"nsubj",
"nsubjpass",
"nummod",
"oprd",
"parataxis",
"pcomp",
"pobj",
"poss",
"preconj",
"predet",
"prep",
"prt",
"punct",
"quantmod",
"relcl",
"xcomp"
],
"ner":[
"DATE",
"GPE",
"LOC",
"PERSON",
"REFERENCE"
]
},
"pipeline":[
"transformer",
"tagger",
"parser",
"ner"
],
"components":[
"transformer",
"tagger",
"parser",
"ner"
],
"disabled":[
],
"performance":{
"tag_acc":0.9731235568,
"dep_uas":0.9383889999,
"dep_las":0.9226387112,
"dep_las_per_type":{
"advmod":{
"p":0.9231409577,
"r":0.9217744782,
"f":0.9224572119
},
"nsubj":{
"p":0.9534007948,
"r":0.9545972392,
"f":0.9539986418
},
"ccomp":{
"p":0.7814018505,
"r":0.8102567642,
"f":0.7955677544
},
"det":{
"p":0.9909284441,
"r":0.9906123398,
"f":0.9907703667
},
"dobj":{
"p":0.9367276041,
"r":0.9393668259,
"f":0.9380453586
},
"prep":{
"p":0.9386874981,
"r":0.9381259874,
"f":0.9384066587
},
"pobj":{
"p":0.9836417249,
"r":0.9809672363,
"f":0.9823026602
},
"amod":{
"p":0.9575052607,
"r":0.9573261957,
"f":0.9574157198
},
"compound":{
"p":0.8702260109,
"r":0.853520352,
"f":0.8617922302
},
"root":{
"p":0.9020492679,
"r":0.8982626143,
"f":0.9001519588
},
"appos":{
"p":0.6297298691,
"r":0.6251535312,
"f":0.6274333556
},
"poss":{
"p":0.9901549277,
"r":0.9922373258,
"f":0.991195033
},
"cc":{
"p":0.8949894034,
"r":0.8958846289,
"f":0.8954367924
},
"conj":{
"p":0.8215007338,
"r":0.8155080496,
"f":0.8184934228
},
"attr":{
"p":0.9320448636,
"r":0.9461077844,
"f":0.939023675
},
"nsubjpass":{
"p":0.9538310769,
"r":0.9620016839,
"f":0.9578989575
},
"auxpass":{
"p":0.9857727893,
"r":0.9895852366,
"f":0.987675334
},
"mark":{
"p":0.9466316105,
"r":0.9533155267,
"f":0.9499618117
},
"aux":{
"p":0.9880842784,
"r":0.9887876884,
"f":0.9884358583
},
"neg":{
"p":0.954503393,
"r":0.9570125251,
"f":0.9557563123
},
"agent":{
"p":0.9568527919,
"r":0.9609803922,
"f":0.9589121503
},
"relcl":{
"p":0.8651214999,
"r":0.8472073678,
"f":0.8560707263
},
"nummod":{
"p":0.7994555151,
"r":0.8737622555,
"f":0.8349589233
},
"npadvmod":{
"p":0.563337728,
"r":0.5590688546,
"f":0.5611951733
},
"advcl":{
"p":0.7744648874,
"r":0.7716217848,
"f":0.773040722
},
"acomp":{
"p":0.9436843967,
"r":0.9364503482,
"f":0.9400534555
},
"csubj":{
"p":0.7142857143,
"r":0.6292682927,
"f":0.6690871369
},
"acl":{
"p":0.8031420046,
"r":0.797820401,
"f":0.8004723583
},
"dep":{
"p":0.4068692206,
"r":0.2223291627,
"f":0.2875369535
},
"parataxis":{
"p":0.5267783576,
"r":0.5059351095,
"f":0.516146394
},
"xcomp":{
"p":0.9059485087,
"r":0.9057487736,
"f":0.9058486302
},
"prt":{
"p":0.9491716867,
"r":0.943841258,
"f":0.9464989675
},
"pcomp":{
"p":0.9132833186,
"r":0.899293862,
"f":0.9062346051
},
"dative":{
"p":0.8405797101,
"r":0.8846401719,
"f":0.86204731
},
"expl":{
"p":0.9820100744,
"r":0.9896059947,
"f":0.9857934024
},
"case":{
"p":0.9953598578,
"r":0.99516336,
"f":0.9952615992
},
"intj":{
"p":0.6904276986,
"r":0.6372180451,
"f":0.6627565982
},
"predet":{
"p":0.9538377492,
"r":0.958287596,
"f":0.9560574949
},
"meta":{
"p":0.5658652218,
"r":0.6789922796,
"f":0.6172885113
},
"preconj":{
"p":0.8676069154,
"r":0.9343459089,
"f":0.8997405048
},
"oprd":{
"p":0.8184340321,
"r":0.7984962406,
"f":0.8083422134
},
"nmod":{
"p":0.5855472901,
"r":0.3734327347,
"f":0.4560314504
},
"quantmod":{
"p":0.7594771242,
"r":0.7391857506,
"f":0.7491940683
},
"csubjpass":{
"p":0.6043956044,
"r":0.5188679245,
"f":0.5583756345
}
},
"sents_p":0.9516885336,
"sents_r":0.9476935026,
"sents_f":0.9496868166,
"ents_f":0.8938394961,
"ents_p":0.892504864,
"ents_r":0.8951781257,
"ents_per_type":{
"PERSON":{
"p":0.8599633942,
"r":0.8354645884,
"f":0.8475369884
},
"REFERENCE":{
"p":0.9366869466,
"r":0.9524216668,
"f":0.9444887781
},
"GPE":{
"p":0.8593017196,
"r":0.8481637692,
"f":0.8536964175
},
"DATE":{
"p":0.8488595538,
"r":0.8794252575,
"f":0.8638721197
},
"LOC":{
"p":0.7414030261,
"r":0.8068862275,
"f":0.7727598566
}
},
"transformer_loss":102913.1994540562,
"tagger_loss":12005.9850363731,
"parser_loss":53484.7542075259,
"ner_loss":2973.2796252497
},
"requirements":[
"spacy-transformers>=1.3.3,<1.4.0"
]
}