en_stonk_pipeline / meta.json
FriendlyUser's picture
Update spaCy pipeline
b950e85
{
"lang":"en",
"name":"stonk_pipeline",
"version":"0.0.1",
"description":" pipeline to extract stonk names, need to adjust for general use as some stonk names are very short. Based on the standard spacy pipeline, but added a pipe and wanted to distribute it easily",
"author":"FriendlyUser",
"email":"davidli012345@gmail.com",
"url":"friendlyuser.github.io",
"license":"",
"spacy_version":">=3.4.1,<3.5.0",
"spacy_git_version":"Unknown",
"vectors":{
"width":0,
"vectors":0,
"keys":0,
"name":null
},
"labels":{
"entity_ruler":[
"COMPANY",
"COUNTRY",
"DIVIDENDS",
"INDEX",
"MAYBE",
"STOCK",
"STOCK_EXCHANGE",
"THINGS"
]
},
"pipeline":[
"entity_ruler"
],
"components":[
"entity_ruler"
],
"disabled":[
],
"performance":{
"token_acc":0.9993092439,
"token_p":0.9956819193,
"token_r":0.9957659295,
"token_f":0.9957239226,
"tag_acc":0.9726250474,
"sents_p":0.9191788296,
"sents_r":0.8890428129,
"sents_f":0.9038596962,
"dep_uas":0.9165718428,
"dep_las":0.8978441095,
"dep_las_per_type":{
"prep":{
"p":0.8546376267,
"r":0.8635553026,
"f":0.8590733226
},
"det":{
"p":0.9768701389,
"r":0.9781048683,
"f":0.9774871137
},
"pobj":{
"p":0.9605592002,
"r":0.9659532692,
"f":0.9632486833
},
"nsubj":{
"p":0.9545715675,
"r":0.9463745893,
"f":0.9504554055
},
"aux":{
"p":0.9798401421,
"r":0.9821953174,
"f":0.9810163162
},
"advmod":{
"p":0.8545653823,
"r":0.8527679623,
"f":0.8536657262
},
"relcl":{
"p":0.7656695157,
"r":0.7801161103,
"f":0.7728253055
},
"root":{
"p":0.91776518,
"r":0.8864041164,
"f":0.9018120805
},
"xcomp":{
"p":0.882290562,
"r":0.895908112,
"f":0.889047195
},
"amod":{
"p":0.9154102213,
"r":0.908649174,
"f":0.9120171674
},
"compound":{
"p":0.9121588361,
"r":0.9287703275,
"f":0.9203896355
},
"poss":{
"p":0.9735258724,
"r":0.9770531401,
"f":0.9752863171
},
"ccomp":{
"p":0.7657557167,
"r":0.8389002037,
"f":0.8006609
},
"attr":{
"p":0.9032126881,
"r":0.9339781329,
"f":0.9183378127
},
"case":{
"p":0.9773063641,
"r":0.9914914915,
"f":0.9843478261
},
"mark":{
"p":0.9002893975,
"r":0.9067302597,
"f":0.9034983498
},
"intj":{
"p":0.6514555468,
"r":0.6065934066,
"f":0.6282245827
},
"advcl":{
"p":0.6653050804,
"r":0.6562578696,
"f":0.6607505071
},
"cc":{
"p":0.8285611165,
"r":0.8237052984,
"f":0.8261260721
},
"neg":{
"p":0.9452191235,
"r":0.9523331661,
"f":0.9487628093
},
"conj":{
"p":0.7577601192,
"r":0.7682527694,
"f":0.7629703713
},
"nsubjpass":{
"p":0.9216589862,
"r":0.9230769231,
"f":0.9223674097
},
"auxpass":{
"p":0.946875,
"r":0.9662870159,
"f":0.9564825254
},
"dobj":{
"p":0.919205298,
"r":0.940154594,
"f":0.9295619288
},
"nummod":{
"p":0.9373886485,
"r":0.9300505051,
"f":0.9337051591
},
"npadvmod":{
"p":0.7748549323,
"r":0.7115452931,
"f":0.7418518519
},
"prt":{
"p":0.8097199341,
"r":0.8808243728,
"f":0.843776824
},
"pcomp":{
"p":0.8756183746,
"r":0.8676470588,
"f":0.8716144917
},
"expl":{
"p":0.9809322034,
"r":0.9914346895,
"f":0.9861554846
},
"acl":{
"p":0.7327887981,
"r":0.6852154937,
"f":0.7082041162
},
"agent":{
"p":0.8959044369,
"r":0.9408602151,
"f":0.9178321678
},
"dative":{
"p":0.7846153846,
"r":0.7018348624,
"f":0.7409200969
},
"acomp":{
"p":0.9127423823,
"r":0.8965986395,
"f":0.90459849
},
"dep":{
"p":0.3786764706,
"r":0.1672077922,
"f":0.231981982
},
"csubj":{
"p":0.7393939394,
"r":0.7218934911,
"f":0.7305389222
},
"quantmod":{
"p":0.8694493783,
"r":0.7952883834,
"f":0.8307170132
},
"nmod":{
"p":0.7147169811,
"r":0.577087142,
"f":0.6385704653
},
"appos":{
"p":0.7100509495,
"r":0.6650759219,
"f":0.686827957
},
"predet":{
"p":0.8636363636,
"r":0.8969957082,
"f":0.88
},
"preconj":{
"p":0.5769230769,
"r":0.6976744186,
"f":0.6315789474
},
"oprd":{
"p":0.8160535117,
"r":0.728358209,
"f":0.7697160883
},
"parataxis":{
"p":0.5835694051,
"r":0.4468546638,
"f":0.5061425061
},
"meta":{
"p":0.8666666667,
"r":0.5,
"f":0.6341463415
},
"csubjpass":{
"p":0.5,
"r":0.6666666667,
"f":0.5714285714
}
},
"ents_p":0.8565043157,
"ents_r":0.8348858173,
"ents_f":0.8455569081,
"ents_per_type":{
"DATE":{
"p":0.8804768041,
"r":0.8676190476,
"f":0.8740006396
},
"GPE":{
"p":0.9239884393,
"r":0.8917712692,
"f":0.9075940383
},
"ORDINAL":{
"p":0.7910447761,
"r":0.8229813665,
"f":0.8066971081
},
"ORG":{
"p":0.8107606679,
"r":0.8109756098,
"f":0.8108681246
},
"FAC":{
"p":0.3902439024,
"r":0.3692307692,
"f":0.3794466403
},
"CARDINAL":{
"p":0.8266978923,
"r":0.8394768133,
"f":0.8330383481
},
"PERSON":{
"p":0.8648820905,
"r":0.885770235,
"f":0.8752015479
},
"NORP":{
"p":0.9130787977,
"r":0.8992,
"f":0.9060862555
},
"TIME":{
"p":0.7492163009,
"r":0.6988304094,
"f":0.7231467474
},
"LOC":{
"p":0.7158273381,
"r":0.6337579618,
"f":0.6722972973
},
"QUANTITY":{
"p":0.7971014493,
"r":0.6043956044,
"f":0.6875
},
"EVENT":{
"p":0.6373626374,
"r":0.3333333333,
"f":0.4377358491
},
"WORK_OF_ART":{
"p":0.5230769231,
"r":0.3505154639,
"f":0.4197530864
},
"LAW":{
"p":0.6304347826,
"r":0.453125,
"f":0.5272727273
},
"MONEY":{
"p":0.9179548157,
"r":0.9114521842,
"f":0.9146919431
},
"PERCENT":{
"p":0.9171974522,
"r":0.8820826953,
"f":0.8992974239
},
"PRODUCT":{
"p":0.5,
"r":0.2274881517,
"f":0.3127035831
},
"LANGUAGE":{
"p":0.8,
"r":0.625,
"f":0.701754386
}
},
"speed":9012.0225085527
},
"sources":[
{
"name":"OntoNotes 5",
"url":"https://catalog.ldc.upenn.edu/LDC2013T19",
"license":"commercial (licensed by Explosion)",
"author":"Ralph Weischedel, Martha Palmer, Mitchell Marcus, Eduard Hovy, Sameer Pradhan, Lance Ramshaw, Nianwen Xue, Ann Taylor, Jeff Kaufman, Michelle Franchini, Mohammed El-Bachouti, Robert Belvin, Ann Houston"
},
{
"name":"ClearNLP Constituent-to-Dependency Conversion",
"url":"https://github.com/clir/clearnlp-guidelines/blob/master/md/components/dependency_conversion.md",
"license":"Citation provided for reference, no code packaged with model",
"author":"Emory University"
},
{
"name":"WordNet 3.0",
"url":"https://wordnet.princeton.edu/",
"author":"Princeton University",
"license":"WordNet 3.0 License"
}
],
"requirements":[
]
}