en_core_web_lg / meta.json
adrianeboyd's picture
Update spaCy pipeline
17c49af
raw
history blame
No virus
10.3 kB
{
"lang":"en",
"name":"core_web_lg",
"version":"3.4.1",
"description":"English pipeline optimized for CPU. Components: tok2vec, tagger, parser, senter, ner, attribute_ruler, lemmatizer.",
"author":"Explosion",
"email":"contact@explosion.ai",
"url":"https://explosion.ai",
"license":"MIT",
"spacy_version":">=3.4.0,<3.5.0",
"spacy_git_version":"2b5f955c2",
"vectors":{
"width":300,
"vectors":514157,
"keys":514157,
"name":"en_vectors"
},
"labels":{
"tok2vec":[
],
"tagger":[
"$",
"''",
",",
"-LRB-",
"-RRB-",
".",
":",
"ADD",
"AFX",
"CC",
"CD",
"DT",
"EX",
"FW",
"HYPH",
"IN",
"JJ",
"JJR",
"JJS",
"LS",
"MD",
"NFP",
"NN",
"NNP",
"NNPS",
"NNS",
"PDT",
"POS",
"PRP",
"PRP$",
"RB",
"RBR",
"RBS",
"RP",
"SYM",
"TO",
"UH",
"VB",
"VBD",
"VBG",
"VBN",
"VBP",
"VBZ",
"WDT",
"WP",
"WP$",
"WRB",
"XX",
"_SP",
"``"
],
"parser":[
"ROOT",
"acl",
"acomp",
"advcl",
"advmod",
"agent",
"amod",
"appos",
"attr",
"aux",
"auxpass",
"case",
"cc",
"ccomp",
"compound",
"conj",
"csubj",
"csubjpass",
"dative",
"dep",
"det",
"dobj",
"expl",
"intj",
"mark",
"meta",
"neg",
"nmod",
"npadvmod",
"nsubj",
"nsubjpass",
"nummod",
"oprd",
"parataxis",
"pcomp",
"pobj",
"poss",
"preconj",
"predet",
"prep",
"prt",
"punct",
"quantmod",
"relcl",
"xcomp"
],
"attribute_ruler":[
],
"lemmatizer":[
],
"ner":[
"CARDINAL",
"DATE",
"EVENT",
"FAC",
"GPE",
"LANGUAGE",
"LAW",
"LOC",
"MONEY",
"NORP",
"ORDINAL",
"ORG",
"PERCENT",
"PERSON",
"PRODUCT",
"QUANTITY",
"TIME",
"WORK_OF_ART"
]
},
"pipeline":[
"tok2vec",
"tagger",
"parser",
"attribute_ruler",
"lemmatizer",
"ner"
],
"components":[
"tok2vec",
"tagger",
"parser",
"senter",
"attribute_ruler",
"lemmatizer",
"ner"
],
"disabled":[
"senter"
],
"performance":{
"token_acc":0.9993092439,
"token_p":0.9956819193,
"token_r":0.9957659295,
"token_f":0.9957239226,
"tag_acc":0.9734404547,
"sents_p":0.9179347826,
"sents_r":0.8913516723,
"sents_f":0.90444794,
"dep_uas":0.9204363007,
"dep_las":0.9023174614,
"dep_las_per_type":{
"prep":{
"p":0.8597877625,
"r":0.8669322709,
"f":0.8633452361
},
"det":{
"p":0.9797074284,
"r":0.9803066134,
"f":0.9800069293
},
"pobj":{
"p":0.963921354,
"r":0.9683879835,
"f":0.9661495063
},
"nsubj":{
"p":0.9573359244,
"r":0.94966046,
"f":0.9534827457
},
"aux":{
"p":0.981595092,
"r":0.9828184813,
"f":0.9822064057
},
"advmod":{
"p":0.8567202029,
"r":0.8526838297,
"f":0.8546972508
},
"relcl":{
"p":0.7682926829,
"r":0.7772133527,
"f":0.7727272727
},
"root":{
"p":0.9196058444,
"r":0.8926710205,
"f":0.9059382741
},
"xcomp":{
"p":0.8853797019,
"r":0.8955491744,
"f":0.8904354033
},
"amod":{
"p":0.9199114468,
"r":0.9153223194,
"f":0.9176111454
},
"compound":{
"p":0.9198242724,
"r":0.9328358209,
"f":0.9262843555
},
"poss":{
"p":0.9735205617,
"r":0.9768518519,
"f":0.9751833618
},
"ccomp":{
"p":0.7757201646,
"r":0.8446028513,
"f":0.8086973479
},
"attr":{
"p":0.9064542484,
"r":0.93313709,
"f":0.919602155
},
"case":{
"p":0.9797330697,
"r":0.991991992,
"f":0.9858244218
},
"mark":{
"p":0.9015625,
"r":0.9173290938,
"f":0.9093774626
},
"intj":{
"p":0.680533752,
"r":0.6351648352,
"f":0.6570670709
},
"advcl":{
"p":0.6686002522,
"r":0.6675900277,
"f":0.6680947581
},
"cc":{
"p":0.8381204182,
"r":0.8341107523,
"f":0.8361107781
},
"neg":{
"p":0.9451371571,
"r":0.9508278976,
"f":0.947973987
},
"conj":{
"p":0.7760468594,
"r":0.7838620342,
"f":0.7799348697
},
"nsubjpass":{
"p":0.9234693878,
"r":0.9282051282,
"f":0.925831202
},
"auxpass":{
"p":0.9468791501,
"r":0.9744874715,
"f":0.9604849573
},
"dobj":{
"p":0.9278213166,
"r":0.9434217866,
"f":0.9355565214
},
"nummod":{
"p":0.9377224199,
"r":0.9315656566,
"f":0.9346338992
},
"npadvmod":{
"p":0.7837218189,
"r":0.7285968028,
"f":0.7551546392
},
"prt":{
"p":0.8103025348,
"r":0.8879928315,
"f":0.8473706712
},
"pcomp":{
"p":0.8873937677,
"r":0.8774509804,
"f":0.8823943662
},
"expl":{
"p":0.9809725159,
"r":0.9935760171,
"f":0.9872340426
},
"acl":{
"p":0.7534883721,
"r":0.7070376432,
"f":0.7295243456
},
"agent":{
"p":0.9042735043,
"r":0.9480286738,
"f":0.9256342957
},
"dative":{
"p":0.7725,
"r":0.7087155963,
"f":0.7392344498
},
"acomp":{
"p":0.9080091533,
"r":0.8997732426,
"f":0.9038724374
},
"dep":{
"p":0.3263473054,
"r":0.1769480519,
"f":0.2294736842
},
"csubj":{
"p":0.7045454545,
"r":0.7337278107,
"f":0.7188405797
},
"quantmod":{
"p":0.8531468531,
"r":0.7928513404,
"f":0.8218947368
},
"nmod":{
"p":0.7539432177,
"r":0.5825716027,
"f":0.6572705397
},
"appos":{
"p":0.6997270246,
"r":0.6672451193,
"f":0.6831001555
},
"predet":{
"p":0.8524590164,
"r":0.8927038627,
"f":0.8721174004
},
"preconj":{
"p":0.5684210526,
"r":0.6279069767,
"f":0.5966850829
},
"oprd":{
"p":0.8322368421,
"r":0.7552238806,
"f":0.7918622848
},
"parataxis":{
"p":0.6323119777,
"r":0.4924078091,
"f":0.5536585366
},
"meta":{
"p":0.8461538462,
"r":0.4230769231,
"f":0.5641025641
},
"csubjpass":{
"p":0.4285714286,
"r":0.5,
"f":0.4615384615
}
},
"ents_p":0.8535469108,
"ents_r":0.8592748397,
"ents_f":0.8564012977,
"ents_per_type":{
"DATE":{
"p":0.8657320872,
"r":0.8822222222,
"f":0.8738993711
},
"GPE":{
"p":0.926199262,
"r":0.910181311,
"f":0.9181204277
},
"ORDINAL":{
"p":0.7826086957,
"r":0.8385093168,
"f":0.8095952024
},
"LOC":{
"p":0.6990291262,
"r":0.6878980892,
"f":0.6934189406
},
"ORG":{
"p":0.8197402597,
"r":0.8366914104,
"f":0.8281291
},
"QUANTITY":{
"p":0.7866666667,
"r":0.6483516484,
"f":0.7108433735
},
"CARDINAL":{
"p":0.8249158249,
"r":0.8739595719,
"f":0.8487297921
},
"PERSON":{
"p":0.8759975445,
"r":0.931462141,
"f":0.9028788358
},
"NORP":{
"p":0.921837228,
"r":0.9152,
"f":0.9185066238
},
"FAC":{
"p":0.3958333333,
"r":0.4384615385,
"f":0.4160583942
},
"TIME":{
"p":0.6994382022,
"r":0.7280701754,
"f":0.7134670487
},
"WORK_OF_ART":{
"p":0.4285714286,
"r":0.3556701031,
"f":0.3887323944
},
"MONEY":{
"p":0.9161676647,
"r":0.9031877214,
"f":0.9096313912
},
"EVENT":{
"p":0.59,
"r":0.3390804598,
"f":0.4306569343
},
"LAW":{
"p":0.5846153846,
"r":0.59375,
"f":0.5891472868
},
"PERCENT":{
"p":0.9175911252,
"r":0.886676876,
"f":0.9018691589
},
"PRODUCT":{
"p":0.4482758621,
"r":0.2464454976,
"f":0.3180428135
},
"LANGUAGE":{
"p":0.7692307692,
"r":0.625,
"f":0.6896551724
}
},
"speed":9221.3523549505
},
"sources":[
{
"name":"OntoNotes 5",
"url":"https://catalog.ldc.upenn.edu/LDC2013T19",
"license":"commercial (licensed by Explosion)",
"author":"Ralph Weischedel, Martha Palmer, Mitchell Marcus, Eduard Hovy, Sameer Pradhan, Lance Ramshaw, Nianwen Xue, Ann Taylor, Jeff Kaufman, Michelle Franchini, Mohammed El-Bachouti, Robert Belvin, Ann Houston"
},
{
"name":"ClearNLP Constituent-to-Dependency Conversion",
"url":"https://github.com/clir/clearnlp-guidelines/blob/master/md/components/dependency_conversion.md",
"license":"Citation provided for reference, no code packaged with model",
"author":"Emory University"
},
{
"name":"WordNet 3.0",
"url":"https://wordnet.princeton.edu/",
"author":"Princeton University",
"license":"WordNet 3.0 License"
},
{
"name":"Explosion Vectors (OSCAR 2109 + Wikipedia + OpenSubtitles + WMT News Crawl)",
"url":"https://github.com/explosion/spacy-vectors-builder",
"license":"CC0",
"author":"Explosion"
}
],
"requirements":[
]
}