{ "lang":"en", "name":"core_web_lg", "version":"3.4.1", "description":"English pipeline optimized for CPU. Components: tok2vec, tagger, parser, senter, ner, attribute_ruler, lemmatizer.", "author":"Explosion", "email":"contact@explosion.ai", "url":"https://explosion.ai", "license":"MIT", "spacy_version":">=3.4.0,<3.5.0", "spacy_git_version":"2b5f955c2", "vectors":{ "width":300, "vectors":514157, "keys":514157, "name":"en_vectors" }, "labels":{ "tok2vec":[ ], "tagger":[ "$", "''", ",", "-LRB-", "-RRB-", ".", ":", "ADD", "AFX", "CC", "CD", "DT", "EX", "FW", "HYPH", "IN", "JJ", "JJR", "JJS", "LS", "MD", "NFP", "NN", "NNP", "NNPS", "NNS", "PDT", "POS", "PRP", "PRP$", "RB", "RBR", "RBS", "RP", "SYM", "TO", "UH", "VB", "VBD", "VBG", "VBN", "VBP", "VBZ", "WDT", "WP", "WP$", "WRB", "XX", "_SP", "``" ], "parser":[ "ROOT", "acl", "acomp", "advcl", "advmod", "agent", "amod", "appos", "attr", "aux", "auxpass", "case", "cc", "ccomp", "compound", "conj", "csubj", "csubjpass", "dative", "dep", "det", "dobj", "expl", "intj", "mark", "meta", "neg", "nmod", "npadvmod", "nsubj", "nsubjpass", "nummod", "oprd", "parataxis", "pcomp", "pobj", "poss", "preconj", "predet", "prep", "prt", "punct", "quantmod", "relcl", "xcomp" ], "attribute_ruler":[ ], "lemmatizer":[ ], "ner":[ "CARDINAL", "DATE", "EVENT", "FAC", "GPE", "LANGUAGE", "LAW", "LOC", "MONEY", "NORP", "ORDINAL", "ORG", "PERCENT", "PERSON", "PRODUCT", "QUANTITY", "TIME", "WORK_OF_ART" ] }, "pipeline":[ "tok2vec", "tagger", "parser", "attribute_ruler", "lemmatizer", "ner" ], "components":[ "tok2vec", "tagger", "parser", "senter", "attribute_ruler", "lemmatizer", "ner" ], "disabled":[ "senter" ], "performance":{ "token_acc":0.9993092439, "token_p":0.9956819193, "token_r":0.9957659295, "token_f":0.9957239226, "tag_acc":0.9734404547, "sents_p":0.9179347826, "sents_r":0.8913516723, "sents_f":0.90444794, "dep_uas":0.9204363007, "dep_las":0.9023174614, "dep_las_per_type":{ "prep":{ "p":0.8597877625, "r":0.8669322709, "f":0.8633452361 }, "det":{ "p":0.9797074284, "r":0.9803066134, "f":0.9800069293 }, "pobj":{ "p":0.963921354, "r":0.9683879835, "f":0.9661495063 }, "nsubj":{ "p":0.9573359244, "r":0.94966046, "f":0.9534827457 }, "aux":{ "p":0.981595092, "r":0.9828184813, "f":0.9822064057 }, "advmod":{ "p":0.8567202029, "r":0.8526838297, "f":0.8546972508 }, "relcl":{ "p":0.7682926829, "r":0.7772133527, "f":0.7727272727 }, "root":{ "p":0.9196058444, "r":0.8926710205, "f":0.9059382741 }, "xcomp":{ "p":0.8853797019, "r":0.8955491744, "f":0.8904354033 }, "amod":{ "p":0.9199114468, "r":0.9153223194, "f":0.9176111454 }, "compound":{ "p":0.9198242724, "r":0.9328358209, "f":0.9262843555 }, "poss":{ "p":0.9735205617, "r":0.9768518519, "f":0.9751833618 }, "ccomp":{ "p":0.7757201646, "r":0.8446028513, "f":0.8086973479 }, "attr":{ "p":0.9064542484, "r":0.93313709, "f":0.919602155 }, "case":{ "p":0.9797330697, "r":0.991991992, "f":0.9858244218 }, "mark":{ "p":0.9015625, "r":0.9173290938, "f":0.9093774626 }, "intj":{ "p":0.680533752, "r":0.6351648352, "f":0.6570670709 }, "advcl":{ "p":0.6686002522, "r":0.6675900277, "f":0.6680947581 }, "cc":{ "p":0.8381204182, "r":0.8341107523, "f":0.8361107781 }, "neg":{ "p":0.9451371571, "r":0.9508278976, "f":0.947973987 }, "conj":{ "p":0.7760468594, "r":0.7838620342, "f":0.7799348697 }, "nsubjpass":{ "p":0.9234693878, "r":0.9282051282, "f":0.925831202 }, "auxpass":{ "p":0.9468791501, "r":0.9744874715, "f":0.9604849573 }, "dobj":{ "p":0.9278213166, "r":0.9434217866, "f":0.9355565214 }, "nummod":{ "p":0.9377224199, "r":0.9315656566, "f":0.9346338992 }, "npadvmod":{ "p":0.7837218189, "r":0.7285968028, "f":0.7551546392 }, "prt":{ "p":0.8103025348, "r":0.8879928315, "f":0.8473706712 }, "pcomp":{ "p":0.8873937677, "r":0.8774509804, "f":0.8823943662 }, "expl":{ "p":0.9809725159, "r":0.9935760171, "f":0.9872340426 }, "acl":{ "p":0.7534883721, "r":0.7070376432, "f":0.7295243456 }, "agent":{ "p":0.9042735043, "r":0.9480286738, "f":0.9256342957 }, "dative":{ "p":0.7725, "r":0.7087155963, "f":0.7392344498 }, "acomp":{ "p":0.9080091533, "r":0.8997732426, "f":0.9038724374 }, "dep":{ "p":0.3263473054, "r":0.1769480519, "f":0.2294736842 }, "csubj":{ "p":0.7045454545, "r":0.7337278107, "f":0.7188405797 }, "quantmod":{ "p":0.8531468531, "r":0.7928513404, "f":0.8218947368 }, "nmod":{ "p":0.7539432177, "r":0.5825716027, "f":0.6572705397 }, "appos":{ "p":0.6997270246, "r":0.6672451193, "f":0.6831001555 }, "predet":{ "p":0.8524590164, "r":0.8927038627, "f":0.8721174004 }, "preconj":{ "p":0.5684210526, "r":0.6279069767, "f":0.5966850829 }, "oprd":{ "p":0.8322368421, "r":0.7552238806, "f":0.7918622848 }, "parataxis":{ "p":0.6323119777, "r":0.4924078091, "f":0.5536585366 }, "meta":{ "p":0.8461538462, "r":0.4230769231, "f":0.5641025641 }, "csubjpass":{ "p":0.4285714286, "r":0.5, "f":0.4615384615 } }, "ents_p":0.8535469108, "ents_r":0.8592748397, "ents_f":0.8564012977, "ents_per_type":{ "DATE":{ "p":0.8657320872, "r":0.8822222222, "f":0.8738993711 }, "GPE":{ "p":0.926199262, "r":0.910181311, "f":0.9181204277 }, "ORDINAL":{ "p":0.7826086957, "r":0.8385093168, "f":0.8095952024 }, "LOC":{ "p":0.6990291262, "r":0.6878980892, "f":0.6934189406 }, "ORG":{ "p":0.8197402597, "r":0.8366914104, "f":0.8281291 }, "QUANTITY":{ "p":0.7866666667, "r":0.6483516484, "f":0.7108433735 }, "CARDINAL":{ "p":0.8249158249, "r":0.8739595719, "f":0.8487297921 }, "PERSON":{ "p":0.8759975445, "r":0.931462141, "f":0.9028788358 }, "NORP":{ "p":0.921837228, "r":0.9152, "f":0.9185066238 }, "FAC":{ "p":0.3958333333, "r":0.4384615385, "f":0.4160583942 }, "TIME":{ "p":0.6994382022, "r":0.7280701754, "f":0.7134670487 }, "WORK_OF_ART":{ "p":0.4285714286, "r":0.3556701031, "f":0.3887323944 }, "MONEY":{ "p":0.9161676647, "r":0.9031877214, "f":0.9096313912 }, "EVENT":{ "p":0.59, "r":0.3390804598, "f":0.4306569343 }, "LAW":{ "p":0.5846153846, "r":0.59375, "f":0.5891472868 }, "PERCENT":{ "p":0.9175911252, "r":0.886676876, "f":0.9018691589 }, "PRODUCT":{ "p":0.4482758621, "r":0.2464454976, "f":0.3180428135 }, "LANGUAGE":{ "p":0.7692307692, "r":0.625, "f":0.6896551724 } }, "speed":9221.3523549505 }, "sources":[ { "name":"OntoNotes 5", "url":"https://catalog.ldc.upenn.edu/LDC2013T19", "license":"commercial (licensed by Explosion)", "author":"Ralph Weischedel, Martha Palmer, Mitchell Marcus, Eduard Hovy, Sameer Pradhan, Lance Ramshaw, Nianwen Xue, Ann Taylor, Jeff Kaufman, Michelle Franchini, Mohammed El-Bachouti, Robert Belvin, Ann Houston" }, { "name":"ClearNLP Constituent-to-Dependency Conversion", "url":"https://github.com/clir/clearnlp-guidelines/blob/master/md/components/dependency_conversion.md", "license":"Citation provided for reference, no code packaged with model", "author":"Emory University" }, { "name":"WordNet 3.0", "url":"https://wordnet.princeton.edu/", "author":"Princeton University", "license":"WordNet 3.0 License" }, { "name":"Explosion Vectors (OSCAR 2109 + Wikipedia + OpenSubtitles + WMT News Crawl)", "url":"https://github.com/explosion/spacy-vectors-builder", "license":"CC0", "author":"Explosion" } ], "requirements":[ ] }