{ "lang":"en", "name":"core_web_sm", "version":"3.1.0", "description":"English pipeline optimized for CPU. Components: tok2vec, tagger, parser, senter, ner, attribute_ruler, lemmatizer.", "author":"Explosion", "email":"contact@explosion.ai", "url":"https://explosion.ai", "license":"MIT", "spacy_version":">=3.1.0,<3.2.0", "spacy_git_version":"caba63b74", "vectors":{ "width":0, "vectors":0, "keys":0, "name":null }, "labels":{ "tok2vec":[ ], "tagger":[ "$", "''", ",", "-LRB-", "-RRB-", ".", ":", "ADD", "AFX", "CC", "CD", "DT", "EX", "FW", "HYPH", "IN", "JJ", "JJR", "JJS", "LS", "MD", "NFP", "NN", "NNP", "NNPS", "NNS", "PDT", "POS", "PRP", "PRP$", "RB", "RBR", "RBS", "RP", "SYM", "TO", "UH", "VB", "VBD", "VBG", "VBN", "VBP", "VBZ", "WDT", "WP", "WP$", "WRB", "XX", "``" ], "parser":[ "ROOT", "acl", "acomp", "advcl", "advmod", "agent", "amod", "appos", "attr", "aux", "auxpass", "case", "cc", "ccomp", "compound", "conj", "csubj", "csubjpass", "dative", "dep", "det", "dobj", "expl", "intj", "mark", "meta", "neg", "nmod", "npadvmod", "nsubj", "nsubjpass", "nummod", "oprd", "parataxis", "pcomp", "pobj", "poss", "preconj", "predet", "prep", "prt", "punct", "quantmod", "relcl", "xcomp" ], "senter":[ "I", "S" ], "attribute_ruler":[ ], "lemmatizer":[ ], "ner":[ "CARDINAL", "DATE", "EVENT", "FAC", "GPE", "LANGUAGE", "LAW", "LOC", "MONEY", "NORP", "ORDINAL", "ORG", "PERCENT", "PERSON", "PRODUCT", "QUANTITY", "TIME", "WORK_OF_ART" ] }, "pipeline":[ "tok2vec", "tagger", "parser", "attribute_ruler", "lemmatizer", "ner" ], "components":[ "tok2vec", "tagger", "parser", "senter", "attribute_ruler", "lemmatizer", "ner" ], "disabled":[ "senter" ], "performance":{ "token_acc":0.9993053983, "tag_acc":0.9720712187, "dep_uas":0.9185392711, "dep_las":0.9001546872, "ents_p":0.8424355924, "ents_r":0.8335336538, "ents_f":0.8379609817, "sents_p":0.9074955788, "sents_r":0.8801372122, "sents_f":0.893607046, "speed":10426.0619939972, "dep_las_per_type":{ "prep":{ "p":0.8554402587, "r":0.8633276418, "f":0.8593658527 }, "det":{ "p":0.9772329247, "r":0.9783087336, "f":0.9777705332 }, "pobj":{ "p":0.9603285837, "r":0.9686628706, "f":0.9644777228 }, "nsubj":{ "p":0.9598718747, "r":0.945279299, "f":0.9525197007 }, "aux":{ "p":0.9795737123, "r":0.9819282471, "f":0.9807495665 }, "advmod":{ "p":0.8538267452, "r":0.8541140838, "f":0.8539703903 }, "relcl":{ "p":0.764978602, "r":0.7783018868, "f":0.7715827338 }, "root":{ "p":0.9199754818, "r":0.8910878026, "f":0.9053012533 }, "xcomp":{ "p":0.8813440672, "r":0.903804738, "f":0.892433103 }, "amod":{ "p":0.9171875, "r":0.9127308066, "f":0.9149537263 }, "compound":{ "p":0.916057391, "r":0.9280463355, "f":0.9220128918 }, "poss":{ "p":0.9744672296, "r":0.9756441224, "f":0.9750553209 }, "ccomp":{ "p":0.7747747748, "r":0.8407331976, "f":0.8064075015 }, "attr":{ "p":0.8989490703, "r":0.9352396972, "f":0.9167353669 }, "case":{ "p":0.9801980198, "r":0.990990991, "f":0.9855649577 }, "mark":{ "p":0.9015392781, "r":0.9001059883, "f":0.9008220631 }, "intj":{ "p":0.6712856043, "r":0.6388278388, "f":0.6546546547 }, "advcl":{ "p":0.6687116564, "r":0.6587761269, "f":0.6637067106 }, "cc":{ "p":0.8426682692, "r":0.8385360603, "f":0.8405970865 }, "neg":{ "p":0.9461346633, "r":0.9518314099, "f":0.9489744872 }, "conj":{ "p":0.7715100422, "r":0.7833585096, "f":0.7773891318 }, "nsubjpass":{ "p":0.9296875, "r":0.9153846154, "f":0.9224806202 }, "auxpass":{ "p":0.9496883348, "r":0.9717539863, "f":0.9605944607 }, "dobj":{ "p":0.919667805, "r":0.9442186628, "f":0.9317815437 }, "nummod":{ "p":0.9341637011, "r":0.928030303, "f":0.9310869014 }, "npadvmod":{ "p":0.7723823976, "r":0.723268206, "f":0.7470188956 }, "prt":{ "p":0.8175842235, "r":0.8915770609, "f":0.852978997 }, "pcomp":{ "p":0.890625, "r":0.8781512605, "f":0.8843441467 }, "expl":{ "p":0.978858351, "r":0.9914346895, "f":0.985106383 }, "acl":{ "p":0.7473745624, "r":0.6988543372, "f":0.7223005357 }, "agent":{ "p":0.8937605396, "r":0.9498207885, "f":0.9209383145 }, "dative":{ "p":0.7608695652, "r":0.7224770642, "f":0.7411764706 }, "acomp":{ "p":0.91184573, "r":0.9006802721, "f":0.9062286105 }, "dep":{ "p":0.3689655172, "r":0.1737012987, "f":0.2362030905 }, "csubj":{ "p":0.6424242424, "r":0.6272189349, "f":0.6347305389 }, "quantmod":{ "p":0.8624667258, "r":0.7896019496, "f":0.8244274809 }, "nmod":{ "p":0.7359073359, "r":0.5807434491, "f":0.6491825613 }, "appos":{ "p":0.7011441648, "r":0.6646420824, "f":0.6824053452 }, "predet":{ "p":0.8514056225, "r":0.9098712446, "f":0.8796680498 }, "preconj":{ "p":0.476635514, "r":0.5930232558, "f":0.5284974093 }, "oprd":{ "p":0.8193979933, "r":0.7313432836, "f":0.7728706625 }, "parataxis":{ "p":0.6336088154, "r":0.4989154013, "f":0.5582524272 }, "meta":{ "p":0.7727272727, "r":0.3269230769, "f":0.4594594595 }, "csubjpass":{ "p":0.5, "r":0.8333333333, "f":0.625 } }, "ents_per_type":{ "DATE":{ "p":0.8659955961, "r":0.873968254, "f":0.8699636593 }, "GPE":{ "p":0.9142529395, "r":0.8892608089, "f":0.9015837104 }, "ORG":{ "p":0.789707419, "r":0.8014316013, "f":0.7955263158 }, "FAC":{ "p":0.3679245283, "r":0.3, "f":0.3305084746 }, "CARDINAL":{ "p":0.8146892655, "r":0.8573127229, "f":0.8354577057 }, "PERSON":{ "p":0.8424487259, "r":0.8847911227, "f":0.8631009233 }, "NORP":{ "p":0.9078415521, "r":0.8984, "f":0.9030960997 }, "ORDINAL":{ "p":0.7787114846, "r":0.8633540373, "f":0.8188512518 }, "LOC":{ "p":0.713740458, "r":0.5955414013, "f":0.6493055556 }, "TIME":{ "p":0.712962963, "r":0.6754385965, "f":0.6936936937 }, "PRODUCT":{ "p":0.5510204082, "r":0.2559241706, "f":0.3495145631 }, "QUANTITY":{ "p":0.842519685, "r":0.5879120879, "f":0.6925566343 }, "WORK_OF_ART":{ "p":0.46875, "r":0.3092783505, "f":0.3726708075 }, "EVENT":{ "p":0.595959596, "r":0.3390804598, "f":0.4322344322 }, "MONEY":{ "p":0.9182692308, "r":0.9020070838, "f":0.9100655152 }, "LAW":{ "p":0.5555555556, "r":0.46875, "f":0.5084745763 }, "PERCENT":{ "p":0.92, "r":0.8805513017, "f":0.8998435055 }, "LANGUAGE":{ "p":0.7692307692, "r":0.625, "f":0.6896551724 } } }, "sources":[ { "name":"OntoNotes 5", "url":"https://catalog.ldc.upenn.edu/LDC2013T19", "license":"commercial (licensed by Explosion)", "author":"Ralph Weischedel, Martha Palmer, Mitchell Marcus, Eduard Hovy, Sameer Pradhan, Lance Ramshaw, Nianwen Xue, Ann Taylor, Jeff Kaufman, Michelle Franchini, Mohammed El-Bachouti, Robert Belvin, Ann Houston" }, { "name":"ClearNLP Constituent-to-Dependency Conversion", "url":"https://github.com/clir/clearnlp-guidelines/blob/master/md/components/dependency_conversion.md", "license":"Citation provided for reference, no code packaged with model", "author":"Emory University" }, { "name":"WordNet 3.0", "url":"https://wordnet.princeton.edu/", "author":"Princeton University", "license":"WordNet 3.0 License" } ], "requirements":[ ] }