{ "lang":"ro", "name":"core_news_lg", "version":"3.3.0", "description":"Romanian pipeline optimized for CPU. Components: tok2vec, tagger, parser, lemmatizer (trainable_lemmatizer), senter, ner, attribute_ruler.", "author":"Explosion", "email":"contact@explosion.ai", "url":"https://explosion.ai", "license":"CC BY-SA 4.0", "spacy_version":">=3.3.0.dev0,<3.4.0", "spacy_git_version":"849bef2de", "vectors":{ "width":300, "vectors":500000, "keys":500000, "name":"ro_vectors" }, "labels":{ "tok2vec":[ ], "tagger":[ "ARROW", "Af", "Afcfp-n", "Afcfson", "Afcfsrn", "Afcmpoy", "Afcms-n", "Afp", "Afp-p-n", "Afp-poy", "Afp-srn", "Afpf--n", "Afpfp-n", "Afpfp-ny", "Afpfpoy", "Afpfpry", "Afpfson", "Afpfsoy", "Afpfsrn", "Afpfsry", "Afpm--n", "Afpmp-n", "Afpmpoy", "Afpmpry", "Afpms-n", "Afpmsoy", "Afpmsry", "Afsfp-n", "Afsfsrn", "BULLET", "COLON", "COMMA", "Ccssp", "Ccsspy", "Crssp", "Csssp", "Cssspy", "DASH", "DBLQ", "Dd3-po---e", "Dd3-po---o", "Dd3fpo", "Dd3fpr", "Dd3fpr---e", "Dd3fpr---o", "Dd3fpr--y", "Dd3fso", "Dd3fso---e", "Dd3fsr", "Dd3fsr---e", "Dd3fsr---o", "Dd3fsr--yo", "Dd3mpo", "Dd3mpr", "Dd3mpr---e", "Dd3mpr---o", "Dd3mso---e", "Dd3msr", "Dd3msr---e", "Dd3msr---o", "Dh1ms", "Dh3fp", "Dh3fso", "Dh3fsr", "Dh3mp", "Dh3ms", "Di3", "Di3-----y", "Di3--r---e", "Di3-po", "Di3-po---e", "Di3-sr", "Di3-sr---e", "Di3-sr--y", "Di3fp", "Di3fpr", "Di3fpr---e", "Di3fso", "Di3fso---e", "Di3fsr", "Di3fsr---e", "Di3mp", "Di3mpr", "Di3mpr---e", "Di3ms", "Di3ms----e", "Di3mso---e", "Di3msr", "Di3msr---e", "Ds1fp-p", "Ds1fp-s", "Ds1fsop", "Ds1fsos", "Ds1fsrp", "Ds1fsrs", "Ds1fsrs-y", "Ds1mp-p", "Ds1mp-s", "Ds1ms-p", "Ds1ms-s", "Ds1msrs-y", "Ds2---s", "Ds2fp-p", "Ds2fp-s", "Ds2fsrp", "Ds2fsrs", "Ds2mp-p", "Ds2mp-s", "Ds2ms-p", "Ds2ms-s", "Ds3---p", "Ds3---s", "Ds3---sy", "Ds3fp-s", "Ds3fsos", "Ds3fsrs", "Ds3mp-s", "Ds3ms-s", "Dw3--r---e", "Dw3-po---e", "Dw3fpr", "Dw3fso---e", "Dw3fsr", "Dw3mpr", "Dw3mso---e", "Dw3msr", "Dz3fsr---e", "Dz3mso---e", "Dz3msr---e", "EQUAL", "EXCL", "EXCLHELLIP", 
"GE", "GT", "HELLIP", "I", "LCURL", "LPAR", "LSQR", "LT", "M", "Mc-p-d", "Mc-p-l", "Mc-s-b", "Mc-s-d", "Mc-s-l", "Mcfp-l", "Mcfp-ln", "Mcfprln", "Mcfprly", "Mcfsoln", "Mcfsrl", "Mcfsrln", "Mcfsrly", "Mcmp-l", "Mcms-ln", "Mcmsrl", "Mcmsrln", "Mcmsrly", "Mffprln", "Mffsrln", "Mlfpo", "Mlfpr", "Mlmpr", "Mo---l", "Mo---ln", "Mo-s-r", "Mofp-ln", "Mofpoly", "Mofprly", "Mofs-l", "Mofsoln", "Mofsoly", "Mofsrln", "Mofsrly", "Mompoly", "Momprly", "Moms-l", "Moms-ln", "Momsoly", "Momsrly", "Nc", "Nc---n", "Ncf--n", "Ncfp-n", "Ncfpoy", "Ncfpry", "Ncfs-n", "Ncfson", "Ncfsoy", "Ncfsrn", "Ncfsry", "Ncfsryy", "Ncfsvy", "Ncm--n", "Ncmp-n", "Ncmpoy", "Ncmpry", "Ncms-n", "Ncms-ny", "Ncms-y", "Ncmsoy", "Ncmsrn", "Ncmsry", "Ncmsryy", "Ncmsvn", "Ncmsvy", "Np", "Npfson", "Npfsoy", "Npfsrn", "Npfsry", "Npmpoy", "Npmpry", "Npms-n", "Npmsoy", "Npmsry", "PERCENT", "PERIOD", "PLUS", "PLUSMINUS", "Pd3-po", "Pd3fpr", "Pd3fso", "Pd3fsr", "Pd3mpo", "Pd3mpr", "Pd3mpr--y", "Pd3mso", "Pd3msr", "Pi3--r", "Pi3-po", "Pi3-so", "Pi3-sr", "Pi3fpr", "Pi3fso", "Pi3fsr", "Pi3mpr", "Pi3mso", "Pi3msr", "Pi3msr--y", "Pp1-pa--------w", "Pp1-pa--y-----w", "Pp1-pd--------s", "Pp1-pd--------w", "Pp1-pd--y-----w", "Pp1-pr--------s", "Pp1-sa--------s", "Pp1-sa--------w", "Pp1-sa--y-----w", "Pp1-sd--------s", "Pp1-sd--------w", "Pp1-sd--y-----w", "Pp1-sn--------s", "Pp2-----------s", "Pp2-pa--------w", "Pp2-pa--y-----w", "Pp2-pd--------w", "Pp2-pd--y-----w", "Pp2-pr--------s", "Pp2-sa--------s", "Pp2-sa--------w", "Pp2-sa--y-----w", "Pp2-sd--------s", "Pp2-sd--------w", "Pp2-sd--y-----w", "Pp2-sn--------s", "Pp2-so--------s", "Pp2-sr--------s", "Pp3-p---------s", "Pp3-pd--------w", "Pp3-pd--y-----w", "Pp3-po--------s", "Pp3-sd--------w", "Pp3-sd--y-----w", "Pp3-so--------s", "Pp3fpa--------w", "Pp3fpa--y-----w", "Pp3fpr--------s", "Pp3fs---------s", "Pp3fsa--------w", "Pp3fsa--y-----w", "Pp3fso--------s", "Pp3fsr--------s", "Pp3fsr--y-----s", "Pp3mpa--------w", "Pp3mpa--y-----w", "Pp3mpr--------s", "Pp3ms---------s", 
"Pp3msa--------w", "Pp3msa--y-----w", "Pp3mso--------s", "Pp3msr--------s", "Pp3msr--y-----s", "Ps1fp-s", "Ps1fsrp", "Ps1fsrs", "Ps1mp-p", "Ps1ms-p", "Ps2fp-s", "Ps2fsrp", "Ps2fsrs", "Ps3---p", "Ps3---s", "Ps3fp-s", "Ps3fsrs", "Ps3mp-s", "Ps3ms-s", "Pw3--r", "Pw3-po", "Pw3-so", "Pw3fpr", "Pw3fso", "Pw3mpr", "Pw3mso", "Px3--a--------s", "Px3--a--------w", "Px3--a--y-----w", "Px3--d--------w", "Px3--d--y-----w", "Pz3-sr", "Pz3fsr", "QUEST", "QUOT", "Qf", "Qn", "Qs", "Qs-y", "Qz", "Qz-y", "RCURL", "RPAR", "RSQR", "Rc", "Rgp", "Rgpy", "Rgs", "Rp", "Rw", "Rw-y", "Rz", "SCOLON", "SLASH", "STAR", "Sp", "Spsa", "Spsay", "Spsd", "Spsg", "Td-po", "Tdfpr", "Tdfso", "Tdfsr", "Tdmpr", "Tdmso", "Tdmsr", "Tf-so", "Tffpoy", "Tffpry", "Tffs-y", "Tfmpoy", "Tfms-y", "Tfmsoy", "Tfmsry", "Ti-po", "Tifp-y", "Tifso", "Tifsr", "Timso", "Timsr", "Tsfp", "Tsfs", "Tsmp", "Tsms", "UNDERSC", "Va--1", "Va--1-----y", "Va--1p", "Va--1s", "Va--1s----y", "Va--2p", "Va--2p----y", "Va--2s", "Va--2s----y", "Va--3", "Va--3-----y", "Va--3p", "Va--3p----y", "Va--3s", "Va--3s----y", "Vag", "Vag-------y", "Vaii1", "Vaii2s", "Vaii3p", "Vaii3s", "Vail3p", "Vail3s", "Vaip1p", "Vaip1s", "Vaip2p", "Vaip2s", "Vaip3p", "Vaip3p----y", "Vaip3s", "Vaip3s----y", "Vais3p", "Vais3s", "Vam-2s", "Vanp", "Vap--sm", "Vasp1p", "Vasp1s", "Vasp2p", "Vasp2s", "Vasp3", "Vmg", "Vmg-------y", "Vmii1", "Vmii1-----y", "Vmii2p", "Vmii2s", "Vmii3p", "Vmii3p----y", "Vmii3s", "Vmii3s----y", "Vmil1", "Vmil1p", "Vmil2s", "Vmil3p", "Vmil3p----y", "Vmil3s", "Vmil3s----y", "Vmip1p", "Vmip1p----y", "Vmip1s", "Vmip1s----y", "Vmip2p", "Vmip2s", "Vmip2s----y", "Vmip3", "Vmip3-----y", "Vmip3p", "Vmip3s", "Vmip3s----y", "Vmis1p", "Vmis1s", "Vmis3p", "Vmis3p----y", "Vmis3s", "Vmis3s----y", "Vmm-2p", "Vmm-2s", "Vmnp", "Vmnp------y", "Vmp--pf", "Vmp--pm", "Vmp--sf", "Vmp--sm", "Vmp--sm---y", "Vmsp1p", "Vmsp2p", "Vmsp2s", "Vmsp3", "Vmsp3-----y", "X", "Y", "Ya", "Yn", "Ynfsoy", "Ynfsry", "Ynmsoy", "Ynmsry", "Yp", "Yp,Yn", "Yp-sr", "Yr" ], "parser":[ 
"ROOT", "acl", "advcl", "advcl:tcl", "advmod", "advmod:tmod", "amod", "appos", "aux", "aux:pass", "case", "cc", "cc:preconj", "ccomp", "ccomp:pmod", "compound", "conj", "cop", "csubj", "csubj:pass", "dep", "det", "expl", "expl:impers", "expl:pass", "expl:poss", "expl:pv", "fixed", "flat", "goeswith", "iobj", "mark", "nmod", "nmod:tmod", "nsubj", "nsubj:pass", "nummod", "obj", "obl", "obl:agent", "obl:pmod", "orphan", "parataxis", "punct", "vocative", "xcomp" ], "attribute_ruler":[ ], "ner":[ "DATETIME", "EVENT", "FACILITY", "GPE", "LANGUAGE", "LOC", "MONEY", "NAT_REL_POL", "NUMERIC_VALUE", "ORDINAL", "ORGANIZATION", "PERIOD", "PERSON", "PRODUCT", "QUANTITY", "WORK_OF_ART" ] }, "pipeline":[ "tok2vec", "tagger", "parser", "lemmatizer", "attribute_ruler", "ner" ], "components":[ "tok2vec", "tagger", "parser", "lemmatizer", "senter", "attribute_ruler", "ner" ], "disabled":[ "senter" ], "performance":{ "token_acc":0.9990029326, "token_p":0.9967350492, "token_r":0.9957244934, "token_f":0.9959492157, "tag_acc":0.9667810127, "sents_p":0.9744966443, "sents_r":0.9654255319, "sents_f":0.9699398798, "dep_uas":0.8881779116, "dep_las":0.8359210815, "dep_las_per_type":{ "root":{ "p":0.8738738739, "r":0.9133709981, "f":0.8931860037 }, "mark":{ "p":0.927756654, "r":0.920754717, "f":0.9242424242 }, "case":{ "p":0.9589453861, "r":0.9546306712, "f":0.9567831642 }, "nmod:tmod":{ "p":0.5853658537, "r":0.2016806723, "f":0.3 }, "amod":{ "p":0.9114359415, "r":0.9028960818, "f":0.9071459136 }, "nsubj":{ "p":0.8717532468, "r":0.8483412322, "f":0.8598879103 }, "nmod":{ "p":0.8199643494, "r":0.8211353088, "f":0.8205494113 }, "aux":{ "p":0.9776119403, "r":0.957952468, "f":0.9676823638 }, "advcl":{ "p":0.5947712418, "r":0.6842105263, "f":0.6363636364 }, "obj":{ "p":0.8274336283, "r":0.8637413395, "f":0.8451977401 }, "det":{ "p":0.9667812142, "r":0.9558323896, "f":0.9612756264 }, "cc":{ "p":0.9411764706, "r":0.9352818372, "f":0.9382198953 }, "conj":{ "p":0.5930232558, "r":0.5318655852, 
"f":0.5607819181 }, "nummod":{ "p":0.8809891808, "r":0.8850931677, "f":0.8830364059 }, "acl":{ "p":0.8211143695, "r":0.7235142119, "f":0.7692307692 }, "advmod":{ "p":0.818877551, "r":0.8469656992, "f":0.8326848249 }, "obl":{ "p":0.6858359957, "r":0.8172588832, "f":0.7458019687 }, "expl:pass":{ "p":0.7735849057, "r":0.7592592593, "f":0.7663551402 }, "nsubj:pass":{ "p":0.8246753247, "r":0.7743902439, "f":0.7987421384 }, "fixed":{ "p":0.8623655914, "r":0.8477801268, "f":0.855010661 }, "appos":{ "p":0.5085470085, "r":0.4541984733, "f":0.4798387097 }, "parataxis":{ "p":0.0909090909, "r":0.0571428571, "f":0.0701754386 }, "aux:pass":{ "p":0.9215686275, "r":0.94, "f":0.9306930693 }, "nmod:agent":{ "p":0.0, "r":0.0, "f":0.0 }, "ccomp":{ "p":0.873015873, "r":0.8527131783, "f":0.862745098 }, "nmod:pmod":{ "p":0.0, "r":0.0, "f":0.0 }, "iobj":{ "p":0.7710843373, "r":0.7901234568, "f":0.7804878049 }, "flat":{ "p":0.8034825871, "r":0.85, "f":0.8260869565 }, "cop":{ "p":0.8512396694, "r":0.8306451613, "f":0.8408163265 }, "csubj":{ "p":0.8571428571, "r":0.8571428571, "f":0.8571428571 }, "dep":{ "p":0.0, "r":0.0, "f":0.0 }, "obl:agent":{ "p":0.0, "r":0.0, "f":0.0 }, "obl:pmod":{ "p":0.0, "r":0.0, "f":0.0 }, "expl:pv":{ "p":0.7777777778, "r":0.8115942029, "f":0.7943262411 }, "expl":{ "p":0.6285714286, "r":0.8148148148, "f":0.7096774194 }, "vocative":{ "p":0.0, "r":0.0, "f":0.0 }, "expl:poss":{ "p":1.0, "r":0.935483871, "f":0.9666666667 }, "goeswith":{ "p":0.0, "r":0.0, "f":0.0 }, "compound":{ "p":0.3, "r":0.4285714286, "f":0.3529411765 }, "xcomp":{ "p":0.5416666667, "r":0.4814814815, "f":0.5098039216 }, "orphan":{ "p":0.0, "r":0.0, "f":0.0 }, "expl:impers":{ "p":1.0, "r":0.3333333333, "f":0.5 }, "list":{ "p":0.0, "r":0.0, "f":0.0 }, "ccomp:pmod":{ "p":0.3333333333, "r":0.3333333333, "f":0.3333333333 }, "cc:preconj":{ "p":0.0, "r":0.0, "f":0.0 }, "csubj:pass":{ "p":0.0, "r":0.0, "f":0.0 }, "advcl:tcl":{ "p":0.0, "r":0.0, "f":0.0 } }, "lemma_acc":0.9585129152, "pos_acc":0.9403951881, 
"morph_acc":0.9512416806, "morph_micro_p":0.9885162858, "morph_micro_r":0.9585538495, "morph_micro_f":0.9711599991, "morph_per_feat":{ "Case":{ "p":0.9923332481, "r":0.9876637416, "f":0.9899929887 }, "Gender":{ "p":0.9918074111, "r":0.9837479685, "f":0.9877612502 }, "Number":{ "p":0.9894855851, "r":0.9219424839, "f":0.9545206675 }, "Person":{ "p":0.9853113984, "r":0.9882144962, "f":0.986760812 }, "PronType":{ "p":0.9965373961, "r":0.99447132, "f":0.9955032861 }, "Polarity":{ "p":0.9902597403, "r":1.0, "f":0.9951060359 }, "AdpType":{ "p":0.9996606719, "r":0.9969543147, "f":0.9983056591 }, "Definite":{ "p":0.9890903257, "r":0.9785714286, "f":0.9838027607 }, "Degree":{ "p":0.9554355165, "r":0.9503022163, "f":0.9528619529 }, "VerbForm":{ "p":0.9728656519, "r":0.977393617, "f":0.9751243781 }, "Abbr":{ "p":0.9653465347, "r":0.8705357143, "f":0.9154929577 }, "Poss":{ "p":1.0, "r":0.9975903614, "f":0.9987937274 }, "NumForm":{ "p":0.9709543568, "r":0.3223140496, "f":0.4839710445 }, "NumType":{ "p":0.9794238683, "r":0.3269230769, "f":0.4902162719 }, "Reflex":{ "p":1.0, "r":0.9935897436, "f":0.9967845659 }, "Strength":{ "p":0.992, "r":0.9841269841, "f":0.9880478088 }, "Mood":{ "p":0.9588550984, "r":0.9834862385, "f":0.9710144928 }, "Tense":{ "p":0.9627507163, "r":0.976744186, "f":0.9696969697 }, "Variant":{ "p":0.9933774834, "r":0.9677419355, "f":0.9803921569 }, "Position":{ "p":1.0, "r":0.9910714286, "f":0.9955156951 }, "Number[psor]":{ "p":1.0, "r":0.9666666667, "f":0.9830508475 }, "PartType":{ "p":1.0, "r":0.9459459459, "f":0.9722222222 }, "Foreign":{ "p":0.0, "r":0.0, "f":0.0 } }, "ents_p":0.7552238806, "ents_r":0.7775643488, "ents_f":0.766231308, "ents_per_type":{ "DATETIME":{ "p":0.7781569966, "r":0.7944250871, "f":0.7862068966 }, "ORGANIZATION":{ "p":0.6888217523, "r":0.7261146497, "f":0.7069767442 }, "FACILITY":{ "p":0.5714285714, "r":0.5496183206, "f":0.560311284 }, "NUMERIC_VALUE":{ "p":0.8953974895, "r":0.906779661, "f":0.9010526316 }, "ORDINAL":{ "p":0.8103448276, 
"r":0.8545454545, "f":0.8318584071 }, "EVENT":{ "p":0.5526315789, "r":0.5675675676, "f":0.56 }, "GPE":{ "p":0.8464912281, "r":0.8873563218, "f":0.8664421998 }, "PERSON":{ "p":0.7164869029, "r":0.7802013423, "f":0.7469879518 }, "NAT_REL_POL":{ "p":0.925170068, "r":0.9066666667, "f":0.9158249158 }, "MONEY":{ "p":0.9038461538, "r":0.8103448276, "f":0.8545454545 }, "PRODUCT":{ "p":0.608, "r":0.5547445255, "f":0.5801526718 }, "LOC":{ "p":0.5256410256, "r":0.5394736842, "f":0.5324675325 }, "WORK_OF_ART":{ "p":0.2631578947, "r":0.2631578947, "f":0.2631578947 }, "QUANTITY":{ "p":0.8, "r":0.9230769231, "f":0.8571428571 }, "PERIOD":{ "p":0.8823529412, "r":0.7142857143, "f":0.7894736842 }, "LANGUAGE":{ "p":0.8, "r":1.0, "f":0.8888888889 } }, "speed":9115.098662697 }, "sources":[ { "name":"UD Romanian RRT v2.8", "url":"https://github.com/UniversalDependencies/UD_Romanian-RRT", "license":"CC BY-SA 4.0", "author":"Barbu Mititelu, Verginica; Irimia, Elena; Perez, Cenel-Augusto; Ion, Radu; Simionescu, Radu; Popel, Martin" }, { "name":"RONEC - the Romanian Named Entity Corpus (ca9ce460)", "url":"https://github.com/dumitrescustefan/ronec", "license":"MIT", "author":"Dumitrescu, Stefan Daniel; Avram, Andrei-Marius; Morogan, Luciana; Toma, Stefan" }, { "name":"Explosion fastText Vectors (cbow, OSCAR Common Crawl + Wikipedia)", "url":"https://spacy.io", "license":"CC0", "author":"Explosion" } ], "requirements":[ ] }