ro_core_news_lg / meta.json
EC2 Default User
Update spaCy pipeline
0c4ebde
raw
history blame
20.1 kB
{
"lang":"ro",
"name":"core_news_lg",
"version":"3.3.0",
"description":"Romanian pipeline optimized for CPU. Components: tok2vec, tagger, parser, lemmatizer (trainable_lemmatizer), senter, ner, attribute_ruler.",
"author":"Explosion",
"email":"contact@explosion.ai",
"url":"https://explosion.ai",
"license":"CC BY-SA 4.0",
"spacy_version":">=3.3.0.dev0,<3.4.0",
"spacy_git_version":"849bef2de",
"vectors":{
"width":300,
"vectors":500000,
"keys":500000,
"name":"ro_vectors"
},
"labels":{
"tok2vec":[
],
"tagger":[
"ARROW",
"Af",
"Afcfp-n",
"Afcfson",
"Afcfsrn",
"Afcmpoy",
"Afcms-n",
"Afp",
"Afp-p-n",
"Afp-poy",
"Afp-srn",
"Afpf--n",
"Afpfp-n",
"Afpfp-ny",
"Afpfpoy",
"Afpfpry",
"Afpfson",
"Afpfsoy",
"Afpfsrn",
"Afpfsry",
"Afpm--n",
"Afpmp-n",
"Afpmpoy",
"Afpmpry",
"Afpms-n",
"Afpmsoy",
"Afpmsry",
"Afsfp-n",
"Afsfsrn",
"BULLET",
"COLON",
"COMMA",
"Ccssp",
"Ccsspy",
"Crssp",
"Csssp",
"Cssspy",
"DASH",
"DBLQ",
"Dd3-po---e",
"Dd3-po---o",
"Dd3fpo",
"Dd3fpr",
"Dd3fpr---e",
"Dd3fpr---o",
"Dd3fpr--y",
"Dd3fso",
"Dd3fso---e",
"Dd3fsr",
"Dd3fsr---e",
"Dd3fsr---o",
"Dd3fsr--yo",
"Dd3mpo",
"Dd3mpr",
"Dd3mpr---e",
"Dd3mpr---o",
"Dd3mso---e",
"Dd3msr",
"Dd3msr---e",
"Dd3msr---o",
"Dh1ms",
"Dh3fp",
"Dh3fso",
"Dh3fsr",
"Dh3mp",
"Dh3ms",
"Di3",
"Di3-----y",
"Di3--r---e",
"Di3-po",
"Di3-po---e",
"Di3-sr",
"Di3-sr---e",
"Di3-sr--y",
"Di3fp",
"Di3fpr",
"Di3fpr---e",
"Di3fso",
"Di3fso---e",
"Di3fsr",
"Di3fsr---e",
"Di3mp",
"Di3mpr",
"Di3mpr---e",
"Di3ms",
"Di3ms----e",
"Di3mso---e",
"Di3msr",
"Di3msr---e",
"Ds1fp-p",
"Ds1fp-s",
"Ds1fsop",
"Ds1fsos",
"Ds1fsrp",
"Ds1fsrs",
"Ds1fsrs-y",
"Ds1mp-p",
"Ds1mp-s",
"Ds1ms-p",
"Ds1ms-s",
"Ds1msrs-y",
"Ds2---s",
"Ds2fp-p",
"Ds2fp-s",
"Ds2fsrp",
"Ds2fsrs",
"Ds2mp-p",
"Ds2mp-s",
"Ds2ms-p",
"Ds2ms-s",
"Ds3---p",
"Ds3---s",
"Ds3---sy",
"Ds3fp-s",
"Ds3fsos",
"Ds3fsrs",
"Ds3mp-s",
"Ds3ms-s",
"Dw3--r---e",
"Dw3-po---e",
"Dw3fpr",
"Dw3fso---e",
"Dw3fsr",
"Dw3mpr",
"Dw3mso---e",
"Dw3msr",
"Dz3fsr---e",
"Dz3mso---e",
"Dz3msr---e",
"EQUAL",
"EXCL",
"EXCLHELLIP",
"GE",
"GT",
"HELLIP",
"I",
"LCURL",
"LPAR",
"LSQR",
"LT",
"M",
"Mc-p-d",
"Mc-p-l",
"Mc-s-b",
"Mc-s-d",
"Mc-s-l",
"Mcfp-l",
"Mcfp-ln",
"Mcfprln",
"Mcfprly",
"Mcfsoln",
"Mcfsrl",
"Mcfsrln",
"Mcfsrly",
"Mcmp-l",
"Mcms-ln",
"Mcmsrl",
"Mcmsrln",
"Mcmsrly",
"Mffprln",
"Mffsrln",
"Mlfpo",
"Mlfpr",
"Mlmpr",
"Mo---l",
"Mo---ln",
"Mo-s-r",
"Mofp-ln",
"Mofpoly",
"Mofprly",
"Mofs-l",
"Mofsoln",
"Mofsoly",
"Mofsrln",
"Mofsrly",
"Mompoly",
"Momprly",
"Moms-l",
"Moms-ln",
"Momsoly",
"Momsrly",
"Nc",
"Nc---n",
"Ncf--n",
"Ncfp-n",
"Ncfpoy",
"Ncfpry",
"Ncfs-n",
"Ncfson",
"Ncfsoy",
"Ncfsrn",
"Ncfsry",
"Ncfsryy",
"Ncfsvy",
"Ncm--n",
"Ncmp-n",
"Ncmpoy",
"Ncmpry",
"Ncms-n",
"Ncms-ny",
"Ncms-y",
"Ncmsoy",
"Ncmsrn",
"Ncmsry",
"Ncmsryy",
"Ncmsvn",
"Ncmsvy",
"Np",
"Npfson",
"Npfsoy",
"Npfsrn",
"Npfsry",
"Npmpoy",
"Npmpry",
"Npms-n",
"Npmsoy",
"Npmsry",
"PERCENT",
"PERIOD",
"PLUS",
"PLUSMINUS",
"Pd3-po",
"Pd3fpr",
"Pd3fso",
"Pd3fsr",
"Pd3mpo",
"Pd3mpr",
"Pd3mpr--y",
"Pd3mso",
"Pd3msr",
"Pi3--r",
"Pi3-po",
"Pi3-so",
"Pi3-sr",
"Pi3fpr",
"Pi3fso",
"Pi3fsr",
"Pi3mpr",
"Pi3mso",
"Pi3msr",
"Pi3msr--y",
"Pp1-pa--------w",
"Pp1-pa--y-----w",
"Pp1-pd--------s",
"Pp1-pd--------w",
"Pp1-pd--y-----w",
"Pp1-pr--------s",
"Pp1-sa--------s",
"Pp1-sa--------w",
"Pp1-sa--y-----w",
"Pp1-sd--------s",
"Pp1-sd--------w",
"Pp1-sd--y-----w",
"Pp1-sn--------s",
"Pp2-----------s",
"Pp2-pa--------w",
"Pp2-pa--y-----w",
"Pp2-pd--------w",
"Pp2-pd--y-----w",
"Pp2-pr--------s",
"Pp2-sa--------s",
"Pp2-sa--------w",
"Pp2-sa--y-----w",
"Pp2-sd--------s",
"Pp2-sd--------w",
"Pp2-sd--y-----w",
"Pp2-sn--------s",
"Pp2-so--------s",
"Pp2-sr--------s",
"Pp3-p---------s",
"Pp3-pd--------w",
"Pp3-pd--y-----w",
"Pp3-po--------s",
"Pp3-sd--------w",
"Pp3-sd--y-----w",
"Pp3-so--------s",
"Pp3fpa--------w",
"Pp3fpa--y-----w",
"Pp3fpr--------s",
"Pp3fs---------s",
"Pp3fsa--------w",
"Pp3fsa--y-----w",
"Pp3fso--------s",
"Pp3fsr--------s",
"Pp3fsr--y-----s",
"Pp3mpa--------w",
"Pp3mpa--y-----w",
"Pp3mpr--------s",
"Pp3ms---------s",
"Pp3msa--------w",
"Pp3msa--y-----w",
"Pp3mso--------s",
"Pp3msr--------s",
"Pp3msr--y-----s",
"Ps1fp-s",
"Ps1fsrp",
"Ps1fsrs",
"Ps1mp-p",
"Ps1ms-p",
"Ps2fp-s",
"Ps2fsrp",
"Ps2fsrs",
"Ps3---p",
"Ps3---s",
"Ps3fp-s",
"Ps3fsrs",
"Ps3mp-s",
"Ps3ms-s",
"Pw3--r",
"Pw3-po",
"Pw3-so",
"Pw3fpr",
"Pw3fso",
"Pw3mpr",
"Pw3mso",
"Px3--a--------s",
"Px3--a--------w",
"Px3--a--y-----w",
"Px3--d--------w",
"Px3--d--y-----w",
"Pz3-sr",
"Pz3fsr",
"QUEST",
"QUOT",
"Qf",
"Qn",
"Qs",
"Qs-y",
"Qz",
"Qz-y",
"RCURL",
"RPAR",
"RSQR",
"Rc",
"Rgp",
"Rgpy",
"Rgs",
"Rp",
"Rw",
"Rw-y",
"Rz",
"SCOLON",
"SLASH",
"STAR",
"Sp",
"Spsa",
"Spsay",
"Spsd",
"Spsg",
"Td-po",
"Tdfpr",
"Tdfso",
"Tdfsr",
"Tdmpr",
"Tdmso",
"Tdmsr",
"Tf-so",
"Tffpoy",
"Tffpry",
"Tffs-y",
"Tfmpoy",
"Tfms-y",
"Tfmsoy",
"Tfmsry",
"Ti-po",
"Tifp-y",
"Tifso",
"Tifsr",
"Timso",
"Timsr",
"Tsfp",
"Tsfs",
"Tsmp",
"Tsms",
"UNDERSC",
"Va--1",
"Va--1-----y",
"Va--1p",
"Va--1s",
"Va--1s----y",
"Va--2p",
"Va--2p----y",
"Va--2s",
"Va--2s----y",
"Va--3",
"Va--3-----y",
"Va--3p",
"Va--3p----y",
"Va--3s",
"Va--3s----y",
"Vag",
"Vag-------y",
"Vaii1",
"Vaii2s",
"Vaii3p",
"Vaii3s",
"Vail3p",
"Vail3s",
"Vaip1p",
"Vaip1s",
"Vaip2p",
"Vaip2s",
"Vaip3p",
"Vaip3p----y",
"Vaip3s",
"Vaip3s----y",
"Vais3p",
"Vais3s",
"Vam-2s",
"Vanp",
"Vap--sm",
"Vasp1p",
"Vasp1s",
"Vasp2p",
"Vasp2s",
"Vasp3",
"Vmg",
"Vmg-------y",
"Vmii1",
"Vmii1-----y",
"Vmii2p",
"Vmii2s",
"Vmii3p",
"Vmii3p----y",
"Vmii3s",
"Vmii3s----y",
"Vmil1",
"Vmil1p",
"Vmil2s",
"Vmil3p",
"Vmil3p----y",
"Vmil3s",
"Vmil3s----y",
"Vmip1p",
"Vmip1p----y",
"Vmip1s",
"Vmip1s----y",
"Vmip2p",
"Vmip2s",
"Vmip2s----y",
"Vmip3",
"Vmip3-----y",
"Vmip3p",
"Vmip3s",
"Vmip3s----y",
"Vmis1p",
"Vmis1s",
"Vmis3p",
"Vmis3p----y",
"Vmis3s",
"Vmis3s----y",
"Vmm-2p",
"Vmm-2s",
"Vmnp",
"Vmnp------y",
"Vmp--pf",
"Vmp--pm",
"Vmp--sf",
"Vmp--sm",
"Vmp--sm---y",
"Vmsp1p",
"Vmsp2p",
"Vmsp2s",
"Vmsp3",
"Vmsp3-----y",
"X",
"Y",
"Ya",
"Yn",
"Ynfsoy",
"Ynfsry",
"Ynmsoy",
"Ynmsry",
"Yp",
"Yp,Yn",
"Yp-sr",
"Yr"
],
"parser":[
"ROOT",
"acl",
"advcl",
"advcl:tcl",
"advmod",
"advmod:tmod",
"amod",
"appos",
"aux",
"aux:pass",
"case",
"cc",
"cc:preconj",
"ccomp",
"ccomp:pmod",
"compound",
"conj",
"cop",
"csubj",
"csubj:pass",
"dep",
"det",
"expl",
"expl:impers",
"expl:pass",
"expl:poss",
"expl:pv",
"fixed",
"flat",
"goeswith",
"iobj",
"mark",
"nmod",
"nmod:tmod",
"nsubj",
"nsubj:pass",
"nummod",
"obj",
"obl",
"obl:agent",
"obl:pmod",
"orphan",
"parataxis",
"punct",
"vocative",
"xcomp"
],
"attribute_ruler":[
],
"ner":[
"DATETIME",
"EVENT",
"FACILITY",
"GPE",
"LANGUAGE",
"LOC",
"MONEY",
"NAT_REL_POL",
"NUMERIC_VALUE",
"ORDINAL",
"ORGANIZATION",
"PERIOD",
"PERSON",
"PRODUCT",
"QUANTITY",
"WORK_OF_ART"
]
},
"pipeline":[
"tok2vec",
"tagger",
"parser",
"lemmatizer",
"attribute_ruler",
"ner"
],
"components":[
"tok2vec",
"tagger",
"parser",
"lemmatizer",
"senter",
"attribute_ruler",
"ner"
],
"disabled":[
"senter"
],
"performance":{
"token_acc":0.9990029326,
"token_p":0.9967350492,
"token_r":0.9957244934,
"token_f":0.9959492157,
"tag_acc":0.9667810127,
"sents_p":0.9744966443,
"sents_r":0.9654255319,
"sents_f":0.9699398798,
"dep_uas":0.8881779116,
"dep_las":0.8359210815,
"dep_las_per_type":{
"root":{
"p":0.8738738739,
"r":0.9133709981,
"f":0.8931860037
},
"mark":{
"p":0.927756654,
"r":0.920754717,
"f":0.9242424242
},
"case":{
"p":0.9589453861,
"r":0.9546306712,
"f":0.9567831642
},
"nmod:tmod":{
"p":0.5853658537,
"r":0.2016806723,
"f":0.3
},
"amod":{
"p":0.9114359415,
"r":0.9028960818,
"f":0.9071459136
},
"nsubj":{
"p":0.8717532468,
"r":0.8483412322,
"f":0.8598879103
},
"nmod":{
"p":0.8199643494,
"r":0.8211353088,
"f":0.8205494113
},
"aux":{
"p":0.9776119403,
"r":0.957952468,
"f":0.9676823638
},
"advcl":{
"p":0.5947712418,
"r":0.6842105263,
"f":0.6363636364
},
"obj":{
"p":0.8274336283,
"r":0.8637413395,
"f":0.8451977401
},
"det":{
"p":0.9667812142,
"r":0.9558323896,
"f":0.9612756264
},
"cc":{
"p":0.9411764706,
"r":0.9352818372,
"f":0.9382198953
},
"conj":{
"p":0.5930232558,
"r":0.5318655852,
"f":0.5607819181
},
"nummod":{
"p":0.8809891808,
"r":0.8850931677,
"f":0.8830364059
},
"acl":{
"p":0.8211143695,
"r":0.7235142119,
"f":0.7692307692
},
"advmod":{
"p":0.818877551,
"r":0.8469656992,
"f":0.8326848249
},
"obl":{
"p":0.6858359957,
"r":0.8172588832,
"f":0.7458019687
},
"expl:pass":{
"p":0.7735849057,
"r":0.7592592593,
"f":0.7663551402
},
"nsubj:pass":{
"p":0.8246753247,
"r":0.7743902439,
"f":0.7987421384
},
"fixed":{
"p":0.8623655914,
"r":0.8477801268,
"f":0.855010661
},
"appos":{
"p":0.5085470085,
"r":0.4541984733,
"f":0.4798387097
},
"parataxis":{
"p":0.0909090909,
"r":0.0571428571,
"f":0.0701754386
},
"aux:pass":{
"p":0.9215686275,
"r":0.94,
"f":0.9306930693
},
"nmod:agent":{
"p":0.0,
"r":0.0,
"f":0.0
},
"ccomp":{
"p":0.873015873,
"r":0.8527131783,
"f":0.862745098
},
"nmod:pmod":{
"p":0.0,
"r":0.0,
"f":0.0
},
"iobj":{
"p":0.7710843373,
"r":0.7901234568,
"f":0.7804878049
},
"flat":{
"p":0.8034825871,
"r":0.85,
"f":0.8260869565
},
"cop":{
"p":0.8512396694,
"r":0.8306451613,
"f":0.8408163265
},
"csubj":{
"p":0.8571428571,
"r":0.8571428571,
"f":0.8571428571
},
"dep":{
"p":0.0,
"r":0.0,
"f":0.0
},
"obl:agent":{
"p":0.0,
"r":0.0,
"f":0.0
},
"obl:pmod":{
"p":0.0,
"r":0.0,
"f":0.0
},
"expl:pv":{
"p":0.7777777778,
"r":0.8115942029,
"f":0.7943262411
},
"expl":{
"p":0.6285714286,
"r":0.8148148148,
"f":0.7096774194
},
"vocative":{
"p":0.0,
"r":0.0,
"f":0.0
},
"expl:poss":{
"p":1.0,
"r":0.935483871,
"f":0.9666666667
},
"goeswith":{
"p":0.0,
"r":0.0,
"f":0.0
},
"compound":{
"p":0.3,
"r":0.4285714286,
"f":0.3529411765
},
"xcomp":{
"p":0.5416666667,
"r":0.4814814815,
"f":0.5098039216
},
"orphan":{
"p":0.0,
"r":0.0,
"f":0.0
},
"expl:impers":{
"p":1.0,
"r":0.3333333333,
"f":0.5
},
"list":{
"p":0.0,
"r":0.0,
"f":0.0
},
"ccomp:pmod":{
"p":0.3333333333,
"r":0.3333333333,
"f":0.3333333333
},
"cc:preconj":{
"p":0.0,
"r":0.0,
"f":0.0
},
"csubj:pass":{
"p":0.0,
"r":0.0,
"f":0.0
},
"advcl:tcl":{
"p":0.0,
"r":0.0,
"f":0.0
}
},
"lemma_acc":0.9585129152,
"pos_acc":0.9403951881,
"morph_acc":0.9512416806,
"morph_micro_p":0.9885162858,
"morph_micro_r":0.9585538495,
"morph_micro_f":0.9711599991,
"morph_per_feat":{
"Case":{
"p":0.9923332481,
"r":0.9876637416,
"f":0.9899929887
},
"Gender":{
"p":0.9918074111,
"r":0.9837479685,
"f":0.9877612502
},
"Number":{
"p":0.9894855851,
"r":0.9219424839,
"f":0.9545206675
},
"Person":{
"p":0.9853113984,
"r":0.9882144962,
"f":0.986760812
},
"PronType":{
"p":0.9965373961,
"r":0.99447132,
"f":0.9955032861
},
"Polarity":{
"p":0.9902597403,
"r":1.0,
"f":0.9951060359
},
"AdpType":{
"p":0.9996606719,
"r":0.9969543147,
"f":0.9983056591
},
"Definite":{
"p":0.9890903257,
"r":0.9785714286,
"f":0.9838027607
},
"Degree":{
"p":0.9554355165,
"r":0.9503022163,
"f":0.9528619529
},
"VerbForm":{
"p":0.9728656519,
"r":0.977393617,
"f":0.9751243781
},
"Abbr":{
"p":0.9653465347,
"r":0.8705357143,
"f":0.9154929577
},
"Poss":{
"p":1.0,
"r":0.9975903614,
"f":0.9987937274
},
"NumForm":{
"p":0.9709543568,
"r":0.3223140496,
"f":0.4839710445
},
"NumType":{
"p":0.9794238683,
"r":0.3269230769,
"f":0.4902162719
},
"Reflex":{
"p":1.0,
"r":0.9935897436,
"f":0.9967845659
},
"Strength":{
"p":0.992,
"r":0.9841269841,
"f":0.9880478088
},
"Mood":{
"p":0.9588550984,
"r":0.9834862385,
"f":0.9710144928
},
"Tense":{
"p":0.9627507163,
"r":0.976744186,
"f":0.9696969697
},
"Variant":{
"p":0.9933774834,
"r":0.9677419355,
"f":0.9803921569
},
"Position":{
"p":1.0,
"r":0.9910714286,
"f":0.9955156951
},
"Number[psor]":{
"p":1.0,
"r":0.9666666667,
"f":0.9830508475
},
"PartType":{
"p":1.0,
"r":0.9459459459,
"f":0.9722222222
},
"Foreign":{
"p":0.0,
"r":0.0,
"f":0.0
}
},
"ents_p":0.7552238806,
"ents_r":0.7775643488,
"ents_f":0.766231308,
"ents_per_type":{
"DATETIME":{
"p":0.7781569966,
"r":0.7944250871,
"f":0.7862068966
},
"ORGANIZATION":{
"p":0.6888217523,
"r":0.7261146497,
"f":0.7069767442
},
"FACILITY":{
"p":0.5714285714,
"r":0.5496183206,
"f":0.560311284
},
"NUMERIC_VALUE":{
"p":0.8953974895,
"r":0.906779661,
"f":0.9010526316
},
"ORDINAL":{
"p":0.8103448276,
"r":0.8545454545,
"f":0.8318584071
},
"EVENT":{
"p":0.5526315789,
"r":0.5675675676,
"f":0.56
},
"GPE":{
"p":0.8464912281,
"r":0.8873563218,
"f":0.8664421998
},
"PERSON":{
"p":0.7164869029,
"r":0.7802013423,
"f":0.7469879518
},
"NAT_REL_POL":{
"p":0.925170068,
"r":0.9066666667,
"f":0.9158249158
},
"MONEY":{
"p":0.9038461538,
"r":0.8103448276,
"f":0.8545454545
},
"PRODUCT":{
"p":0.608,
"r":0.5547445255,
"f":0.5801526718
},
"LOC":{
"p":0.5256410256,
"r":0.5394736842,
"f":0.5324675325
},
"WORK_OF_ART":{
"p":0.2631578947,
"r":0.2631578947,
"f":0.2631578947
},
"QUANTITY":{
"p":0.8,
"r":0.9230769231,
"f":0.8571428571
},
"PERIOD":{
"p":0.8823529412,
"r":0.7142857143,
"f":0.7894736842
},
"LANGUAGE":{
"p":0.8,
"r":1.0,
"f":0.8888888889
}
},
"speed":9115.098662697
},
"sources":[
{
"name":"UD Romanian RRT v2.8",
"url":"https://github.com/UniversalDependencies/UD_Romanian-RRT",
"license":"CC BY-SA 4.0",
"author":"Barbu Mititelu, Verginica; Irimia, Elena; Perez, Cenel-Augusto; Ion, Radu; Simionescu, Radu; Popel, Martin"
},
{
"name":"RONEC - the Romanian Named Entity Corpus (ca9ce460)",
"url":"https://github.com/dumitrescustefan/ronec",
"license":"MIT",
"author":"Dumitrescu, Stefan Daniel; Avram, Andrei-Marius; Morogan, Luciana; Toma, Stefan"
},
{
"name":"Explosion fastText Vectors (cbow, OSCAR Common Crawl + Wikipedia)",
"url":"https://spacy.io",
"license":"CC0",
"author":"Explosion"
}
],
"requirements":[
]
}