ro_core_news_lg / meta.json
adrianeboyd's picture
Update spaCy pipeline
11996b5
{
"lang":"ro",
"name":"core_news_lg",
"version":"3.7.0",
"description":"Romanian pipeline optimized for CPU. Components: tok2vec, tagger, parser, lemmatizer (trainable_lemmatizer), senter, ner, attribute_ruler.",
"author":"Explosion",
"email":"contact@explosion.ai",
"url":"https://explosion.ai",
"license":"CC BY-SA 4.0",
"spacy_version":">=3.7.0,<3.8.0",
"spacy_git_version":"6b4f77441",
"vectors":{
"width":300,
"vectors":500000,
"keys":500000,
"name":"ro_vectors"
},
"labels":{
"tok2vec":[
],
"tagger":[
"ARROW",
"Af",
"Afcfp-n",
"Afcfson",
"Afcfsrn",
"Afcmpoy",
"Afcms-n",
"Afp",
"Afp-p-n",
"Afp-poy",
"Afp-srn",
"Afpf--n",
"Afpfp-n",
"Afpfp-ny",
"Afpfpoy",
"Afpfpry",
"Afpfson",
"Afpfsoy",
"Afpfsrn",
"Afpfsry",
"Afpm--n",
"Afpmp-n",
"Afpmpoy",
"Afpmpry",
"Afpms-n",
"Afpmsoy",
"Afpmsry",
"Afsfp-n",
"Afsfsrn",
"BULLET",
"COLON",
"COMMA",
"Ccssp",
"Ccsspy",
"Crssp",
"Csssp",
"Cssspy",
"DASH",
"DBLQ",
"Dd3-po---e",
"Dd3-po---o",
"Dd3fpo",
"Dd3fpr",
"Dd3fpr---e",
"Dd3fpr---o",
"Dd3fpr--y",
"Dd3fso",
"Dd3fso---e",
"Dd3fsr",
"Dd3fsr---e",
"Dd3fsr---o",
"Dd3fsr--yo",
"Dd3mpo",
"Dd3mpr",
"Dd3mpr---e",
"Dd3mpr---o",
"Dd3mso---e",
"Dd3msr",
"Dd3msr---e",
"Dd3msr---o",
"Dh1ms",
"Dh3fp",
"Dh3fso",
"Dh3fsr",
"Dh3mp",
"Dh3ms",
"Di3",
"Di3-----y",
"Di3--r---e",
"Di3-po",
"Di3-po---e",
"Di3-sr",
"Di3-sr---e",
"Di3-sr--y",
"Di3fp",
"Di3fpr",
"Di3fpr---e",
"Di3fso",
"Di3fso---e",
"Di3fsr",
"Di3fsr---e",
"Di3mp",
"Di3mpr",
"Di3mpr---e",
"Di3ms",
"Di3ms----e",
"Di3mso---e",
"Di3msr",
"Di3msr---e",
"Ds1fp-p",
"Ds1fp-s",
"Ds1fsop",
"Ds1fsos",
"Ds1fsrp",
"Ds1fsrs",
"Ds1fsrs-y",
"Ds1mp-p",
"Ds1mp-s",
"Ds1ms-p",
"Ds1ms-s",
"Ds1msrs-y",
"Ds2---s",
"Ds2fp-p",
"Ds2fp-s",
"Ds2fsrp",
"Ds2fsrs",
"Ds2mp-p",
"Ds2mp-s",
"Ds2ms-p",
"Ds2ms-s",
"Ds3---p",
"Ds3---s",
"Ds3---sy",
"Ds3fp-s",
"Ds3fsos",
"Ds3fsrs",
"Ds3mp-s",
"Ds3ms-s",
"Dw3--r---e",
"Dw3-po---e",
"Dw3fpr",
"Dw3fso---e",
"Dw3fsr",
"Dw3mpr",
"Dw3mso---e",
"Dw3msr",
"Dz3fsr---e",
"Dz3mso---e",
"Dz3msr---e",
"EQUAL",
"EXCL",
"EXCLHELLIP",
"GE",
"GT",
"HELLIP",
"I",
"LCURL",
"LPAR",
"LSQR",
"LT",
"M",
"Mc-p-d",
"Mc-p-l",
"Mc-s-b",
"Mc-s-d",
"Mc-s-l",
"Mcfp-l",
"Mcfp-ln",
"Mcfprln",
"Mcfprly",
"Mcfsoln",
"Mcfsrl",
"Mcfsrln",
"Mcfsrly",
"Mcmp-l",
"Mcms-ln",
"Mcmsrl",
"Mcmsrln",
"Mcmsrly",
"Mffprln",
"Mffsrln",
"Mlfpo",
"Mlfpr",
"Mlmpr",
"Mo---l",
"Mo---ln",
"Mo-s-r",
"Mofp-ln",
"Mofpoly",
"Mofprly",
"Mofs-l",
"Mofsoln",
"Mofsoly",
"Mofsrln",
"Mofsrly",
"Mompoly",
"Momprly",
"Moms-l",
"Moms-ln",
"Momsoly",
"Momsrly",
"Nc",
"Nc---n",
"Ncf--n",
"Ncfp-n",
"Ncfpoy",
"Ncfpry",
"Ncfs-n",
"Ncfson",
"Ncfsoy",
"Ncfsrn",
"Ncfsry",
"Ncfsryy",
"Ncfsvy",
"Ncm--n",
"Ncmp-n",
"Ncmpoy",
"Ncmpry",
"Ncms-n",
"Ncms-ny",
"Ncms-y",
"Ncmsoy",
"Ncmsrn",
"Ncmsry",
"Ncmsryy",
"Ncmsvn",
"Ncmsvy",
"Np",
"Npfson",
"Npfsoy",
"Npfsrn",
"Npfsry",
"Npmpoy",
"Npmpry",
"Npms-n",
"Npmsoy",
"Npmsry",
"PERCENT",
"PERIOD",
"PLUS",
"PLUSMINUS",
"Pd3-po",
"Pd3fpr",
"Pd3fso",
"Pd3fsr",
"Pd3mpo",
"Pd3mpr",
"Pd3mpr--y",
"Pd3mso",
"Pd3msr",
"Pi3--r",
"Pi3-po",
"Pi3-so",
"Pi3-sr",
"Pi3fpr",
"Pi3fso",
"Pi3fsr",
"Pi3mpr",
"Pi3mso",
"Pi3msr",
"Pi3msr--y",
"Pp1-pa--------w",
"Pp1-pa--y-----w",
"Pp1-pd--------s",
"Pp1-pd--------w",
"Pp1-pd--y-----w",
"Pp1-pr--------s",
"Pp1-sa--------s",
"Pp1-sa--------w",
"Pp1-sa--y-----w",
"Pp1-sd--------s",
"Pp1-sd--------w",
"Pp1-sd--y-----w",
"Pp1-sn--------s",
"Pp2-----------s",
"Pp2-pa--------w",
"Pp2-pa--y-----w",
"Pp2-pd--------w",
"Pp2-pd--y-----w",
"Pp2-pr--------s",
"Pp2-sa--------s",
"Pp2-sa--------w",
"Pp2-sa--y-----w",
"Pp2-sd--------s",
"Pp2-sd--------w",
"Pp2-sd--y-----w",
"Pp2-sn--------s",
"Pp2-so--------s",
"Pp2-sr--------s",
"Pp3-p---------s",
"Pp3-pd--------w",
"Pp3-pd--y-----w",
"Pp3-po--------s",
"Pp3-sd--------w",
"Pp3-sd--y-----w",
"Pp3-so--------s",
"Pp3fpa--------w",
"Pp3fpa--y-----w",
"Pp3fpr--------s",
"Pp3fs---------s",
"Pp3fsa--------w",
"Pp3fsa--y-----w",
"Pp3fso--------s",
"Pp3fsr--------s",
"Pp3fsr--y-----s",
"Pp3mpa--------w",
"Pp3mpa--y-----w",
"Pp3mpr--------s",
"Pp3ms---------s",
"Pp3msa--------w",
"Pp3msa--y-----w",
"Pp3mso--------s",
"Pp3msr--------s",
"Pp3msr--y-----s",
"Ps1fp-s",
"Ps1fsrp",
"Ps1fsrs",
"Ps1mp-p",
"Ps1ms-p",
"Ps2fp-s",
"Ps2fsrp",
"Ps2fsrs",
"Ps3---p",
"Ps3---s",
"Ps3fp-s",
"Ps3fsrs",
"Ps3mp-s",
"Ps3ms-s",
"Pw3--r",
"Pw3-po",
"Pw3-so",
"Pw3fpr",
"Pw3fso",
"Pw3mpr",
"Pw3mso",
"Px3--a--------s",
"Px3--a--------w",
"Px3--a--y-----w",
"Px3--d--------w",
"Px3--d--y-----w",
"Pz3-sr",
"Pz3fsr",
"QUEST",
"QUOT",
"Qf",
"Qn",
"Qs",
"Qs-y",
"Qz",
"Qz-y",
"RCURL",
"RPAR",
"RSQR",
"Rc",
"Rgp",
"Rgpy",
"Rgs",
"Rp",
"Rw",
"Rw-y",
"Rz",
"SCOLON",
"SLASH",
"STAR",
"Sp",
"Spsa",
"Spsay",
"Spsd",
"Spsg",
"Td-po",
"Tdfpr",
"Tdfso",
"Tdfsr",
"Tdmpr",
"Tdmso",
"Tdmsr",
"Tf-so",
"Tffpoy",
"Tffpry",
"Tffs-y",
"Tfmpoy",
"Tfms-y",
"Tfmsoy",
"Tfmsry",
"Ti-po",
"Tifp-y",
"Tifso",
"Tifsr",
"Timso",
"Timsr",
"Tsfp",
"Tsfs",
"Tsmp",
"Tsms",
"UNDERSC",
"Va--1",
"Va--1-----y",
"Va--1p",
"Va--1s",
"Va--1s----y",
"Va--2p",
"Va--2p----y",
"Va--2s",
"Va--2s----y",
"Va--3",
"Va--3-----y",
"Va--3p",
"Va--3p----y",
"Va--3s",
"Va--3s----y",
"Vag",
"Vag-------y",
"Vaii1",
"Vaii2s",
"Vaii3p",
"Vaii3s",
"Vail3p",
"Vail3s",
"Vaip1p",
"Vaip1s",
"Vaip2p",
"Vaip2s",
"Vaip3p",
"Vaip3p----y",
"Vaip3s",
"Vaip3s----y",
"Vais3p",
"Vais3s",
"Vam-2s",
"Vanp",
"Vap--sm",
"Vasp1p",
"Vasp1s",
"Vasp2p",
"Vasp2s",
"Vasp3",
"Vmg",
"Vmg-------y",
"Vmii1",
"Vmii1-----y",
"Vmii2p",
"Vmii2s",
"Vmii3p",
"Vmii3p----y",
"Vmii3s",
"Vmii3s----y",
"Vmil1",
"Vmil1p",
"Vmil2s",
"Vmil3p",
"Vmil3p----y",
"Vmil3s",
"Vmil3s----y",
"Vmip1p",
"Vmip1p----y",
"Vmip1s",
"Vmip1s----y",
"Vmip2p",
"Vmip2s",
"Vmip2s----y",
"Vmip3",
"Vmip3-----y",
"Vmip3p",
"Vmip3s",
"Vmip3s----y",
"Vmis1p",
"Vmis1s",
"Vmis3p",
"Vmis3p----y",
"Vmis3s",
"Vmis3s----y",
"Vmm-2p",
"Vmm-2s",
"Vmnp",
"Vmnp------y",
"Vmp--pf",
"Vmp--pm",
"Vmp--sf",
"Vmp--sm",
"Vmp--sm---y",
"Vmsp1p",
"Vmsp2p",
"Vmsp2s",
"Vmsp3",
"Vmsp3-----y",
"X",
"Y",
"Ya",
"Yn",
"Ynfsoy",
"Ynfsry",
"Ynmsoy",
"Ynmsry",
"Yp",
"Yp,Yn",
"Yp-sr",
"Yr",
"_SP"
],
"parser":[
"ROOT",
"acl",
"advcl",
"advcl:tcl",
"advmod",
"advmod:tmod",
"amod",
"appos",
"aux",
"aux:pass",
"case",
"cc",
"cc:preconj",
"ccomp",
"ccomp:pmod",
"compound",
"conj",
"cop",
"csubj",
"csubj:pass",
"dep",
"det",
"expl",
"expl:impers",
"expl:pass",
"expl:poss",
"expl:pv",
"fixed",
"flat",
"goeswith",
"iobj",
"mark",
"nmod",
"nmod:tmod",
"nsubj",
"nsubj:pass",
"nummod",
"obj",
"obl",
"obl:agent",
"obl:pmod",
"orphan",
"parataxis",
"punct",
"vocative",
"xcomp"
],
"attribute_ruler":[
],
"ner":[
"DATETIME",
"EVENT",
"FACILITY",
"GPE",
"LANGUAGE",
"LOC",
"MONEY",
"NAT_REL_POL",
"NUMERIC_VALUE",
"ORDINAL",
"ORGANIZATION",
"PERIOD",
"PERSON",
"PRODUCT",
"QUANTITY",
"WORK_OF_ART"
]
},
"pipeline":[
"tok2vec",
"tagger",
"parser",
"lemmatizer",
"attribute_ruler",
"ner"
],
"components":[
"tok2vec",
"tagger",
"parser",
"lemmatizer",
"senter",
"attribute_ruler",
"ner"
],
"disabled":[
"senter"
],
"performance":{
"token_acc":0.9980078514,
"token_p":0.9967350492,
"token_r":0.9957244934,
"token_f":0.9959492157,
"tag_acc":0.9657255109,
"sents_p":0.9732262383,
"sents_r":0.9667553191,
"sents_f":0.9699799867,
"dep_uas":0.8875784191,
"dep_las":0.8359473024,
"dep_las_per_type":{
"root":{
"p":0.8880733945,
"r":0.9114877589,
"f":0.8996282528
},
"mark":{
"p":0.9138576779,
"r":0.920754717,
"f":0.9172932331
},
"case":{
"p":0.9649585531,
"r":0.9602549681,
"f":0.9626010148
},
"nmod:tmod":{
"p":0.6538461538,
"r":0.1428571429,
"f":0.2344827586
},
"amod":{
"p":0.9165957447,
"r":0.9173764906,
"f":0.9169859515
},
"nsubj":{
"p":0.8585365854,
"r":0.8341232227,
"f":0.8461538462
},
"nmod":{
"p":0.82421875,
"r":0.8286326312,
"f":0.826419797
},
"aux":{
"p":0.9737335835,
"r":0.9488117002,
"f":0.9611111111
},
"advcl":{
"p":0.618705036,
"r":0.6466165414,
"f":0.6323529412
},
"obj":{
"p":0.811440678,
"r":0.8845265589,
"f":0.8464088398
},
"det":{
"p":0.9608745685,
"r":0.9456398641,
"f":0.953196347
},
"cc":{
"p":0.9308176101,
"r":0.9269311065,
"f":0.9288702929
},
"conj":{
"p":0.5862068966,
"r":0.5515643105,
"f":0.568358209
},
"nummod":{
"p":0.8687022901,
"r":0.8835403727,
"f":0.8760585065
},
"acl":{
"p":0.8,
"r":0.7131782946,
"f":0.7540983607
},
"advmod":{
"p":0.8324742268,
"r":0.8522427441,
"f":0.8422425033
},
"obl":{
"p":0.6857142857,
"r":0.8223350254,
"f":0.7478361223
},
"expl:pass":{
"p":0.8,
"r":0.7407407407,
"f":0.7692307692
},
"nsubj:pass":{
"p":0.8039215686,
"r":0.75,
"f":0.7760252366
},
"fixed":{
"p":0.8815789474,
"r":0.8498942918,
"f":0.8654467169
},
"appos":{
"p":0.49,
"r":0.3740458015,
"f":0.4242424242
},
"parataxis":{
"p":0.1960784314,
"r":0.2857142857,
"f":0.2325581395
},
"aux:pass":{
"p":0.9205298013,
"r":0.9266666667,
"f":0.9235880399
},
"nmod:agent":{
"p":0.0,
"r":0.0,
"f":0.0
},
"ccomp":{
"p":0.8604651163,
"r":0.8604651163,
"f":0.8604651163
},
"nmod:pmod":{
"p":0.0,
"r":0.0,
"f":0.0
},
"iobj":{
"p":0.7692307692,
"r":0.7407407407,
"f":0.7547169811
},
"flat":{
"p":0.8010335917,
"r":0.8157894737,
"f":0.8083441982
},
"cop":{
"p":0.7936507937,
"r":0.8064516129,
"f":0.8
},
"csubj":{
"p":0.8823529412,
"r":0.7142857143,
"f":0.7894736842
},
"obl:agent":{
"p":0.0,
"r":0.0,
"f":0.0
},
"dep":{
"p":0.0,
"r":0.0,
"f":0.0
},
"obl:pmod":{
"p":0.0,
"r":0.0,
"f":0.0
},
"expl:pv":{
"p":0.7887323944,
"r":0.8115942029,
"f":0.8
},
"expl":{
"p":0.6470588235,
"r":0.8148148148,
"f":0.7213114754
},
"expl:poss":{
"p":0.9655172414,
"r":0.9032258065,
"f":0.9333333333
},
"goeswith":{
"p":0.0,
"r":0.0,
"f":0.0
},
"compound":{
"p":0.5,
"r":0.2857142857,
"f":0.3636363636
},
"xcomp":{
"p":0.5172413793,
"r":0.5555555556,
"f":0.5357142857
},
"orphan":{
"p":0.0,
"r":0.0,
"f":0.0
},
"expl:impers":{
"p":0.5,
"r":0.3333333333,
"f":0.4
},
"list":{
"p":0.0,
"r":0.0,
"f":0.0
},
"ccomp:pmod":{
"p":0.5,
"r":0.6666666667,
"f":0.5714285714
},
"csubj:pass":{
"p":0.0,
"r":0.0,
"f":0.0
},
"cc:preconj":{
"p":0.0,
"r":0.0,
"f":0.0
}
},
"lemma_acc":0.9575746914,
"pos_acc":0.9395242502,
"morph_acc":0.9499516228,
"morph_micro_p":0.9905342532,
"morph_micro_r":0.9576173364,
"morph_micro_f":0.9703717599,
"morph_per_feat":{
"Case":{
"p":0.9934882533,
"r":0.9895714104,
"f":0.9915259637
},
"Gender":{
"p":0.9928157298,
"r":0.9847480935,
"f":0.9887654553
},
"Number":{
"p":0.9909584087,
"r":0.9236279364,
"f":0.9561092634
},
"Person":{
"p":0.9876615746,
"r":0.9905715969,
"f":0.9891144454
},
"PronType":{
"p":0.9944674965,
"r":0.993780235,
"f":0.994123747
},
"Polarity":{
"p":0.9967266776,
"r":0.9983606557,
"f":0.9975429975
},
"AdpType":{
"p":0.9993222636,
"r":0.9979695431,
"f":0.9986454453
},
"Definite":{
"p":0.9916586461,
"r":0.9812698413,
"f":0.9864368917
},
"Degree":{
"p":0.9666212534,
"r":0.9529885829,
"f":0.95975651
},
"VerbForm":{
"p":0.9787798408,
"r":0.9813829787,
"f":0.9800796813
},
"Abbr":{
"p":0.9485981308,
"r":0.90625,
"f":0.9269406393
},
"Poss":{
"p":1.0,
"r":0.9927710843,
"f":0.9963724305
},
"NumForm":{
"p":0.987704918,
"r":0.3319559229,
"f":0.4969072165
},
"NumType":{
"p":0.987804878,
"r":0.3337912088,
"f":0.498973306
},
"Reflex":{
"p":1.0,
"r":0.9935897436,
"f":0.9967845659
},
"Strength":{
"p":0.9841897233,
"r":0.9880952381,
"f":0.9861386139
},
"Mood":{
"p":0.9675675676,
"r":0.9853211009,
"f":0.9763636364
},
"Tense":{
"p":0.9726618705,
"r":0.9825581395,
"f":0.9775849602
},
"Variant":{
"p":0.9932432432,
"r":0.9483870968,
"f":0.9702970297
},
"Position":{
"p":1.0,
"r":0.9910714286,
"f":0.9955156951
},
"Number[psor]":{
"p":1.0,
"r":0.9666666667,
"f":0.9830508475
},
"PartType":{
"p":1.0,
"r":0.9459459459,
"f":0.9722222222
},
"Foreign":{
"p":0.0,
"r":0.0,
"f":0.0
}
},
"ents_p":0.7502799552,
"ents_r":0.7721859393,
"ents_f":0.7610753502,
"ents_per_type":{
"DATETIME":{
"p":0.7745098039,
"r":0.8257839721,
"f":0.7993254637
},
"ORGANIZATION":{
"p":0.696875,
"r":0.7101910828,
"f":0.7034700315
},
"FACILITY":{
"p":0.4890510949,
"r":0.5114503817,
"f":0.5
},
"NUMERIC_VALUE":{
"p":0.9008264463,
"r":0.9237288136,
"f":0.9121338912
},
"ORDINAL":{
"p":0.8392857143,
"r":0.8545454545,
"f":0.8468468468
},
"EVENT":{
"p":0.6060606061,
"r":0.5405405405,
"f":0.5714285714
},
"GPE":{
"p":0.844789357,
"r":0.875862069,
"f":0.8600451467
},
"PERSON":{
"p":0.6865443425,
"r":0.7533557047,
"f":0.7184
},
"NAT_REL_POL":{
"p":0.9507042254,
"r":0.9,
"f":0.9246575342
},
"MONEY":{
"p":1.0,
"r":0.8103448276,
"f":0.8952380952
},
"PRODUCT":{
"p":0.6260162602,
"r":0.5620437956,
"f":0.5923076923
},
"LOC":{
"p":0.4938271605,
"r":0.5263157895,
"f":0.5095541401
},
"WORK_OF_ART":{
"p":0.4666666667,
"r":0.3684210526,
"f":0.4117647059
},
"QUANTITY":{
"p":0.8965517241,
"r":1.0,
"f":0.9454545455
},
"LANGUAGE":{
"p":0.5714285714,
"r":1.0,
"f":0.7272727273
},
"PERIOD":{
"p":0.8888888889,
"r":0.7619047619,
"f":0.8205128205
}
},
"speed":8202.777177355
},
"sources":[
{
"name":"UD Romanian RRT v2.8",
"url":"https://github.com/UniversalDependencies/UD_Romanian-RRT",
"license":"CC BY-SA 4.0",
"author":"Barbu Mititelu, Verginica; Irimia, Elena; Perez, Cenel-Augusto; Ion, Radu; Simionescu, Radu; Popel, Martin"
},
{
"name":"RONEC - the Romanian Named Entity Corpus (ca9ce460)",
"url":"https://github.com/dumitrescustefan/ronec",
"license":"MIT",
"author":"Dumitrescu, Stefan Daniel; Avram, Andrei-Marius; Morogan, Luciana; Toma, Stefan"
},
{
"name":"Explosion fastText Vectors (cbow, OSCAR Common Crawl + Wikipedia)",
"url":"https://spacy.io",
"license":"CC0",
"author":"Explosion"
}
],
"requirements":[
]
}