{ "lang":"nl", "name":"core_news_lg", "version":"3.2.0", "description":"Dutch pipeline optimized for CPU. Components: tok2vec, morphologizer, tagger, parser, senter, ner, attribute_ruler, lemmatizer.", "author":"Explosion", "email":"contact@explosion.ai", "url":"https://explosion.ai", "license":"CC BY-SA 4.0", "spacy_version":">=3.2.0,<3.3.0", "spacy_git_version":"bb26550e2", "vectors":{ "width":300, "vectors":500000, "keys":500000, "name":"nl_vectors" }, "labels":{ "tok2vec":[ ], "morphologizer":[ "POS=PRON|Person=3|PronType=Dem", "Number=Sing|POS=AUX|Tense=Pres|VerbForm=Fin", "POS=ADV", "POS=VERB|VerbForm=Part", "POS=PUNCT", "Number=Sing|POS=AUX|Tense=Past|VerbForm=Fin", "POS=ADP", "POS=NUM", "Number=Plur|POS=NOUN", "POS=VERB|VerbForm=Inf", "POS=SCONJ", "Definite=Def|POS=DET", "Gender=Com|Number=Sing|POS=NOUN", "Number=Sing|POS=VERB|Tense=Pres|VerbForm=Fin", "Degree=Pos|POS=ADJ", "Gender=Neut|Number=Sing|POS=PROPN", "Gender=Com|Number=Sing|POS=PROPN", "POS=AUX|VerbForm=Inf", "Number=Sing|POS=VERB|Tense=Past|VerbForm=Fin", "POS=DET", "Gender=Neut|Number=Sing|POS=NOUN", "POS=PRON|Person=3|PronType=Prs", "POS=CCONJ", "Number=Plur|POS=VERB|Tense=Pres|VerbForm=Fin", "POS=PRON|Person=3|PronType=Ind", "Degree=Cmp|POS=ADJ", "Case=Nom|POS=PRON|Person=1|PronType=Prs", "Definite=Ind|POS=DET", "Case=Nom|POS=PRON|Person=3|PronType=Prs", "POS=PRON|Person=3|Poss=Yes|PronType=Prs", "Number=Plur|POS=AUX|Tense=Pres|VerbForm=Fin", "POS=PRON|PronType=Rel", "Case=Acc|POS=PRON|Person=1|PronType=Prs", "Number=Plur|POS=VERB|Tense=Past|VerbForm=Fin", "Gender=Com,Neut|Number=Sing|POS=NOUN", "Case=Acc|POS=PRON|Person=3|PronType=Prs|Reflex=Yes", "Case=Acc|POS=PRON|Person=3|PronType=Prs", "POS=PROPN", "POS=PRON|PronType=Ind", "POS=PRON|Person=3|PronType=Int", "Case=Acc|POS=PRON|PronType=Rcp", "Number=Plur|POS=AUX|Tense=Past|VerbForm=Fin", "Number=Sing|POS=NOUN", "POS=PRON|Person=1|Poss=Yes|PronType=Prs", "POS=SYM", "Abbr=Yes|POS=X", "Gender=Com,Neut|Number=Sing|POS=PROPN", "Degree=Sup|POS=ADJ", "POS=ADJ", "Number=Sing|POS=PROPN", "POS=PRON|PronType=Dem", "POS=AUX|VerbForm=Part", "POS=PRON|Person=3|PronType=Rel", "Number=Plur|POS=PROPN", "POS=PRON|Person=2|Poss=Yes|PronType=Prs", "Case=Dat|POS=PRON|PronType=Dem", "Case=Nom|POS=PRON|Person=2|PronType=Prs", "POS=INTJ", "Case=Acc|POS=PRON|Person=2|PronType=Prs", "Case=Gen|POS=PRON|Person=3|Poss=Yes|PronType=Prs", "POS=PRON|PronType=Int", "POS=PRON|Person=2|PronType=Prs", "POS=PRON|Person=3", "Case=Gen|POS=PRON|Person=2|PronType=Prs", "POS=X" ], "tagger":[ "ADJ|nom|basis|met-e|mv-n", "ADJ|nom|basis|met-e|zonder-n|bijz", "ADJ|nom|basis|met-e|zonder-n|stan", "ADJ|nom|basis|zonder|mv-n", "ADJ|nom|basis|zonder|zonder-n", "ADJ|nom|comp|met-e|mv-n", "ADJ|nom|comp|met-e|zonder-n|stan", "ADJ|nom|sup|met-e|mv-n", "ADJ|nom|sup|met-e|zonder-n|bijz", "ADJ|nom|sup|met-e|zonder-n|stan", "ADJ|nom|sup|zonder|zonder-n", "ADJ|postnom|basis|met-s", "ADJ|postnom|basis|zonder", "ADJ|postnom|comp|met-s", "ADJ|prenom|basis|met-e|bijz", "ADJ|prenom|basis|met-e|stan", "ADJ|prenom|basis|zonder", "ADJ|prenom|comp|met-e|stan", "ADJ|prenom|comp|zonder", "ADJ|prenom|sup|met-e|stan", "ADJ|prenom|sup|zonder", "ADJ|vrij|basis|zonder", "ADJ|vrij|comp|zonder", "ADJ|vrij|dim|zonder", "ADJ|vrij|sup|zonder", "BW", "LET", "LID|bep|dat|evmo", "LID|bep|gen|evmo", "LID|bep|gen|rest3", "LID|bep|stan|evon", "LID|bep|stan|rest", "LID|onbep|stan|agr", "N|eigen|ev|basis|gen", "N|eigen|ev|basis|genus|stan", "N|eigen|ev|basis|onz|stan", "N|eigen|ev|basis|zijd|stan", "N|eigen|ev|dim|onz|stan", "N|eigen|mv|basis", "N|soort|ev|basis|dat", "N|soort|ev|basis|gen", "N|soort|ev|basis|genus|stan", "N|soort|ev|basis|onz|stan", "N|soort|ev|basis|zijd|stan", "N|soort|ev|dim|onz|stan", "N|soort|mv|basis", "N|soort|mv|dim", "SPEC|afgebr", "SPEC|afk", "SPEC|deeleigen", "SPEC|enof", "SPEC|meta", "SPEC|symb", "SPEC|vreemd", "TSW", "TW|hoofd|nom|mv-n|basis", "TW|hoofd|nom|mv-n|dim", "TW|hoofd|nom|zonder-n|basis", "TW|hoofd|nom|zonder-n|dim", "TW|hoofd|prenom|stan", "TW|hoofd|vrij", "TW|rang|nom|mv-n", "TW|rang|nom|zonder-n", "TW|rang|prenom|stan", "VG|neven", "VG|onder", "VNW|aanw|adv-pron|obl|vol|3o|getal", "VNW|aanw|adv-pron|stan|red|3|getal", "VNW|aanw|det|dat|nom|met-e|zonder-n", "VNW|aanw|det|dat|prenom|met-e|evmo", "VNW|aanw|det|gen|prenom|met-e|rest3", "VNW|aanw|det|stan|nom|met-e|mv-n", "VNW|aanw|det|stan|nom|met-e|zonder-n", "VNW|aanw|det|stan|prenom|met-e|rest", "VNW|aanw|det|stan|prenom|zonder|agr", "VNW|aanw|det|stan|prenom|zonder|evon", "VNW|aanw|det|stan|prenom|zonder|rest", "VNW|aanw|det|stan|vrij|zonder", "VNW|aanw|pron|gen|vol|3m|ev", "VNW|aanw|pron|stan|vol|3o|ev", "VNW|aanw|pron|stan|vol|3|getal", "VNW|betr|det|stan|nom|met-e|zonder-n", "VNW|betr|det|stan|nom|zonder|zonder-n", "VNW|betr|pron|stan|vol|3|ev", "VNW|betr|pron|stan|vol|persoon|getal", "VNW|bez|det|gen|vol|3|ev|prenom|met-e|rest3", "VNW|bez|det|stan|nadr|2v|mv|prenom|zonder|agr", "VNW|bez|det|stan|red|1|ev|prenom|zonder|agr", "VNW|bez|det|stan|red|2v|ev|prenom|zonder|agr", "VNW|bez|det|stan|red|3|ev|prenom|zonder|agr", "VNW|bez|det|stan|vol|1|ev|prenom|met-e|rest", "VNW|bez|det|stan|vol|1|ev|prenom|zonder|agr", "VNW|bez|det|stan|vol|1|mv|prenom|met-e|rest", "VNW|bez|det|stan|vol|1|mv|prenom|zonder|evon", "VNW|bez|det|stan|vol|2v|ev|prenom|zonder|agr", "VNW|bez|det|stan|vol|2|getal|prenom|zonder|agr", "VNW|bez|det|stan|vol|3m|ev|nom|met-e|zonder-n", "VNW|bez|det|stan|vol|3m|ev|prenom|met-e|rest", "VNW|bez|det|stan|vol|3p|mv|prenom|met-e|rest", "VNW|bez|det|stan|vol|3v|ev|nom|met-e|zonder-n", "VNW|bez|det|stan|vol|3v|ev|prenom|met-e|rest", "VNW|bez|det|stan|vol|3|ev|prenom|zonder|agr", "VNW|bez|det|stan|vol|3|mv|prenom|zonder|agr", "VNW|excl|pron|stan|vol|3|getal", "VNW|onbep|adv-pron|gen|red|3|getal", "VNW|onbep|adv-pron|obl|vol|3o|getal", "VNW|onbep|det|stan|nom|met-e|mv-n", "VNW|onbep|det|stan|nom|met-e|zonder-n", "VNW|onbep|det|stan|nom|zonder|zonder-n", "VNW|onbep|det|stan|prenom|met-e|agr", "VNW|onbep|det|stan|prenom|met-e|evz", "VNW|onbep|det|stan|prenom|met-e|mv", "VNW|onbep|det|stan|prenom|met-e|rest", "VNW|onbep|det|stan|prenom|zonder|agr", "VNW|onbep|det|stan|prenom|zonder|evon", "VNW|onbep|det|stan|vrij|zonder", "VNW|onbep|grad|gen|nom|met-e|mv-n|basis", "VNW|onbep|grad|stan|nom|met-e|mv-n|basis", "VNW|onbep|grad|stan|nom|met-e|mv-n|sup", "VNW|onbep|grad|stan|nom|met-e|zonder-n|basis", "VNW|onbep|grad|stan|nom|met-e|zonder-n|sup", "VNW|onbep|grad|stan|prenom|met-e|agr|basis", "VNW|onbep|grad|stan|prenom|met-e|agr|comp", "VNW|onbep|grad|stan|prenom|met-e|agr|sup", "VNW|onbep|grad|stan|prenom|met-e|mv|basis", "VNW|onbep|grad|stan|prenom|zonder|agr|basis", "VNW|onbep|grad|stan|prenom|zonder|agr|comp", "VNW|onbep|grad|stan|vrij|zonder|basis", "VNW|onbep|grad|stan|vrij|zonder|comp", "VNW|onbep|grad|stan|vrij|zonder|sup", "VNW|onbep|pron|gen|vol|3p|ev", "VNW|onbep|pron|stan|vol|3o|ev", "VNW|onbep|pron|stan|vol|3p|ev", "VNW|pers|pron|gen|vol|2|getal", "VNW|pers|pron|nomin|nadr|3m|ev|masc", "VNW|pers|pron|nomin|nadr|3v|ev|fem", "VNW|pers|pron|nomin|red|1|mv", "VNW|pers|pron|nomin|red|2v|ev", "VNW|pers|pron|nomin|red|2|getal", "VNW|pers|pron|nomin|red|3p|ev|masc", "VNW|pers|pron|nomin|red|3|ev|masc", "VNW|pers|pron|nomin|vol|1|ev", "VNW|pers|pron|nomin|vol|1|mv", "VNW|pers|pron|nomin|vol|2b|getal", "VNW|pers|pron|nomin|vol|2v|ev", "VNW|pers|pron|nomin|vol|2|getal", "VNW|pers|pron|nomin|vol|3p|mv", "VNW|pers|pron|nomin|vol|3v|ev|fem", "VNW|pers|pron|nomin|vol|3|ev|masc", "VNW|pers|pron|obl|nadr|3m|ev|masc", "VNW|pers|pron|obl|red|3|ev|masc", "VNW|pers|pron|obl|vol|2v|ev", "VNW|pers|pron|obl|vol|3p|mv", "VNW|pers|pron|obl|vol|3|ev|masc", "VNW|pers|pron|obl|vol|3|getal|fem", "VNW|pers|pron|stan|nadr|2v|mv", "VNW|pers|pron|stan|red|3|ev|fem", "VNW|pers|pron|stan|red|3|ev|onz", "VNW|pers|pron|stan|red|3|mv", "VNW|pr|pron|obl|nadr|1|ev", "VNW|pr|pron|obl|nadr|2v|getal", "VNW|pr|pron|obl|nadr|2|getal", "VNW|pr|pron|obl|red|1|ev", "VNW|pr|pron|obl|red|2v|getal", "VNW|pr|pron|obl|vol|1|ev", "VNW|pr|pron|obl|vol|1|mv", "VNW|pr|pron|obl|vol|2|getal", "VNW|recip|pron|gen|vol|persoon|mv", "VNW|recip|pron|obl|vol|persoon|mv", "VNW|refl|pron|obl|nadr|3|getal", "VNW|refl|pron|obl|red|3|getal", "VNW|vb|adv-pron|obl|vol|3o|getal", "VNW|vb|det|stan|nom|met-e|zonder-n", "VNW|vb|det|stan|prenom|met-e|rest", "VNW|vb|det|stan|prenom|zonder|evon", "VNW|vb|pron|gen|vol|3m|ev", "VNW|vb|pron|gen|vol|3p|mv", "VNW|vb|pron|gen|vol|3v|ev", "VNW|vb|pron|stan|vol|3o|ev", "VNW|vb|pron|stan|vol|3p|getal", "VZ|fin", "VZ|init", "VZ|versm", "WW|inf|nom|zonder|zonder-n", "WW|inf|prenom|met-e", "WW|inf|vrij|zonder", "WW|od|nom|met-e|mv-n", "WW|od|nom|met-e|zonder-n", "WW|od|prenom|met-e", "WW|od|prenom|zonder", "WW|od|vrij|zonder", "WW|pv|conj|ev", "WW|pv|tgw|ev", "WW|pv|tgw|met-t", "WW|pv|tgw|mv", "WW|pv|verl|ev", "WW|pv|verl|mv", "WW|vd|nom|met-e|mv-n", "WW|vd|nom|met-e|zonder-n", "WW|vd|prenom|met-e", "WW|vd|prenom|zonder", "WW|vd|vrij|zonder" ], "parser":[ "ROOT", "acl", "acl:relcl", "advcl", "advmod", "amod", "appos", "aux", "aux:pass", "case", "cc", "ccomp", "compound:prt", "conj", "cop", "csubj", "dep", "det", "expl", "expl:pv", "fixed", "flat", "iobj", "mark", "nmod", "nmod:poss", "nsubj", "nsubj:pass", "nummod", "obj", "obl", "obl:agent", "orphan", "parataxis", "punct", "xcomp" ], "senter":[ "I", "S" ], "attribute_ruler":[ ], "lemmatizer":[ ], "ner":[ "CARDINAL", "DATE", "EVENT", "FAC", "GPE", "LANGUAGE", "LAW", "LOC", "MONEY", "NORP", "ORDINAL", "ORG", "PERCENT", "PERSON", "PRODUCT", "QUANTITY", "TIME", "WORK_OF_ART" ] }, "pipeline":[ "tok2vec", "morphologizer", "tagger", "parser", "attribute_ruler", "lemmatizer", "ner" ], "components":[ "tok2vec", "morphologizer", "tagger", "parser", "senter", "attribute_ruler", "lemmatizer", "ner" ], "disabled":[ "senter" ], "performance":{ "token_acc":0.9997165842, "token_p":0.9974281853, "token_r":0.9975586363, "token_f":0.9974934066, "pos_acc":0.9667175573, "morph_acc":0.9649471044, "morph_micro_p":0.9743803954, "morph_micro_r":0.9558803442, "morph_micro_f":0.9650417155, "morph_per_feat":{ "Person":{ "p":0.9921875, "r":0.9713193117, "f":0.9816425121 }, "Poss":{ "p":0.9885496183, "r":0.9923371648, "f":0.9904397706 }, "PronType":{ "p":0.9914529915, "r":0.9642560266, "f":0.9776654024 }, "Gender":{ "p":0.9408033827, "r":0.9056219791, "f":0.9228775113 }, "Number":{ "p":0.9837895703, "r":0.9628798084, "f":0.9732223903 }, "Tense":{ "p":0.9777901166, "r":0.9681143485, "f":0.9729281768 }, "VerbForm":{ "p":0.9640653358, "r":0.9557394746, "f":0.9598843513 }, "Degree":{ "p":0.9628550619, "r":0.9497126437, "f":0.956238698 }, "Definite":{ "p":0.9955869373, "r":0.9929577465, "f":0.9942706038 }, "Case":{ "p":0.998003992, "r":0.9960159363, "f":0.9970089731 }, "Reflex":{ "p":1.0, "r":1.0, "f":1.0 }, "Abbr":{ "p":1.0, "r":0.6666666667, "f":0.8 } }, "tag_acc":0.9543293348, "sents_p":0.866340098, "sents_r":0.8880918221, "sents_f":0.8770811194, "dep_uas":0.8701736595, "dep_las":0.8260704236, "dep_las_per_type":{ "det":{ "p":0.8869644485, "r":0.959566075, "f":0.9218379915 }, "nsubj":{ "p":0.7900466563, "r":0.8246753247, "f":0.8069896743 }, "root":{ "p":0.7489932886, "r":0.8328358209, "f":0.7886925795 }, "case":{ "p":0.8836805556, "r":0.9382488479, "f":0.910147519 }, "obl":{ "p":0.7313195548, "r":0.7290015848, "f":0.7301587302 }, "nmod":{ "p":0.596651446, "r":0.6841186736, "f":0.637398374 }, "advmod":{ "p":0.75, "r":0.7696969697, "f":0.7597208375 }, "obj":{ "p":0.7902621723, "r":0.778597786, "f":0.7843866171 }, "mark":{ "p":0.8445378151, "r":0.8305785124, "f":0.8375 }, "advcl":{ "p":0.5137614679, "r":0.4628099174, "f":0.4869565217 }, "amod":{ "p":0.7834710744, "r":0.8649635036, "f":0.8222029488 }, "acl:relcl":{ "p":0.6352941176, "r":0.6585365854, "f":0.6467065868 }, "cop":{ "p":0.7862068966, "r":0.6263736264, "f":0.6972477064 }, "cc":{ "p":0.8, "r":0.8384879725, "f":0.8187919463 }, "conj":{ "p":0.5825242718, "r":0.5309734513, "f":0.5555555556 }, "fixed":{ "p":0.6690647482, "r":0.2520325203, "f":0.3661417323 }, "flat":{ "p":0.7995991984, "r":0.6797274276, "f":0.7348066298 }, "csubj":{ "p":0.5, "r":0.1666666667, "f":0.25 }, "aux":{ "p":0.7714285714, "r":0.786407767, "f":0.7788461538 }, "compound:prt":{ "p":0.776119403, "r":0.6753246753, "f":0.7222222222 }, "nummod":{ "p":0.59375, "r":0.6506849315, "f":0.6209150327 }, "acl":{ "p":0.5098039216, "r":0.4406779661, "f":0.4727272727 }, "expl":{ "p":0.4, "r":0.3333333333, "f":0.3636363636 }, "appos":{ "p":0.5625, "r":0.4682080925, "f":0.5110410095 }, "nsubj:pass":{ "p":0.8023255814, "r":0.8023255814, "f":0.8023255814 }, "aux:pass":{ "p":0.8823529412, "r":0.9183673469, "f":0.9 }, "ccomp":{ "p":0.6666666667, "r":0.5294117647, "f":0.5901639344 }, "xcomp":{ "p":0.4285714286, "r":0.698630137, "f":0.53125 }, "parataxis":{ "p":0.3644067797, "r":0.288590604, "f":0.3220973783 }, "expl:pv":{ "p":0.7894736842, "r":0.7894736842, "f":0.7894736842 }, "iobj":{ "p":0.4444444444, "r":0.4, "f":0.4210526316 }, "nmod:poss":{ "p":0.8616352201, "r":0.8954248366, "f":0.8782051282 }, "dep":{ "p":0.0, "r":0.0, "f":0.0 }, "obl:agent":{ "p":0.8461538462, "r":0.7857142857, "f":0.8148148148 }, "orphan":{ "p":0.0, "r":0.0, "f":0.0 } }, "lemma_acc":0.8159277755, "ents_p":0.7772241993, "ents_r":0.755186722, "ents_f":0.7660470011, "ents_per_type":{ "DATE":{ "p":0.931372549, "r":0.9253246753, "f":0.9283387622 }, "NORP":{ "p":0.8181818182, "r":0.8674698795, "f":0.8421052632 }, "ORG":{ "p":0.6959459459, "r":0.6094674556, "f":0.6498422713 }, "CARDINAL":{ "p":0.8607594937, "r":0.9714285714, "f":0.9127516779 }, "GPE":{ "p":0.785046729, "r":0.9230769231, "f":0.8484848485 }, "QUANTITY":{ "p":0.8571428571, "r":1.0, "f":0.9230769231 }, "PERCENT":{ "p":1.0, "r":0.8333333333, "f":0.9090909091 }, "PERSON":{ "p":0.7788778878, "r":0.7637540453, "f":0.7712418301 }, "LAW":{ "p":1.0, "r":0.3333333333, "f":0.5 }, "EVENT":{ "p":0.4761904762, "r":0.4347826087, "f":0.4545454545 }, "WORK_OF_ART":{ "p":0.5882352941, "r":0.4444444444, "f":0.5063291139 }, "ORDINAL":{ "p":0.96875, "r":0.9393939394, "f":0.9538461538 }, "LANGUAGE":{ "p":0.75, "r":0.8181818182, "f":0.7826086957 }, "LOC":{ "p":0.5333333333, "r":0.2352941176, "f":0.3265306122 }, "FAC":{ "p":0.1, "r":0.2142857143, "f":0.1363636364 }, "PRODUCT":{ "p":0.0, "r":0.0, "f":0.0 }, "MONEY":{ "p":0.0, "r":0.0, "f":0.0 }, "TIME":{ "p":1.0, "r":1.0, "f":1.0 } }, "speed":3053.5292904657 }, "sources":[ { "name":"UD Dutch LassySmall v2.8", "url":"https://github.com/UniversalDependencies/UD_Dutch-LassySmall", "license":"CC BY-SA 4.0", "author":"Bouma, Gosse; van Noord, Gertjan" }, { "name":"Dutch NER Annotations for UD LassySmall", "url":"https://nlp.town", "license":"CC BY-SA 4.0", "author":"NLP Town" }, { "name":"UD Dutch LassySmall v2.8", "url":"https://github.com/UniversalDependencies/UD_Dutch-LassySmall", "license":"CC BY-SA 4.0", "author":"Bouma, Gosse; van Noord, Gertjan" }, { "name":"UD Dutch Alpino v2.8", "url":"https://github.com/UniversalDependencies/UD_Dutch-Alpino", "license":"CC BY-SA 4.0", "author":"Zeman, Daniel; \u017dabokrtsk\u00fd, Zden\u011bk; Bouma, Gosse; van Noord, Gertjan" }, { "name":"spaCy lookups data", "author":"Explosion", "url":"https://github.com/explosion/spacy-lookups-data", "license":"MIT" }, { "name":"Explosion fastText Vectors (cbow, OSCAR Common Crawl + Wikipedia)", "url":"https://spacy.io", "license":"CC0", "author":"Explosion" } ], "requirements":[ ] }