adrianeboyd committed on
Commit
7881ad7
1 Parent(s): 2745607

Update spaCy pipeline

Browse files
README.md CHANGED
@@ -14,62 +14,62 @@ model-index:
14
  metrics:
15
  - name: NER Precision
16
  type: precision
17
- value: 0.7655003069
18
  - name: NER Recall
19
  type: recall
20
- value: 0.7387440758
21
  - name: NER F Score
22
  type: f_score
23
- value: 0.7518842327
24
  - task:
25
  name: TAG
26
  type: token-classification
27
  metrics:
28
  - name: TAG (XPOS) Accuracy
29
  type: accuracy
30
- value: 0.9671340808
31
  - task:
32
  name: POS
33
  type: token-classification
34
  metrics:
35
  - name: POS (UPOS) Accuracy
36
  type: accuracy
37
- value: 0.9671340808
38
  - task:
39
  name: MORPH
40
  type: token-classification
41
  metrics:
42
  - name: Morph (UFeats) Accuracy
43
  type: accuracy
44
- value: 0.9532993525
45
  - task:
46
  name: LEMMA
47
  type: token-classification
48
  metrics:
49
  - name: Lemma Accuracy
50
  type: accuracy
51
- value: 0.9686243182
52
  - task:
53
  name: UNLABELED_DEPENDENCIES
54
  type: token-classification
55
  metrics:
56
  - name: Unlabeled Attachment Score (UAS)
57
  type: f_score
58
- value: 0.8826525829
59
  - task:
60
  name: LABELED_DEPENDENCIES
61
  type: token-classification
62
  metrics:
63
  - name: Labeled Attachment Score (LAS)
64
  type: f_score
65
- value: 0.84903125
66
  - task:
67
  name: SENTS
68
  type: token-classification
69
  metrics:
70
  - name: Sentences F-Score
71
  type: f_score
72
- value: 0.9264766625
73
  ---
74
  ### Details: https://spacy.io/models/nb#nb_core_news_sm
75
 
@@ -78,8 +78,8 @@ Norwegian (Bokmål) pipeline optimized for CPU. Components: tok2vec, morphologiz
78
  | Feature | Description |
79
  | --- | --- |
80
  | **Name** | `nb_core_news_sm` |
81
- | **Version** | `3.3.0` |
82
- | **spaCy** | `>=3.3.0.dev0,<3.4.0` |
83
  | **Default Pipeline** | `tok2vec`, `morphologizer`, `parser`, `lemmatizer`, `attribute_ruler`, `ner` |
84
  | **Components** | `tok2vec`, `morphologizer`, `parser`, `lemmatizer`, `senter`, `attribute_ruler`, `ner` |
85
  | **Vectors** | 0 keys, 0 unique vectors (0 dimensions) |
@@ -91,11 +91,11 @@ Norwegian (Bokmål) pipeline optimized for CPU. Components: tok2vec, morphologiz
91
 
92
  <details>
93
 
94
- <summary>View label scheme (248 labels for 3 components)</summary>
95
 
96
  | Component | Labels |
97
  | --- | --- |
98
- | **`morphologizer`** | `Definite=Ind\|Gender=Neut\|Number=Sing\|POS=NOUN`, `POS=CCONJ`, `Definite=Ind\|Gender=Masc\|Number=Sing\|POS=NOUN`, `POS=SCONJ`, `Definite=Def\|Gender=Masc\|Number=Sing\|POS=NOUN`, `Definite=Ind\|Gender=Neut\|Number=Plur\|POS=NOUN`, `POS=PUNCT`, `Mood=Ind\|POS=VERB\|Tense=Past\|VerbForm=Fin`, `POS=ADP`, `Gender=Masc\|Number=Sing\|POS=DET\|PronType=Dem`, `Definite=Def\|Degree=Pos\|Number=Sing\|POS=ADJ`, `POS=PROPN`, `POS=X`, `Mood=Ind\|POS=VERB\|Tense=Pres\|VerbForm=Fin`, `Definite=Def\|Gender=Neut\|Number=Sing\|POS=NOUN`, `POS=PRON\|PronType=Rel`, `Mood=Ind\|POS=AUX\|Tense=Pres\|VerbForm=Fin`, `Definite=Ind\|Gender=Neut\|Number=Sing\|POS=ADJ\|VerbForm=Part`, `Definite=Ind\|Degree=Pos\|Number=Sing\|POS=ADJ`, `Definite=Ind\|Gender=Fem\|Number=Sing\|POS=NOUN`, `Number=Plur\|POS=ADJ\|VerbForm=Part`, `Definite=Ind\|Gender=Fem\|Number=Plur\|POS=NOUN`, `POS=ADV`, `Gender=Neut\|Number=Sing\|POS=PRON\|Person=3\|PronType=Prs`, `Definite=Ind\|Number=Sing\|POS=ADJ\|VerbForm=Part`, `POS=VERB\|VerbForm=Part`, `Definite=Ind\|Gender=Masc\|Number=Plur\|POS=NOUN`, `Definite=Ind\|Degree=Pos\|Gender=Neut\|Number=Sing\|POS=ADJ`, `Degree=Pos\|Number=Plur\|POS=ADJ`, `NumType=Card\|Number=Plur\|POS=NUM`, `Definite=Def\|Gender=Masc\|Number=Plur\|POS=NOUN`, `Case=Acc\|POS=PRON\|PronType=Prs\|Reflex=Yes`, `Case=Gen\|Definite=Ind\|Gender=Neut\|Number=Sing\|POS=NOUN`, `POS=PART`, `POS=VERB\|VerbForm=Inf`, `Case=Nom\|Number=Plur\|POS=PRON\|Person=3\|PronType=Prs`, `Mood=Ind\|POS=AUX\|Tense=Past\|VerbForm=Fin`, `Gender=Fem\|POS=PROPN`, `POS=NOUN`, `Gender=Masc\|POS=PROPN`, `Gender=Neut\|Number=Sing\|POS=DET\|PronType=Dem`, `Gender=Masc\|Number=Sing\|POS=DET\|PronType=Art`, `Case=Gen\|Definite=Def\|Gender=Masc\|Number=Sing\|POS=NOUN`, `Abbr=Yes\|POS=PROPN`, `POS=PART\|Polarity=Neg`, `Number=Plur\|POS=PRON\|Poss=Yes\|PronType=Prs`, `Case=Gen\|Definite=Ind\|Gender=Neut\|Number=Plur\|POS=NOUN`, `Case=Gen\|POS=PROPN`, `Gender=Fem\|Number=Sing\|POS=DET\|PronType=Dem`, 
`Gender=Masc\|Number=Sing\|POS=PRON\|Poss=Yes\|PronType=Prs`, `Definite=Def\|Degree=Sup\|POS=ADJ`, `Case=Gen\|Gender=Fem\|POS=PROPN`, `Number=Plur\|POS=DET\|PronType=Dem`, `Case=Gen\|Definite=Def\|Gender=Neut\|Number=Sing\|POS=NOUN`, `Definite=Ind\|Degree=Sup\|POS=ADJ`, `Definite=Def\|Gender=Fem\|Number=Plur\|POS=NOUN`, `Gender=Neut\|POS=PROPN`, `Number=Plur\|POS=DET\|PronType=Int`, `Definite=Def\|Gender=Neut\|Number=Plur\|POS=NOUN`, `Definite=Def\|POS=DET\|PronType=Dem`, `Gender=Neut\|Number=Sing\|POS=DET\|PronType=Art`, `Mood=Ind\|POS=VERB\|Tense=Pres\|VerbForm=Fin\|Voice=Pass`, `Abbr=Yes\|Case=Gen\|POS=PROPN`, `Animacy=Hum\|Case=Nom\|Gender=Masc\|Number=Sing\|POS=PRON\|Person=3\|PronType=Prs`, `Degree=Cmp\|POS=ADJ`, `POS=ADJ\|VerbForm=Part`, `Gender=Neut\|Number=Sing\|POS=PRON\|Poss=Yes\|PronType=Prs`, `Abbr=Yes\|POS=ADP`, `Definite=Ind\|Gender=Neut\|Number=Sing\|POS=DET\|PronType=Prs`, `Case=Gen\|Definite=Def\|Gender=Neut\|Number=Plur\|POS=NOUN`, `POS=AUX\|VerbForm=Part`, `POS=PRON\|PronType=Int`, `Gender=Fem\|Number=Sing\|POS=PRON\|Poss=Yes\|PronType=Prs`, `Number=Plur\|POS=PRON\|Person=3\|PronType=Ind,Prs`, `Number=Plur\|POS=DET\|PronType=Ind`, `Degree=Pos\|POS=ADJ`, `Animacy=Hum\|Case=Nom\|Number=Plur\|POS=PRON\|Person=1\|PronType=Prs`, `POS=VERB\|VerbForm=Inf\|Voice=Pass`, `Definite=Ind\|Gender=Fem\|Number=Sing\|POS=DET\|PronType=Dem`, `Gender=Neut\|Number=Sing\|POS=DET\|PronType=Ind`, `Animacy=Hum\|Case=Acc\|Gender=Masc\|Number=Sing\|POS=PRON\|Person=3\|PronType=Prs`, `Animacy=Hum\|Case=Nom\|Number=Sing\|POS=PRON\|Person=1\|PronType=Prs`, `Number=Plur\|POS=DET\|Polarity=Neg\|PronType=Neg`, `NumType=Card\|POS=NUM`, `Gender=Masc\|Number=Sing\|POS=DET\|PronType=Ind`, `POS=DET\|PronType=Prs`, `Gender=Fem\|Number=Sing\|POS=DET\|PronType=Ind`, `Case=Gen\|Gender=Neut\|POS=PROPN`, `Gender=Masc\|Number=Sing\|POS=DET\|Polarity=Neg\|PronType=Neg`, `Definite=Def\|Number=Sing\|POS=ADJ\|VerbForm=Part`, `Gender=Fem,Masc\|Number=Sing\|POS=PRON\|Person=3\|PronType=Prs`, 
`POS=AUX\|VerbForm=Inf`, `Case=Acc\|Number=Plur\|POS=PRON\|Person=3\|PronType=Prs`, `Case=Gen\|Degree=Pos\|Number=Plur\|POS=ADJ`, `Number=Plur\|POS=DET\|PronType=Tot`, `Case=Gen\|Gender=Masc\|Number=Sing\|POS=DET\|PronType=Dem`, `Number=Plur\|POS=DET\|PronType=Prs`, `POS=SYM`, `Gender=Neut\|NumType=Card\|Number=Sing\|POS=NUM`, `Animacy=Hum\|Case=Nom\|Number=Sing\|POS=PRON\|PronType=Prs`, `Definite=Ind\|Gender=Masc\|Number=Sing\|POS=DET\|PronType=Prs`, `Case=Gen\|Definite=Ind\|Gender=Masc\|Number=Sing\|POS=NOUN`, `Abbr=Yes\|POS=ADV`, `Definite=Ind\|Gender=Neut\|Number=Sing\|POS=DET\|PronType=Dem`, `Gender=Masc\|Number=Sing\|POS=DET\|PronType=Tot`, `Definite=Def\|POS=DET\|PronType=Prs`, `Animacy=Hum\|Case=Nom\|Gender=Fem\|Number=Sing\|POS=PRON\|Person=3\|PronType=Prs`, `Gender=Neut\|POS=NOUN`, `Gender=Neut\|Number=Sing\|POS=DET\|PronType=Int`, `Definite=Def\|NumType=Card\|POS=NUM`, `Mood=Imp\|POS=VERB\|VerbForm=Fin`, `Definite=Ind\|Number=Plur\|POS=NOUN`, `Gender=Neut\|Number=Sing\|POS=DET\|PronType=Tot`, `Gender=Fem\|Number=Sing\|POS=DET\|PronType=Tot`, `Animacy=Hum\|Case=Acc\|Number=Plur\|POS=PRON\|Person=1\|PronType=Prs`, `Gender=Fem,Masc\|Number=Sing\|POS=PRON\|Person=3\|Polarity=Neg\|PronType=Neg,Prs`, `Number=Plur\|POS=PRON\|Person=3\|Polarity=Neg\|PronType=Neg,Prs`, `Definite=Def\|NumType=Card\|Number=Sing\|POS=NUM`, `Gender=Masc\|NumType=Card\|Number=Sing\|POS=NUM`, `Definite=Ind\|Gender=Masc\|Number=Sing\|POS=DET\|PronType=Dem`, `Case=Gen\|Definite=Def\|Gender=Fem\|Number=Plur\|POS=NOUN`, `Case=Gen\|Gender=Neut\|Number=Sing\|POS=DET\|PronType=Dem`, `Animacy=Hum\|Number=Sing\|POS=PRON\|PronType=Art,Prs`, `Mood=Imp\|POS=AUX\|VerbForm=Fin`, `Number=Plur\|POS=PRON\|Person=3\|PronType=Prs,Tot`, `Number=Plur\|POS=ADJ`, `Gender=Masc\|POS=NOUN`, `Abbr=Yes\|POS=NOUN`, `Case=Gen\|Definite=Ind\|Gender=Masc\|Number=Plur\|POS=NOUN`, `Gender=Neut\|Number=Sing\|POS=PRON\|Person=3\|PronType=Ind,Prs`, `POS=INTJ`, 
`Animacy=Hum\|Case=Nom\|Number=Sing\|POS=PRON\|Person=2\|PronType=Prs`, `Animacy=Hum\|Case=Acc\|Number=Sing\|POS=PRON\|Person=1\|PronType=Prs`, `Case=Gen\|Definite=Def\|Gender=Masc\|Number=Plur\|POS=NOUN`, `POS=ADJ`, `Animacy=Hum\|Case=Acc\|Gender=Fem\|Number=Sing\|POS=PRON\|Person=3\|PronType=Prs`, `Animacy=Hum\|Case=Acc\|Number=Sing\|POS=PRON\|Person=2\|PronType=Prs`, `Definite=Def\|Gender=Fem\|Number=Sing\|POS=NOUN`, `Number=Sing\|POS=PRON\|Polarity=Neg\|PronType=Neg`, `Case=Gen\|POS=NOUN`, `Definite=Ind\|Number=Sing\|POS=ADJ`, `Case=Gen\|Gender=Masc\|POS=PROPN`, `Animacy=Hum\|Number=Plur\|POS=PRON\|PronType=Rcp`, `Case=Gen\|Definite=Ind\|Gender=Fem\|Number=Sing\|POS=NOUN`, `Number=Plur\|POS=PRON\|Person=3\|PronType=Prs`, `Gender=Fem,Masc\|Number=Sing\|POS=PRON\|Person=3\|PronType=Ind,Prs`, `Definite=Ind\|Gender=Fem\|Number=Sing\|POS=DET\|PronType=Prs`, `Case=Gen\|Definite=Def\|Gender=Fem\|Number=Sing\|POS=NOUN`, `Gender=Fem\|Number=Sing\|POS=DET\|PronType=Art`, `Case=Gen\|Definite=Def\|Degree=Pos\|Number=Sing\|POS=ADJ`, `Gender=Masc\|Number=Sing\|POS=DET\|PronType=Int`, `NumType=Card\|Number=Sing\|POS=NUM`, `Animacy=Hum\|Case=Acc\|Number=Plur\|POS=PRON\|Person=2\|PronType=Prs`, `Animacy=Hum\|Case=Nom\|Number=Plur\|POS=PRON\|Person=2\|PronType=Prs`, `Case=Gen\|Definite=Ind\|Degree=Pos\|Gender=Neut\|Number=Sing\|POS=ADJ`, `Degree=Sup\|POS=ADJ`, `Animacy=Hum\|POS=PRON\|PronType=Int`, `POS=DET\|PronType=Ind`, `Definite=Def\|Number=Sing\|POS=DET\|PronType=Dem`, `Gender=Fem\|POS=NOUN`, `Case=Gen\|Number=Plur\|POS=DET\|PronType=Dem`, `Gender=Fem,Masc\|Number=Sing\|POS=PRON\|Person=3\|PronType=Prs,Tot`, `Case=Gen\|Definite=Ind\|Gender=Fem\|Number=Plur\|POS=NOUN`, `Gender=Neut\|Number=Sing\|POS=DET\|Polarity=Neg\|PronType=Neg`, `Number=Plur\|POS=NOUN`, `POS=PRON\|PronType=Prs`, `Case=Gen\|Definite=Ind\|Degree=Pos\|Number=Sing\|POS=ADJ`, `Definite=Ind\|Number=Sing\|POS=VERB\|VerbForm=Part`, `Case=Gen\|Definite=Def\|Number=Sing\|POS=ADJ\|VerbForm=Part`, 
`Mood=Ind\|POS=VERB\|Tense=Past\|VerbForm=Fin\|Voice=Pass`, `Gender=Neut\|Number=Sing\|POS=DET\|PronType=Dem,Ind`, `Animacy=Hum\|POS=PRON\|Poss=Yes\|PronType=Int`, `Abbr=Yes\|POS=ADJ`, `Case=Gen\|Gender=Masc\|Number=Sing\|POS=DET\|PronType=Art`, `Abbr=Yes\|Definite=Def,Ind\|Gender=Masc\|Number=Sing\|POS=NOUN`, `Case=Gen\|Gender=Fem\|Number=Sing\|POS=DET\|PronType=Dem`, `Number=Plur\|POS=PRON\|Poss=Yes\|PronType=Rcp`, `Definite=Ind\|Degree=Pos\|POS=ADJ`, `Number=Plur\|POS=DET\|PronType=Art`, `Case=Gen\|NumType=Card\|Number=Plur\|POS=NUM`, `Abbr=Yes\|Definite=Def,Ind\|Gender=Neut\|Number=Plur,Sing\|POS=NOUN`, `Case=Gen\|Number=Plur\|POS=DET\|PronType=Tot`, `Abbr=Yes\|Definite=Def,Ind\|Gender=Masc\|Number=Plur,Sing\|POS=NOUN`, `Gender=Fem\|Number=Sing\|POS=DET\|PronType=Int`, `Definite=Ind\|Gender=Neut\|Number=Sing\|POS=ADJ`, `Case=Gen\|Definite=Ind\|Gender=Masc\|Number=Sing\|POS=DET\|PronType=Dem`, `Gender=Fem\|Number=Sing\|POS=DET\|PronType=Prs`, `Animacy=Hum\|Case=Gen,Nom\|Number=Sing\|POS=PRON\|PronType=Art,Prs`, `Definite=Def\|Degree=Pos\|Gender=Masc\|Number=Sing\|POS=ADJ`, `Animacy=Hum\|Case=Gen\|Number=Sing\|POS=PRON\|PronType=Art,Prs`, `Gender=Fem\|NumType=Card\|Number=Sing\|POS=NUM`, `Definite=Ind\|Gender=Masc\|POS=NOUN`, `Definite=Def\|Number=Plur\|POS=NOUN`, `Number=Sing\|POS=ADJ\|VerbForm=Part`, `Definite=Ind\|Gender=Masc\|Number=Sing\|POS=ADJ\|VerbForm=Part`, `Abbr=Yes\|Gender=Masc\|POS=NOUN`, `Abbr=Yes\|Case=Gen\|POS=NOUN`, `Abbr=Yes\|Mood=Ind\|POS=VERB\|Tense=Pres\|VerbForm=Fin`, `Abbr=Yes\|Degree=Pos\|POS=ADJ`, `Case=Gen\|Gender=Fem\|POS=NOUN`, `Case=Gen\|Degree=Cmp\|POS=ADJ`, `Definite=Ind\|Degree=Pos\|Gender=Masc\|Number=Sing\|POS=ADJ`, `Gender=Masc\|Number=Sing\|POS=NOUN` |
99
  | **`parser`** | `ROOT`, `acl`, `acl:cleft`, `acl:relcl`, `advcl`, `advmod`, `amod`, `appos`, `aux`, `aux:pass`, `case`, `cc`, `ccomp`, `compound`, `compound:prt`, `conj`, `cop`, `csubj`, `dep`, `det`, `discourse`, `expl`, `flat:foreign`, `flat:name`, `iobj`, `mark`, `nmod`, `nsubj`, `nsubj:pass`, `nummod`, `obj`, `obl`, `orphan`, `parataxis`, `punct`, `xcomp` |
100
  | **`ner`** | `DRV`, `EVT`, `GPE_LOC`, `GPE_ORG`, `LOC`, `MISC`, `ORG`, `PER`, `PROD` |
101
 
@@ -109,18 +109,18 @@ Norwegian (Bokmål) pipeline optimized for CPU. Components: tok2vec, morphologiz
109
  | `TOKEN_P` | 99.71 |
110
  | `TOKEN_R` | 99.53 |
111
  | `TOKEN_F` | 99.62 |
112
- | `POS_ACC` | 96.71 |
113
- | `MORPH_ACC` | 95.33 |
114
- | `MORPH_MICRO_P` | 97.02 |
115
- | `MORPH_MICRO_R` | 96.19 |
116
- | `MORPH_MICRO_F` | 96.60 |
117
- | `SENTS_P` | 92.19 |
118
- | `SENTS_R` | 93.11 |
119
- | `SENTS_F` | 92.65 |
120
- | `DEP_UAS` | 88.27 |
121
- | `DEP_LAS` | 84.90 |
122
- | `LEMMA_ACC` | 96.86 |
123
- | `TAG_ACC` | 96.71 |
124
- | `ENTS_P` | 76.55 |
125
- | `ENTS_R` | 73.87 |
126
- | `ENTS_F` | 75.19 |
 
14
  metrics:
15
  - name: NER Precision
16
  type: precision
17
+ value: 0.7702786378
18
  - name: NER Recall
19
  type: recall
20
+ value: 0.7369668246
21
  - name: NER F Score
22
  type: f_score
23
+ value: 0.753254617
24
  - task:
25
  name: TAG
26
  type: token-classification
27
  metrics:
28
  - name: TAG (XPOS) Accuracy
29
  type: accuracy
30
+ value: 0.9676832796
31
  - task:
32
  name: POS
33
  type: token-classification
34
  metrics:
35
  - name: POS (UPOS) Accuracy
36
  type: accuracy
37
+ value: 0.9676832796
38
  - task:
39
  name: MORPH
40
  type: token-classification
41
  metrics:
42
  - name: Morph (UFeats) Accuracy
43
  type: accuracy
44
+ value: 0.9535447607
45
  - task:
46
  name: LEMMA
47
  type: token-classification
48
  metrics:
49
  - name: Lemma Accuracy
50
  type: accuracy
51
+ value: 0.9687620517
52
  - task:
53
  name: UNLABELED_DEPENDENCIES
54
  type: token-classification
55
  metrics:
56
  - name: Unlabeled Attachment Score (UAS)
57
  type: f_score
58
+ value: 0.8828806301
59
  - task:
60
  name: LABELED_DEPENDENCIES
61
  type: token-classification
62
  metrics:
63
  - name: Labeled Attachment Score (LAS)
64
  type: f_score
65
+ value: 0.8486771164
66
  - task:
67
  name: SENTS
68
  type: token-classification
69
  metrics:
70
  - name: Sentences F-Score
71
  type: f_score
72
+ value: 0.9338860104
73
  ---
74
  ### Details: https://spacy.io/models/nb#nb_core_news_sm
75
 
 
78
  | Feature | Description |
79
  | --- | --- |
80
  | **Name** | `nb_core_news_sm` |
81
+ | **Version** | `3.4.0` |
82
+ | **spaCy** | `>=3.4.0,<3.5.0` |
83
  | **Default Pipeline** | `tok2vec`, `morphologizer`, `parser`, `lemmatizer`, `attribute_ruler`, `ner` |
84
  | **Components** | `tok2vec`, `morphologizer`, `parser`, `lemmatizer`, `senter`, `attribute_ruler`, `ner` |
85
  | **Vectors** | 0 keys, 0 unique vectors (0 dimensions) |
 
91
 
92
  <details>
93
 
94
+ <summary>View label scheme (249 labels for 3 components)</summary>
95
 
96
  | Component | Labels |
97
  | --- | --- |
98
+ | **`morphologizer`** | `Definite=Ind\|Gender=Neut\|Number=Sing\|POS=NOUN`, `POS=CCONJ`, `Definite=Ind\|Gender=Masc\|Number=Sing\|POS=NOUN`, `POS=SCONJ`, `Definite=Def\|Gender=Masc\|Number=Sing\|POS=NOUN`, `Definite=Ind\|Gender=Neut\|Number=Plur\|POS=NOUN`, `POS=PUNCT`, `Mood=Ind\|POS=VERB\|Tense=Past\|VerbForm=Fin`, `POS=ADP`, `Gender=Masc\|Number=Sing\|POS=DET\|PronType=Dem`, `Definite=Def\|Degree=Pos\|Number=Sing\|POS=ADJ`, `POS=PROPN`, `POS=X`, `Mood=Ind\|POS=VERB\|Tense=Pres\|VerbForm=Fin`, `Definite=Def\|Gender=Neut\|Number=Sing\|POS=NOUN`, `POS=PRON\|PronType=Rel`, `Mood=Ind\|POS=AUX\|Tense=Pres\|VerbForm=Fin`, `Definite=Ind\|Gender=Neut\|Number=Sing\|POS=ADJ\|VerbForm=Part`, `Definite=Ind\|Degree=Pos\|Number=Sing\|POS=ADJ`, `Definite=Ind\|Gender=Fem\|Number=Sing\|POS=NOUN`, `Number=Plur\|POS=ADJ\|VerbForm=Part`, `Definite=Ind\|Gender=Fem\|Number=Plur\|POS=NOUN`, `POS=ADV`, `Gender=Neut\|Number=Sing\|POS=PRON\|Person=3\|PronType=Prs`, `Definite=Ind\|Number=Sing\|POS=ADJ\|VerbForm=Part`, `POS=VERB\|VerbForm=Part`, `Definite=Ind\|Gender=Masc\|Number=Plur\|POS=NOUN`, `Definite=Ind\|Degree=Pos\|Gender=Neut\|Number=Sing\|POS=ADJ`, `Degree=Pos\|Number=Plur\|POS=ADJ`, `NumType=Card\|Number=Plur\|POS=NUM`, `Definite=Def\|Gender=Masc\|Number=Plur\|POS=NOUN`, `Case=Acc\|POS=PRON\|PronType=Prs\|Reflex=Yes`, `Case=Gen\|Definite=Ind\|Gender=Neut\|Number=Sing\|POS=NOUN`, `POS=PART`, `POS=VERB\|VerbForm=Inf`, `Case=Nom\|Number=Plur\|POS=PRON\|Person=3\|PronType=Prs`, `Mood=Ind\|POS=AUX\|Tense=Past\|VerbForm=Fin`, `Gender=Fem\|POS=PROPN`, `POS=NOUN`, `Gender=Masc\|POS=PROPN`, `Gender=Neut\|Number=Sing\|POS=DET\|PronType=Dem`, `Gender=Masc\|Number=Sing\|POS=DET\|PronType=Art`, `Case=Gen\|Definite=Def\|Gender=Masc\|Number=Sing\|POS=NOUN`, `Abbr=Yes\|POS=PROPN`, `POS=PART\|Polarity=Neg`, `Number=Plur\|POS=PRON\|Poss=Yes\|PronType=Prs`, `Case=Gen\|Definite=Ind\|Gender=Neut\|Number=Plur\|POS=NOUN`, `Case=Gen\|POS=PROPN`, `Gender=Fem\|Number=Sing\|POS=DET\|PronType=Dem`, 
`Gender=Masc\|Number=Sing\|POS=PRON\|Poss=Yes\|PronType=Prs`, `Definite=Def\|Degree=Sup\|POS=ADJ`, `Case=Gen\|Gender=Fem\|POS=PROPN`, `Number=Plur\|POS=DET\|PronType=Dem`, `Case=Gen\|Definite=Def\|Gender=Neut\|Number=Sing\|POS=NOUN`, `Definite=Ind\|Degree=Sup\|POS=ADJ`, `Definite=Def\|Gender=Fem\|Number=Plur\|POS=NOUN`, `Gender=Neut\|POS=PROPN`, `Number=Plur\|POS=DET\|PronType=Int`, `Definite=Def\|Gender=Neut\|Number=Plur\|POS=NOUN`, `Definite=Def\|POS=DET\|PronType=Dem`, `Gender=Neut\|Number=Sing\|POS=DET\|PronType=Art`, `Mood=Ind\|POS=VERB\|Tense=Pres\|VerbForm=Fin\|Voice=Pass`, `Abbr=Yes\|Case=Gen\|POS=PROPN`, `Animacy=Hum\|Case=Nom\|Gender=Masc\|Number=Sing\|POS=PRON\|Person=3\|PronType=Prs`, `Degree=Cmp\|POS=ADJ`, `POS=ADJ\|VerbForm=Part`, `Gender=Neut\|Number=Sing\|POS=PRON\|Poss=Yes\|PronType=Prs`, `Abbr=Yes\|POS=ADP`, `Definite=Ind\|Gender=Neut\|Number=Sing\|POS=DET\|PronType=Prs`, `Case=Gen\|Definite=Def\|Gender=Neut\|Number=Plur\|POS=NOUN`, `POS=AUX\|VerbForm=Part`, `POS=PRON\|PronType=Int`, `Gender=Fem\|Number=Sing\|POS=PRON\|Poss=Yes\|PronType=Prs`, `Number=Plur\|POS=PRON\|Person=3\|PronType=Ind,Prs`, `Number=Plur\|POS=DET\|PronType=Ind`, `Degree=Pos\|POS=ADJ`, `Animacy=Hum\|Case=Nom\|Number=Plur\|POS=PRON\|Person=1\|PronType=Prs`, `POS=VERB\|VerbForm=Inf\|Voice=Pass`, `Definite=Ind\|Gender=Fem\|Number=Sing\|POS=DET\|PronType=Dem`, `Gender=Neut\|Number=Sing\|POS=DET\|PronType=Ind`, `Animacy=Hum\|Case=Acc\|Gender=Masc\|Number=Sing\|POS=PRON\|Person=3\|PronType=Prs`, `Animacy=Hum\|Case=Nom\|Number=Sing\|POS=PRON\|Person=1\|PronType=Prs`, `Number=Plur\|POS=DET\|Polarity=Neg\|PronType=Neg`, `NumType=Card\|POS=NUM`, `Gender=Masc\|Number=Sing\|POS=DET\|PronType=Ind`, `POS=DET\|PronType=Prs`, `Gender=Fem\|Number=Sing\|POS=DET\|PronType=Ind`, `Case=Gen\|Gender=Neut\|POS=PROPN`, `Gender=Masc\|Number=Sing\|POS=DET\|Polarity=Neg\|PronType=Neg`, `Definite=Def\|Number=Sing\|POS=ADJ\|VerbForm=Part`, `Gender=Fem,Masc\|Number=Sing\|POS=PRON\|Person=3\|PronType=Prs`, 
`POS=AUX\|VerbForm=Inf`, `Case=Acc\|Number=Plur\|POS=PRON\|Person=3\|PronType=Prs`, `Case=Gen\|Degree=Pos\|Number=Plur\|POS=ADJ`, `Number=Plur\|POS=DET\|PronType=Tot`, `Case=Gen\|Gender=Masc\|Number=Sing\|POS=DET\|PronType=Dem`, `Number=Plur\|POS=DET\|PronType=Prs`, `POS=SYM`, `Gender=Neut\|NumType=Card\|Number=Sing\|POS=NUM`, `Animacy=Hum\|Case=Nom\|Number=Sing\|POS=PRON\|PronType=Prs`, `Definite=Ind\|Gender=Masc\|Number=Sing\|POS=DET\|PronType=Prs`, `Case=Gen\|Definite=Ind\|Gender=Masc\|Number=Sing\|POS=NOUN`, `Abbr=Yes\|POS=ADV`, `Definite=Ind\|Gender=Neut\|Number=Sing\|POS=DET\|PronType=Dem`, `Gender=Masc\|Number=Sing\|POS=DET\|PronType=Tot`, `Definite=Def\|POS=DET\|PronType=Prs`, `Animacy=Hum\|Case=Nom\|Gender=Fem\|Number=Sing\|POS=PRON\|Person=3\|PronType=Prs`, `Gender=Neut\|POS=NOUN`, `Gender=Neut\|Number=Sing\|POS=DET\|PronType=Int`, `Definite=Def\|NumType=Card\|POS=NUM`, `Mood=Imp\|POS=VERB\|VerbForm=Fin`, `Definite=Ind\|Number=Plur\|POS=NOUN`, `Gender=Neut\|Number=Sing\|POS=DET\|PronType=Tot`, `Gender=Fem\|Number=Sing\|POS=DET\|PronType=Tot`, `Animacy=Hum\|Case=Acc\|Number=Plur\|POS=PRON\|Person=1\|PronType=Prs`, `Gender=Fem,Masc\|Number=Sing\|POS=PRON\|Person=3\|Polarity=Neg\|PronType=Neg,Prs`, `Number=Plur\|POS=PRON\|Person=3\|Polarity=Neg\|PronType=Neg,Prs`, `Definite=Def\|NumType=Card\|Number=Sing\|POS=NUM`, `Gender=Masc\|NumType=Card\|Number=Sing\|POS=NUM`, `Definite=Ind\|Gender=Masc\|Number=Sing\|POS=DET\|PronType=Dem`, `Case=Gen\|Definite=Def\|Gender=Fem\|Number=Plur\|POS=NOUN`, `Case=Gen\|Gender=Neut\|Number=Sing\|POS=DET\|PronType=Dem`, `POS=SPACE`, `Animacy=Hum\|Number=Sing\|POS=PRON\|PronType=Art,Prs`, `Mood=Imp\|POS=AUX\|VerbForm=Fin`, `Number=Plur\|POS=PRON\|Person=3\|PronType=Prs,Tot`, `Number=Plur\|POS=ADJ`, `Gender=Masc\|POS=NOUN`, `Abbr=Yes\|POS=NOUN`, `Case=Gen\|Definite=Ind\|Gender=Masc\|Number=Plur\|POS=NOUN`, `Gender=Neut\|Number=Sing\|POS=PRON\|Person=3\|PronType=Ind,Prs`, `POS=INTJ`, 
`Animacy=Hum\|Case=Nom\|Number=Sing\|POS=PRON\|Person=2\|PronType=Prs`, `Animacy=Hum\|Case=Acc\|Number=Sing\|POS=PRON\|Person=1\|PronType=Prs`, `Case=Gen\|Definite=Def\|Gender=Masc\|Number=Plur\|POS=NOUN`, `POS=ADJ`, `Animacy=Hum\|Case=Acc\|Gender=Fem\|Number=Sing\|POS=PRON\|Person=3\|PronType=Prs`, `Animacy=Hum\|Case=Acc\|Number=Sing\|POS=PRON\|Person=2\|PronType=Prs`, `Definite=Def\|Gender=Fem\|Number=Sing\|POS=NOUN`, `Number=Sing\|POS=PRON\|Polarity=Neg\|PronType=Neg`, `Case=Gen\|POS=NOUN`, `Definite=Ind\|Number=Sing\|POS=ADJ`, `Case=Gen\|Gender=Masc\|POS=PROPN`, `Animacy=Hum\|Number=Plur\|POS=PRON\|PronType=Rcp`, `Case=Gen\|Definite=Ind\|Gender=Fem\|Number=Sing\|POS=NOUN`, `Number=Plur\|POS=PRON\|Person=3\|PronType=Prs`, `Gender=Fem,Masc\|Number=Sing\|POS=PRON\|Person=3\|PronType=Ind,Prs`, `Definite=Ind\|Gender=Fem\|Number=Sing\|POS=DET\|PronType=Prs`, `Case=Gen\|Definite=Def\|Gender=Fem\|Number=Sing\|POS=NOUN`, `Gender=Fem\|Number=Sing\|POS=DET\|PronType=Art`, `Case=Gen\|Definite=Def\|Degree=Pos\|Number=Sing\|POS=ADJ`, `Gender=Masc\|Number=Sing\|POS=DET\|PronType=Int`, `NumType=Card\|Number=Sing\|POS=NUM`, `Animacy=Hum\|Case=Acc\|Number=Plur\|POS=PRON\|Person=2\|PronType=Prs`, `Animacy=Hum\|Case=Nom\|Number=Plur\|POS=PRON\|Person=2\|PronType=Prs`, `Case=Gen\|Definite=Ind\|Degree=Pos\|Gender=Neut\|Number=Sing\|POS=ADJ`, `Degree=Sup\|POS=ADJ`, `Animacy=Hum\|POS=PRON\|PronType=Int`, `POS=DET\|PronType=Ind`, `Definite=Def\|Number=Sing\|POS=DET\|PronType=Dem`, `Gender=Fem\|POS=NOUN`, `Case=Gen\|Number=Plur\|POS=DET\|PronType=Dem`, `Gender=Fem,Masc\|Number=Sing\|POS=PRON\|Person=3\|PronType=Prs,Tot`, `Case=Gen\|Definite=Ind\|Gender=Fem\|Number=Plur\|POS=NOUN`, `Gender=Neut\|Number=Sing\|POS=DET\|Polarity=Neg\|PronType=Neg`, `Number=Plur\|POS=NOUN`, `POS=PRON\|PronType=Prs`, `Case=Gen\|Definite=Ind\|Degree=Pos\|Number=Sing\|POS=ADJ`, `Definite=Ind\|Number=Sing\|POS=VERB\|VerbForm=Part`, `Case=Gen\|Definite=Def\|Number=Sing\|POS=ADJ\|VerbForm=Part`, 
`Mood=Ind\|POS=VERB\|Tense=Past\|VerbForm=Fin\|Voice=Pass`, `Gender=Neut\|Number=Sing\|POS=DET\|PronType=Dem,Ind`, `Animacy=Hum\|POS=PRON\|Poss=Yes\|PronType=Int`, `Abbr=Yes\|POS=ADJ`, `Case=Gen\|Gender=Masc\|Number=Sing\|POS=DET\|PronType=Art`, `Abbr=Yes\|Definite=Def,Ind\|Gender=Masc\|Number=Sing\|POS=NOUN`, `Case=Gen\|Gender=Fem\|Number=Sing\|POS=DET\|PronType=Dem`, `Number=Plur\|POS=PRON\|Poss=Yes\|PronType=Rcp`, `Definite=Ind\|Degree=Pos\|POS=ADJ`, `Number=Plur\|POS=DET\|PronType=Art`, `Case=Gen\|NumType=Card\|Number=Plur\|POS=NUM`, `Abbr=Yes\|Definite=Def,Ind\|Gender=Neut\|Number=Plur,Sing\|POS=NOUN`, `Case=Gen\|Number=Plur\|POS=DET\|PronType=Tot`, `Abbr=Yes\|Definite=Def,Ind\|Gender=Masc\|Number=Plur,Sing\|POS=NOUN`, `Gender=Fem\|Number=Sing\|POS=DET\|PronType=Int`, `Definite=Ind\|Gender=Neut\|Number=Sing\|POS=ADJ`, `Case=Gen\|Definite=Ind\|Gender=Masc\|Number=Sing\|POS=DET\|PronType=Dem`, `Gender=Fem\|Number=Sing\|POS=DET\|PronType=Prs`, `Animacy=Hum\|Case=Gen,Nom\|Number=Sing\|POS=PRON\|PronType=Art,Prs`, `Definite=Def\|Degree=Pos\|Gender=Masc\|Number=Sing\|POS=ADJ`, `Animacy=Hum\|Case=Gen\|Number=Sing\|POS=PRON\|PronType=Art,Prs`, `Gender=Fem\|NumType=Card\|Number=Sing\|POS=NUM`, `Definite=Ind\|Gender=Masc\|POS=NOUN`, `Definite=Def\|Number=Plur\|POS=NOUN`, `Number=Sing\|POS=ADJ\|VerbForm=Part`, `Definite=Ind\|Gender=Masc\|Number=Sing\|POS=ADJ\|VerbForm=Part`, `Abbr=Yes\|Gender=Masc\|POS=NOUN`, `Abbr=Yes\|Case=Gen\|POS=NOUN`, `Abbr=Yes\|Mood=Ind\|POS=VERB\|Tense=Pres\|VerbForm=Fin`, `Abbr=Yes\|Degree=Pos\|POS=ADJ`, `Case=Gen\|Gender=Fem\|POS=NOUN`, `Case=Gen\|Degree=Cmp\|POS=ADJ`, `Definite=Ind\|Degree=Pos\|Gender=Masc\|Number=Sing\|POS=ADJ`, `Gender=Masc\|Number=Sing\|POS=NOUN` |
99
  | **`parser`** | `ROOT`, `acl`, `acl:cleft`, `acl:relcl`, `advcl`, `advmod`, `amod`, `appos`, `aux`, `aux:pass`, `case`, `cc`, `ccomp`, `compound`, `compound:prt`, `conj`, `cop`, `csubj`, `dep`, `det`, `discourse`, `expl`, `flat:foreign`, `flat:name`, `iobj`, `mark`, `nmod`, `nsubj`, `nsubj:pass`, `nummod`, `obj`, `obl`, `orphan`, `parataxis`, `punct`, `xcomp` |
100
  | **`ner`** | `DRV`, `EVT`, `GPE_LOC`, `GPE_ORG`, `LOC`, `MISC`, `ORG`, `PER`, `PROD` |
101
 
 
109
  | `TOKEN_P` | 99.71 |
110
  | `TOKEN_R` | 99.53 |
111
  | `TOKEN_F` | 99.62 |
112
+ | `POS_ACC` | 96.77 |
113
+ | `MORPH_ACC` | 95.35 |
114
+ | `MORPH_MICRO_P` | 96.99 |
115
+ | `MORPH_MICRO_R` | 96.17 |
116
+ | `MORPH_MICRO_F` | 96.58 |
117
+ | `SENTS_P` | 93.25 |
118
+ | `SENTS_R` | 93.52 |
119
+ | `SENTS_F` | 93.39 |
120
+ | `DEP_UAS` | 88.29 |
121
+ | `DEP_LAS` | 84.87 |
122
+ | `LEMMA_ACC` | 96.88 |
123
+ | `TAG_ACC` | 96.77 |
124
+ | `ENTS_P` | 77.03 |
125
+ | `ENTS_R` | 73.70 |
126
+ | `ENTS_F` | 75.33 |
accuracy.json CHANGED
@@ -3,61 +3,61 @@
3
  "token_p": 0.997080292,
4
  "token_r": 0.9953256895,
5
  "token_f": 0.9962022181,
6
- "pos_acc": 0.9671340808,
7
- "morph_acc": 0.9532993525,
8
- "morph_micro_p": 0.9702239789,
9
- "morph_micro_r": 0.9619070945,
10
- "morph_micro_f": 0.9660476366,
11
  "morph_per_feat": {
12
  "Definite": {
13
- "p": 0.974126035,
14
- "r": 0.9607576273,
15
- "f": 0.9673956489
16
  },
17
  "Gender": {
18
- "p": 0.9403884796,
19
- "r": 0.9321824908,
20
- "f": 0.936267505
21
  },
22
  "Number": {
23
- "p": 0.9702808864,
24
- "r": 0.9591911495,
25
- "f": 0.9647041486
26
  },
27
  "Mood": {
28
- "p": 0.9797348011,
29
- "r": 0.9792448112,
30
- "f": 0.9794897449
31
  },
32
  "Tense": {
33
- "p": 0.9803674805,
34
- "r": 0.980861244,
35
- "f": 0.9806143001
36
  },
37
  "VerbForm": {
38
- "p": 0.9705207992,
39
- "r": 0.9657757497,
40
- "f": 0.9681424604
41
  },
42
  "Degree": {
43
- "p": 0.9571675302,
44
- "r": 0.9519065613,
45
- "f": 0.9545297968
46
  },
47
  "PronType": {
48
- "p": 0.9897937025,
49
- "r": 0.983175151,
50
- "f": 0.9864733254
51
  },
52
  "Poss": {
53
- "p": 0.9920948617,
54
  "r": 0.9920948617,
55
- "f": 0.9920948617
56
  },
57
  "Case": {
58
- "p": 0.9949776786,
59
- "r": 0.9872646733,
60
- "f": 0.9911061701
61
  },
62
  "Reflex": {
63
  "p": 1.0,
@@ -75,186 +75,181 @@
75
  "f": 1.0
76
  },
77
  "Person": {
78
- "p": 0.9895536562,
79
- "r": 0.9890840057,
80
- "f": 0.9893187752
81
  },
82
  "Animacy": {
83
- "p": 0.9982949702,
84
- "r": 0.9974446337,
85
- "f": 0.9978696208
86
  },
87
  "Voice": {
88
- "p": 0.9424460432,
89
- "r": 0.9492753623,
90
- "f": 0.9458483755
91
  },
92
  "Abbr": {
93
- "p": 0.9708029197,
94
  "r": 0.83125,
95
- "f": 0.8956228956
96
  }
97
  },
98
- "sents_p": 0.9219071106,
99
- "sents_r": 0.9310917393,
100
- "sents_f": 0.9264766625,
101
- "dep_uas": 0.8826525829,
102
- "dep_las": 0.84903125,
103
  "dep_las_per_type": {
104
  "nmod": {
105
- "p": 0.7744391026,
106
- "r": 0.7931883463,
107
- "f": 0.7837016015
108
  },
109
  "nsubj": {
110
- "p": 0.8860443334,
111
- "r": 0.8745762712,
112
- "f": 0.8802729529
113
  },
114
  "flat:name": {
115
- "p": 0.8867313916,
116
- "r": 0.8824476651,
117
- "f": 0.8845843422
118
  },
119
  "root": {
120
- "p": 0.8939267887,
121
- "r": 0.8920713989,
122
- "f": 0.8929981301
123
  },
124
  "advmod": {
125
- "p": 0.8216682646,
126
- "r": 0.8224568138,
127
- "f": 0.8220623501
128
  },
129
  "mark": {
130
- "p": 0.9113573407,
131
- "r": 0.9149054505,
132
- "f": 0.9131279489
133
  },
134
  "advcl": {
135
- "p": 0.6785079929,
136
- "r": 0.6552315609,
137
- "f": 0.6666666667
138
  },
139
  "obj": {
140
- "p": 0.8656898657,
141
- "r": 0.8796526055,
142
- "f": 0.8726153846
143
  },
144
  "case": {
145
- "p": 0.9318299637,
146
- "r": 0.9277419355,
147
- "f": 0.9297814561
148
  },
149
  "det": {
150
- "p": 0.9564393939,
151
- "r": 0.9588607595,
152
- "f": 0.9576485461
153
  },
154
  "obl": {
155
- "p": 0.7561669829,
156
- "r": 0.7212669683,
157
- "f": 0.7383047707
158
  },
159
  "aux": {
160
- "p": 0.9432234432,
161
- "r": 0.9321266968,
162
- "f": 0.9376422394
163
  },
164
  "acl:relcl": {
165
- "p": 0.7780269058,
166
- "r": 0.7815315315,
167
- "f": 0.7797752809
168
  },
169
  "iobj": {
170
- "p": 0.8024691358,
171
- "r": 0.7386363636,
172
- "f": 0.7692307692
173
  },
174
  "xcomp": {
175
- "p": 0.6777041943,
176
- "r": 0.6961451247,
177
- "f": 0.6868008949
178
  },
179
  "cc": {
180
- "p": 0.9162790698,
181
- "r": 0.9113338473,
182
- "f": 0.9137997681
183
  },
184
  "conj": {
185
- "p": 0.6964410328,
186
- "r": 0.7247639797,
187
- "f": 0.7103202847
188
  },
189
  "amod": {
190
- "p": 0.9262644729,
191
- "r": 0.920654149,
192
- "f": 0.9234507898
193
  },
194
  "nummod": {
195
- "p": 0.9143968872,
196
- "r": 0.9591836735,
197
- "f": 0.9362549801
198
  },
199
  "compound:prt": {
200
- "p": 0.803030303,
201
- "r": 0.7653429603,
202
- "f": 0.7837338262
203
  },
204
  "cop": {
205
- "p": 0.856812933,
206
- "r": 0.884386174,
207
- "f": 0.8703812317
208
  },
209
  "appos": {
210
- "p": 0.2794117647,
211
- "r": 0.19,
212
- "f": 0.2261904762
213
  },
214
  "ccomp": {
215
- "p": 0.7955390335,
216
- "r": 0.842519685,
217
- "f": 0.8183556405
218
- },
219
- "expl": {
220
- "p": 0.7128463476,
221
- "r": 0.7648648649,
222
- "f": 0.7379400261
223
  },
224
  "acl": {
225
- "p": 0.658008658,
226
- "r": 0.6129032258,
227
- "f": 0.6346555324
228
  },
229
  "csubj": {
230
- "p": 0.7230769231,
231
- "r": 0.6861313869,
232
- "f": 0.7041198502
 
 
 
 
 
233
  },
234
  "nsubj:pass": {
235
- "p": 0.862244898,
236
- "r": 0.7824074074,
237
- "f": 0.8203883495
238
  },
239
  "aux:pass": {
240
- "p": 0.9464285714,
241
- "r": 0.8833333333,
242
- "f": 0.9137931034
243
- },
244
- "parataxis": {
245
- "p": 0.8255033557,
246
- "r": 0.6542553191,
247
- "f": 0.7299703264
248
  },
249
  "acl:cleft": {
250
- "p": 0.4333333333,
251
- "r": 0.4814814815,
252
- "f": 0.4561403509
253
  },
254
  "orphan": {
255
- "p": 0.1428571429,
256
- "r": 0.0384615385,
257
- "f": 0.0606060606
258
  },
259
  "dep": {
260
  "p": 0.0,
@@ -266,20 +261,25 @@
266
  "r": 0.0,
267
  "f": 0.0
268
  },
269
- "flat:foreign": {
270
- "p": 0.2,
271
- "r": 0.1612903226,
272
- "f": 0.1785714286
273
  },
274
  "compound": {
275
- "p": 0.9285714286,
276
- "r": 0.3170731707,
277
- "f": 0.4727272727
 
 
 
 
 
278
  },
279
  "discourse": {
280
- "p": 0.7272727273,
281
- "r": 0.347826087,
282
- "f": 0.4705882353
283
  },
284
  "csubj:pass": {
285
  "p": 0.0,
@@ -287,52 +287,52 @@
287
  "f": 0.0
288
  }
289
  },
290
- "lemma_acc": 0.9686243182,
291
- "tag_acc": 0.9671340808,
292
- "ents_p": 0.7655003069,
293
- "ents_r": 0.7387440758,
294
- "ents_f": 0.7518842327,
295
  "ents_per_type": {
296
  "PER": {
297
- "p": 0.8068739771,
298
- "r": 0.8068739771,
299
- "f": 0.8068739771
300
  },
301
- "ORG": {
302
- "p": 0.7772511848,
303
- "r": 0.8118811881,
304
- "f": 0.794188862
305
  },
306
  "GPE_LOC": {
307
- "p": 0.7546468401,
308
- "r": 0.7837837838,
309
- "f": 0.7689393939
310
  },
311
- "PROD": {
312
- "p": 0.65625,
313
- "r": 0.5185185185,
314
- "f": 0.5793103448
315
- },
316
- "DRV": {
317
- "p": 0.7692307692,
318
- "r": 0.7594936709,
319
- "f": 0.7643312102
320
  },
321
  "LOC": {
322
- "p": 0.652173913,
323
- "r": 0.4128440367,
324
- "f": 0.5056179775
 
 
 
 
 
325
  },
326
  "GPE_ORG": {
327
- "p": 0.7142857143,
328
- "r": 0.5454545455,
329
- "f": 0.618556701
330
  },
331
  "EVT": {
332
- "p": 0.4,
333
  "r": 0.4444444444,
334
- "f": 0.4210526316
335
  }
336
  },
337
- "speed": 10943.0978477171
338
  }
 
3
  "token_p": 0.997080292,
4
  "token_r": 0.9953256895,
5
  "token_f": 0.9962022181,
6
+ "pos_acc": 0.9676832796,
7
+ "morph_acc": 0.9535447607,
8
+ "morph_micro_p": 0.9699474698,
9
+ "morph_micro_r": 0.9617438158,
10
+ "morph_micro_f": 0.9658282229,
11
  "morph_per_feat": {
12
  "Definite": {
13
+ "p": 0.973768983,
14
+ "r": 0.9599637065,
15
+ "f": 0.9668170655
16
  },
17
  "Gender": {
18
+ "p": 0.9396139882,
19
+ "r": 0.9327515887,
20
+ "f": 0.9361702128
21
  },
22
  "Number": {
23
+ "p": 0.9708716276,
24
+ "r": 0.9597040076,
25
+ "f": 0.9652555175
26
  },
27
  "Mood": {
28
+ "p": 0.979197995,
29
+ "r": 0.9769942486,
30
+ "f": 0.9780948805
31
  },
32
  "Tense": {
33
+ "p": 0.9801057668,
34
+ "r": 0.9801057668,
35
+ "f": 0.9801057668
36
  },
37
  "VerbForm": {
38
+ "p": 0.9670096358,
39
+ "r": 0.9649608866,
40
+ "f": 0.9659841749
41
  },
42
  "Degree": {
43
+ "p": 0.9647592463,
44
+ "r": 0.9498454139,
45
+ "f": 0.9572442444
46
  },
47
  "PronType": {
48
+ "p": 0.9887323944,
49
+ "r": 0.984253667,
50
+ "f": 0.9864879472
51
  },
52
  "Poss": {
53
+ "p": 0.996031746,
54
  "r": 0.9920948617,
55
+ "f": 0.9940594059
56
  },
57
  "Case": {
58
+ "p": 0.9933184855,
59
+ "r": 0.9878183832,
60
+ "f": 0.9905607996
61
  },
62
  "Reflex": {
63
  "p": 1.0,
 
75
  "f": 1.0
76
  },
77
  "Person": {
78
+ "p": 0.9886201991,
79
+ "r": 0.9895586141,
80
+ "f": 0.9890891841
81
  },
82
  "Animacy": {
83
+ "p": 0.996592845,
84
+ "r": 0.996592845,
85
+ "f": 0.996592845
86
  },
87
  "Voice": {
88
+ "p": 0.9361702128,
89
+ "r": 0.9565217391,
90
+ "f": 0.9462365591
91
  },
92
  "Abbr": {
93
+ "p": 0.9779411765,
94
  "r": 0.83125,
95
+ "f": 0.8986486486
96
  }
97
  },
98
+ "sents_p": 0.9325331126,
99
+ "sents_r": 0.9352428394,
100
+ "sents_f": 0.9338860104,
101
+ "dep_uas": 0.8828806301,
102
+ "dep_las": 0.8486771164,
103
  "dep_las_per_type": {
104
  "nmod": {
105
+ "p": 0.7644,
106
+ "r": 0.7841608535,
107
+ "f": 0.7741543447
108
  },
109
  "nsubj": {
110
+ "p": 0.8836848635,
111
+ "r": 0.8779661017,
112
+ "f": 0.8808162003
113
  },
114
  "flat:name": {
115
+ "p": 0.856466877,
116
+ "r": 0.8743961353,
117
+ "f": 0.8653386454
118
  },
119
  "root": {
120
+ "p": 0.8972118186,
121
+ "r": 0.8949771689,
122
+ "f": 0.8960931006
123
  },
124
  "advmod": {
125
+ "p": 0.8163950144,
126
+ "r": 0.8171785029,
127
+ "f": 0.8167865707
128
  },
129
  "mark": {
130
+ "p": 0.9122905028,
131
+ "r": 0.9082313682,
132
+ "f": 0.9102564103
133
  },
134
  "advcl": {
135
+ "p": 0.6868327402,
136
+ "r": 0.6620926244,
137
+ "f": 0.6742358079
138
  },
139
  "obj": {
140
+ "p": 0.8679588128,
141
+ "r": 0.8889578164,
142
+ "f": 0.8783328226
143
  },
144
  "case": {
145
+ "p": 0.9327817994,
146
+ "r": 0.9310967742,
147
+ "f": 0.9319385251
148
  },
149
  "det": {
150
+ "p": 0.9608091024,
151
+ "r": 0.9620253165,
152
+ "f": 0.9614168248
153
  },
154
  "obl": {
155
+ "p": 0.7551117451,
156
+ "r": 0.7185520362,
157
+ "f": 0.7363783909
158
  },
159
  "aux": {
160
+ "p": 0.9340560072,
161
+ "r": 0.9357466063,
162
+ "f": 0.9349005425
163
  },
164
  "acl:relcl": {
165
+ "p": 0.8148148148,
166
+ "r": 0.7927927928,
167
+ "f": 0.803652968
168
  },
169
  "iobj": {
170
+ "p": 0.7313432836,
171
+ "r": 0.5568181818,
172
+ "f": 0.6322580645
173
  },
174
  "xcomp": {
175
+ "p": 0.6907894737,
176
+ "r": 0.7142857143,
177
+ "f": 0.7023411371
178
  },
179
  "cc": {
180
+ "p": 0.9068322981,
181
+ "r": 0.900539707,
182
+ "f": 0.9036750484
183
  },
184
  "conj": {
185
+ "p": 0.7009873061,
186
+ "r": 0.721859114,
187
+ "f": 0.7112701252
188
  },
189
  "amod": {
190
+ "p": 0.9233110164,
191
+ "r": 0.9188370684,
192
+ "f": 0.9210686096
193
  },
194
  "nummod": {
195
+ "p": 0.8996138996,
196
+ "r": 0.9510204082,
197
+ "f": 0.9246031746
198
  },
199
  "compound:prt": {
200
+ "p": 0.8429118774,
201
+ "r": 0.7942238267,
202
+ "f": 0.8178438662
203
  },
204
  "cop": {
205
+ "p": 0.858974359,
206
+ "r": 0.8784266985,
207
+ "f": 0.8685916323
208
  },
209
  "appos": {
210
+ "p": 0.4242424242,
211
+ "r": 0.28,
212
+ "f": 0.3373493976
213
  },
214
  "ccomp": {
215
+ "p": 0.8028673835,
216
+ "r": 0.8818897638,
217
+ "f": 0.8405253283
 
 
 
 
 
218
  },
219
  "acl": {
220
+ "p": 0.6394849785,
221
+ "r": 0.6008064516,
222
+ "f": 0.6195426195
223
  },
224
  "csubj": {
225
+ "p": 0.7307692308,
226
+ "r": 0.6934306569,
227
+ "f": 0.7116104869
228
+ },
229
+ "expl": {
230
+ "p": 0.694235589,
231
+ "r": 0.7486486486,
232
+ "f": 0.7204161248
233
  },
234
  "nsubj:pass": {
235
+ "p": 0.8316831683,
236
+ "r": 0.7777777778,
237
+ "f": 0.8038277512
238
  },
239
  "aux:pass": {
240
+ "p": 0.9203539823,
241
+ "r": 0.8666666667,
242
+ "f": 0.8927038627
 
 
 
 
 
243
  },
244
  "acl:cleft": {
245
+ "p": 0.4615384615,
246
+ "r": 0.4444444444,
247
+ "f": 0.4528301887
248
  },
249
  "orphan": {
250
+ "p": 0.0,
251
+ "r": 0.0,
252
+ "f": 0.0
253
  },
254
  "dep": {
255
  "p": 0.0,
 
261
  "r": 0.0,
262
  "f": 0.0
263
  },
264
+ "parataxis": {
265
+ "p": 0.8243243243,
266
+ "r": 0.6489361702,
267
+ "f": 0.7261904762
268
  },
269
  "compound": {
270
+ "p": 0.9,
271
+ "r": 0.2195121951,
272
+ "f": 0.3529411765
273
+ },
274
+ "flat:foreign": {
275
+ "p": 0.3888888889,
276
+ "r": 0.2258064516,
277
+ "f": 0.2857142857
278
  },
279
  "discourse": {
280
+ "p": 0.6923076923,
281
+ "r": 0.3913043478,
282
+ "f": 0.5
283
  },
284
  "csubj:pass": {
285
  "p": 0.0,
 
287
  "f": 0.0
288
  }
289
  },
290
+ "lemma_acc": 0.9687620517,
291
+ "tag_acc": 0.9676832796,
292
+ "ents_p": 0.7702786378,
293
+ "ents_r": 0.7369668246,
294
+ "ents_f": 0.753254617,
295
  "ents_per_type": {
296
  "PER": {
297
+ "p": 0.8344262295,
298
+ "r": 0.8330605565,
299
+ "f": 0.8337428337
300
  },
301
+ "PROD": {
302
+ "p": 0.6240601504,
303
+ "r": 0.512345679,
304
+ "f": 0.5627118644
305
  },
306
  "GPE_LOC": {
307
+ "p": 0.7791164659,
308
+ "r": 0.749034749,
309
+ "f": 0.7637795276
310
  },
311
+ "ORG": {
312
+ "p": 0.7772397094,
313
+ "r": 0.7945544554,
314
+ "f": 0.7858017136
 
 
 
 
 
315
  },
316
  "LOC": {
317
+ "p": 0.5208333333,
318
+ "r": 0.4587155963,
319
+ "f": 0.487804878
320
+ },
321
+ "DRV": {
322
+ "p": 0.7866666667,
323
+ "r": 0.746835443,
324
+ "f": 0.7662337662
325
  },
326
  "GPE_ORG": {
327
+ "p": 0.7058823529,
328
+ "r": 0.4363636364,
329
+ "f": 0.5393258427
330
  },
331
  "EVT": {
332
+ "p": 0.8,
333
  "r": 0.4444444444,
334
+ "f": 0.5714285714
335
  }
336
  },
337
+ "speed": 13912.0236342851
338
  }
lemmatizer/cfg CHANGED
@@ -37,213 +37,214 @@
37
  67,
38
  69,
39
  70,
40
- 72,
41
- 74,
42
- 77,
43
- 80,
44
- 82,
45
- 86,
46
- 88,
47
- 92,
48
- 94,
49
  95,
50
  96,
51
- 98,
52
- 100,
53
- 102,
54
- 106,
55
- 108,
56
- 111,
57
  112,
58
- 114,
59
- 116,
60
- 118,
61
- 120,
62
- 124,
63
- 126,
64
- 128,
65
- 130,
66
- 133,
67
- 135,
68
  136,
69
  137,
70
  138,
71
- 140,
72
- 142,
73
- 144,
74
- 146,
75
- 148,
76
- 150,
77
- 152,
78
  153,
79
- 156,
80
- 159,
81
  160,
82
- 162,
83
  163,
84
- 165,
85
- 167,
86
- 169,
87
- 171,
88
- 173,
89
  174,
90
- 176,
91
- 178,
92
  179,
93
  180,
94
  181,
95
- 183,
96
  184,
97
- 186,
98
  187,
99
  188,
100
  189,
101
- 192,
102
  193,
103
- 195,
104
- 197,
105
  198,
106
- 201,
107
- 203,
108
- 205,
109
- 208,
110
- 211,
111
  212,
112
  213,
113
  214,
114
- 217,
115
- 219,
116
- 221,
117
  222,
118
  223,
119
- 225,
120
  226,
121
  228,
122
- 229,
123
- 232,
124
- 233,
125
  236,
126
- 239,
127
- 241,
128
- 242,
129
  243,
130
  244,
131
  247,
132
  250,
133
  252,
134
  253,
135
- 256,
 
136
  258,
137
- 259,
138
- 260,
139
  263,
140
  264,
141
- 266,
142
  267,
143
- 268,
144
  269,
145
- 270,
146
  272,
147
- 274,
148
  276,
149
- 278,
150
  279,
 
151
  281,
 
 
152
  285,
153
- 287,
154
  289,
155
- 291,
156
  295,
 
157
  297,
158
- 298,
159
- 299,
160
  302,
161
- 303,
162
- 304,
163
- 307,
164
  308,
165
  309,
166
  311,
167
- 312,
168
- 314,
169
- 46,
170
- 316,
171
- 318,
172
  319,
173
  321,
174
  322,
175
- 323,
176
  324,
177
  326,
178
- 327,
179
  328,
180
- 330,
181
  331,
 
182
  333,
183
- 335,
184
  336,
185
  337,
186
  338,
187
  340,
188
  341,
189
  342,
190
- 343,
191
  345,
192
  347,
193
- 348,
194
  349,
 
195
  351,
196
- 353,
 
 
197
  356,
198
- 358,
199
  359,
200
- 360,
201
  361,
202
  362,
203
- 364,
204
  365,
205
- 368,
206
- 369,
207
- 371,
208
  373,
 
 
209
  376,
210
  378,
211
  379,
212
  382,
 
213
  385,
214
  387,
215
- 389,
216
- 391,
217
- 393,
218
  395,
219
- 397,
220
- 399,
221
  401,
222
  403,
223
- 405,
 
224
  407,
225
- 409,
226
- 411,
227
- 413,
228
  414,
229
- 415,
230
- 417,
231
  418,
232
  419,
233
- 421,
234
  422,
 
235
  424,
236
- 426,
237
- 429,
238
- 431,
 
239
  432,
240
- 434,
241
  436,
242
- 437,
243
  439,
244
  440,
245
  442,
246
- 443,
247
  444,
248
  447,
249
  449,
@@ -253,14 +254,13 @@
253
  453,
254
  456,
255
  457,
256
- 458,
257
  460,
258
- 461,
259
- 463,
260
  466,
261
  467,
262
- 468,
263
- 470,
264
  471,
265
  473,
266
  476,
@@ -277,302 +277,315 @@
277
  490,
278
  491,
279
  492,
 
280
  494,
281
  496,
282
  498,
283
- 499,
284
  501,
285
- 502,
286
  503,
287
  504,
288
- 507,
289
- 508,
 
290
  510,
291
- 511,
292
- 515,
293
- 519,
294
  521,
295
  523,
296
  525,
297
  527,
298
- 528,
299
  529,
300
  530,
301
  531,
 
302
  533,
303
- 534,
304
  536,
305
- 537,
306
  538,
 
307
  540,
308
  541,
309
- 543,
 
310
  545,
311
- 546,
312
- 548,
313
- 552,
314
  553,
315
- 554,
316
- 555,
317
- 556,
318
  558,
319
  559,
320
  560,
321
  562,
322
- 563,
323
  564,
 
324
  566,
325
  568,
326
  569,
327
- 570,
328
  572,
329
  574,
330
  576,
331
- 579,
332
- 580,
333
  581,
 
334
  583,
335
- 584,
336
  586,
337
- 587,
338
  589,
339
- 592,
340
  594,
341
  595,
342
- 596,
343
  598,
344
- 600,
345
- 602,
346
- 604,
 
347
  607,
348
- 608,
349
- 611,
350
- 612,
351
  613,
352
- 616,
 
353
  618,
354
  620,
355
- 621,
356
  623,
357
- 624,
358
  625,
359
  626,
360
  627,
361
- 628,
362
  629,
 
363
  631,
364
  632,
 
365
  635,
366
- 636,
367
- 639,
368
  640,
369
  642,
370
- 644,
371
  646,
372
- 650,
 
373
  652,
374
- 653,
375
  654,
376
  655,
377
  656,
378
  657,
 
379
  659,
380
- 660,
381
  662,
382
- 663,
383
  664,
 
384
  666,
385
  668,
386
  670,
387
  672,
388
- 673,
389
  674,
390
  675,
 
391
  677,
392
  679,
393
- 680,
394
  682,
395
  683,
396
- 685,
397
  686,
398
  687,
399
- 688,
400
  689,
 
401
  691,
 
 
402
  694,
403
  695,
404
- 696,
405
  697,
406
- 698,
407
  700,
408
  701,
 
409
  703,
410
  704,
411
  705,
412
- 706,
413
  708,
414
  710,
415
  711,
416
  712,
417
- 713,
418
- 715,
419
  716,
420
  717,
421
  718,
422
- 719,
423
  720,
424
  721,
425
- 722,
426
  724,
427
  725,
 
428
  727,
429
  728,
430
  729,
431
  730,
 
432
  733,
433
  735,
434
- 737,
435
  738,
436
  740,
437
  742,
438
  743,
439
  744,
440
- 745,
441
  746,
442
- 747,
443
  749,
444
  750,
445
  751,
446
  752,
 
447
  754,
448
  756,
449
  757,
450
  758,
451
  760,
452
- 761,
453
  762,
454
  763,
455
  764,
456
- 765,
457
  766,
458
- 767,
459
  768,
460
  769,
461
  770,
 
 
462
  773,
463
  774,
464
  775,
465
  776,
466
  777,
467
  778,
468
- 779,
469
- 780,
470
  781,
471
  783,
472
  784,
 
473
  786,
 
 
474
  789,
 
475
  792,
476
- 793,
477
  795,
478
- 796,
479
  798,
480
- 799,
481
- 800,
482
  801,
483
- 803,
484
  804,
 
 
 
 
485
  808,
486
  809,
487
  811,
488
  812,
489
  813,
490
- 814,
491
- 816,
492
  818,
493
  819,
494
- 820,
495
- 113,
496
- 41,
497
  821,
498
  822,
499
  823,
500
- 825,
501
- 827,
502
  828,
 
 
503
  831,
504
  832,
505
  833,
506
- 834,
507
  837,
508
  838,
509
  839,
510
- 840,
511
  842,
 
512
  844,
513
  845,
514
  847,
515
- 848,
516
  850,
517
  851,
 
518
  853,
519
- 855,
520
  856,
521
- 857,
522
  858,
 
523
  860,
524
- 861,
525
  862,
526
  863,
 
527
  865,
528
- 868,
 
 
529
  872,
530
  873,
531
- 875,
532
  876,
533
  877,
534
- 880,
535
- 881,
536
  882,
537
- 883,
538
- 885,
539
- 887,
540
  886,
 
541
  888,
542
  889,
543
  890,
 
544
  892,
545
- 894,
546
  895,
 
547
  897,
548
  898,
549
  899,
 
550
  901,
551
  902,
552
- 904,
553
- 906,
 
554
  908,
555
- 910,
 
556
  912,
557
  913,
558
  915,
559
- 919,
 
560
  920,
561
  922,
562
- 923,
563
  924,
564
- 925,
565
  926,
566
- 927,
567
  928,
568
- 930,
569
- 932,
570
- 933,
571
- 934,
572
  937,
 
573
  939,
 
574
  941,
575
  942,
576
- 943
 
 
 
 
 
 
 
 
 
 
577
  ]
578
  }
 
37
  67,
38
  69,
39
  70,
40
+ 71,
41
+ 73,
42
+ 75,
43
+ 78,
44
+ 81,
45
+ 83,
46
+ 87,
47
+ 89,
48
+ 93,
49
  95,
50
  96,
51
+ 97,
52
+ 99,
53
+ 101,
54
+ 103,
55
+ 107,
56
+ 109,
57
  112,
58
+ 113,
59
+ 115,
60
+ 117,
61
+ 119,
62
+ 121,
63
+ 125,
64
+ 127,
65
+ 129,
66
+ 131,
67
+ 134,
68
  136,
69
  137,
70
  138,
71
+ 139,
72
+ 141,
73
+ 143,
74
+ 145,
75
+ 147,
76
+ 149,
77
+ 151,
78
  153,
79
+ 154,
80
+ 157,
81
  160,
82
+ 161,
83
  163,
84
+ 164,
85
+ 166,
86
+ 168,
87
+ 170,
88
+ 172,
89
  174,
90
+ 175,
91
+ 177,
92
  179,
93
  180,
94
  181,
95
+ 182,
96
  184,
97
+ 185,
98
  187,
99
  188,
100
  189,
101
+ 190,
102
  193,
103
+ 194,
104
+ 196,
105
  198,
106
+ 199,
107
+ 202,
108
+ 204,
109
+ 206,
110
+ 209,
111
  212,
112
  213,
113
  214,
114
+ 215,
115
+ 218,
116
+ 220,
117
  222,
118
  223,
119
+ 224,
120
  226,
121
  228,
122
+ 230,
123
+ 234,
 
124
  236,
125
+ 237,
126
+ 238,
127
+ 240,
128
  243,
129
  244,
130
  247,
131
  250,
132
  252,
133
  253,
134
+ 254,
135
+ 255,
136
  258,
137
+ 261,
 
138
  263,
139
  264,
 
140
  267,
 
141
  269,
142
+ 271,
143
  272,
144
+ 273,
145
  276,
146
+ 277,
147
  279,
148
+ 280,
149
  281,
150
+ 282,
151
+ 283,
152
  285,
 
153
  289,
154
+ 293,
155
  295,
156
+ 296,
157
  297,
158
+ 300,
159
+ 301,
160
  302,
161
+ 305,
162
+ 306,
163
+ 46,
164
  308,
165
  309,
166
  311,
167
+ 313,
168
+ 315,
169
+ 317,
 
 
170
  319,
171
  321,
172
  322,
 
173
  324,
174
  326,
 
175
  328,
176
+ 329,
177
  331,
178
+ 332,
179
  333,
180
+ 334,
181
  336,
182
  337,
183
  338,
184
  340,
185
  341,
186
  342,
187
+ 344,
188
  345,
189
  347,
 
190
  349,
191
+ 350,
192
  351,
193
+ 352,
194
+ 354,
195
+ 355,
196
  356,
197
+ 357,
198
  359,
 
199
  361,
200
  362,
201
+ 363,
202
  365,
203
+ 367,
204
+ 370,
205
+ 372,
206
  373,
207
+ 374,
208
+ 375,
209
  376,
210
  378,
211
  379,
212
  382,
213
+ 383,
214
  385,
215
  387,
216
+ 390,
217
+ 392,
218
+ 394,
219
  395,
220
+ 398,
 
221
  401,
222
  403,
223
+ 404,
224
+ 406,
225
  407,
226
+ 408,
227
+ 410,
228
+ 412,
229
  414,
230
+ 416,
 
231
  418,
232
  419,
233
+ 420,
234
  422,
235
+ 423,
236
  424,
237
+ 425,
238
+ 427,
239
+ 428,
240
+ 430,
241
  432,
242
+ 435,
243
  436,
244
+ 438,
245
  439,
246
  440,
247
  442,
 
248
  444,
249
  447,
250
  449,
 
254
  453,
255
  456,
256
  457,
257
+ 459,
258
  460,
259
+ 462,
260
+ 465,
261
  466,
262
  467,
263
+ 469,
 
264
  471,
265
  473,
266
  476,
 
277
  490,
278
  491,
279
  492,
280
+ 493,
281
  494,
282
  496,
283
  498,
284
+ 500,
285
  501,
 
286
  503,
287
  504,
288
+ 505,
289
+ 506,
290
+ 509,
291
  510,
292
+ 512,
293
+ 513,
294
+ 517,
295
  521,
296
  523,
297
  525,
298
  527,
 
299
  529,
300
  530,
301
  531,
302
+ 532,
303
  533,
304
+ 535,
305
  536,
 
306
  538,
307
+ 539,
308
  540,
309
  541,
310
+ 542,
311
+ 544,
312
  545,
313
+ 547,
314
+ 549,
315
+ 551,
316
  553,
317
+ 557,
 
 
318
  558,
319
  559,
320
  560,
321
  562,
 
322
  564,
323
+ 565,
324
  566,
325
  568,
326
  569,
327
+ 571,
328
  572,
329
  574,
330
  576,
331
+ 578,
 
332
  581,
333
+ 582,
334
  583,
335
+ 585,
336
  586,
337
+ 588,
338
  589,
339
+ 591,
340
  594,
341
  595,
342
+ 597,
343
  598,
344
+ 599,
345
+ 601,
346
+ 603,
347
+ 605,
348
  607,
349
+ 610,
 
 
350
  613,
351
+ 614,
352
+ 617,
353
  618,
354
  620,
355
+ 622,
356
  623,
 
357
  625,
358
  626,
359
  627,
 
360
  629,
361
+ 630,
362
  631,
363
  632,
364
+ 634,
365
  635,
366
+ 638,
 
367
  640,
368
  642,
369
+ 645,
370
  646,
371
+ 647,
372
+ 651,
373
  652,
 
374
  654,
375
  655,
376
  656,
377
  657,
378
+ 658,
379
  659,
380
+ 661,
381
  662,
 
382
  664,
383
+ 665,
384
  666,
385
  668,
386
  670,
387
  672,
 
388
  674,
389
  675,
390
+ 676,
391
  677,
392
  679,
393
+ 681,
394
  682,
395
  683,
396
+ 684,
397
  686,
398
  687,
 
399
  689,
400
+ 690,
401
  691,
402
+ 692,
403
+ 693,
404
  694,
405
  695,
 
406
  697,
 
407
  700,
408
  701,
409
+ 702,
410
  703,
411
  704,
412
  705,
413
+ 707,
414
  708,
415
  710,
416
  711,
417
  712,
418
+ 714,
 
419
  716,
420
  717,
421
  718,
 
422
  720,
423
  721,
424
+ 723,
425
  724,
426
  725,
427
+ 726,
428
  727,
429
  728,
430
  729,
431
  730,
432
+ 732,
433
  733,
434
  735,
 
435
  738,
436
  740,
437
  742,
438
  743,
439
  744,
 
440
  746,
441
+ 748,
442
  749,
443
  750,
444
  751,
445
  752,
446
+ 753,
447
  754,
448
  756,
449
  757,
450
  758,
451
  760,
 
452
  762,
453
  763,
454
  764,
 
455
  766,
 
456
  768,
457
  769,
458
  770,
459
+ 771,
460
+ 772,
461
  773,
462
  774,
463
  775,
464
  776,
465
  777,
466
  778,
 
 
467
  781,
468
  783,
469
  784,
470
+ 785,
471
  786,
472
+ 787,
473
+ 788,
474
  789,
475
+ 791,
476
  792,
477
+ 794,
478
  795,
 
479
  798,
 
 
480
  801,
481
+ 802,
482
  804,
483
+ 805,
484
+ 807,
485
+ 391,
486
+ 232,
487
  808,
488
  809,
489
  811,
490
  812,
491
  813,
492
+ 817,
 
493
  818,
494
  819,
 
 
 
495
  821,
496
  822,
497
  823,
498
+ 824,
499
+ 826,
500
  828,
501
+ 829,
502
+ 830,
503
  831,
504
  832,
505
  833,
506
+ 835,
507
  837,
508
  838,
509
  839,
 
510
  842,
511
+ 843,
512
  844,
513
  845,
514
  847,
 
515
  850,
516
  851,
517
+ 852,
518
  853,
519
+ 854,
520
  856,
 
521
  858,
522
+ 859,
523
  860,
 
524
  862,
525
  863,
526
+ 864,
527
  865,
528
+ 867,
529
+ 869,
530
+ 870,
531
  872,
532
  873,
533
+ 874,
534
  876,
535
  877,
536
+ 879,
 
537
  882,
 
 
 
538
  886,
539
+ 887,
540
  888,
541
  889,
542
  890,
543
+ 891,
544
  892,
 
545
  895,
546
+ 896,
547
  897,
548
  898,
549
  899,
550
+ 900,
551
  901,
552
  902,
553
+ 903,
554
+ 905,
555
+ 907,
556
  908,
557
+ 909,
558
+ 911,
559
  912,
560
  913,
561
  915,
562
+ 916,
563
+ 918,
564
  920,
565
  922,
 
566
  924,
 
567
  926,
 
568
  928,
569
+ 927,
570
+ 929,
571
+ 931,
572
+ 935,
573
  937,
574
+ 938,
575
  939,
576
+ 940,
577
  941,
578
  942,
579
+ 943,
580
+ 944,
581
+ 946,
582
+ 948,
583
+ 949,
584
+ 952,
585
+ 953,
586
+ 955,
587
+ 312,
588
+ 956,
589
+ 957
590
  ]
591
  }
lemmatizer/model CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c065668d270c91477bcc582e8d595aa3636a1d25696254eb09bd139e38a3e3fb
3
- size 223154
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4265c1162d2f46699a1c037c3659cc925d747f2e250df27f372d95aa1672dae5
3
+ size 228198
lemmatizer/trees CHANGED
Binary files a/lemmatizer/trees and b/lemmatizer/trees differ
 
meta.json CHANGED
@@ -1,14 +1,14 @@
1
  {
2
  "lang":"nb",
3
  "name":"core_news_sm",
4
- "version":"3.3.0",
5
  "description":"Norwegian (Bokm\u00e5l) pipeline optimized for CPU. Components: tok2vec, morphologizer, parser, lemmatizer (trainable_lemmatizer), senter, ner, attribute_ruler.",
6
  "author":"Explosion",
7
  "email":"contact@explosion.ai",
8
  "url":"https://explosion.ai",
9
  "license":"MIT",
10
- "spacy_version":">=3.3.0.dev0,<3.4.0",
11
- "spacy_git_version":"849bef2de",
12
  "vectors":{
13
  "width":0,
14
  "vectors":0,
@@ -142,6 +142,7 @@
142
  "Definite=Ind|Gender=Masc|Number=Sing|POS=DET|PronType=Dem",
143
  "Case=Gen|Definite=Def|Gender=Fem|Number=Plur|POS=NOUN",
144
  "Case=Gen|Gender=Neut|Number=Sing|POS=DET|PronType=Dem",
 
145
  "Animacy=Hum|Number=Sing|POS=PRON|PronType=Art,Prs",
146
  "Mood=Imp|POS=AUX|VerbForm=Fin",
147
  "Number=Plur|POS=PRON|Person=3|PronType=Prs,Tot",
@@ -302,61 +303,61 @@
302
  "token_p":0.997080292,
303
  "token_r":0.9953256895,
304
  "token_f":0.9962022181,
305
- "pos_acc":0.9671340808,
306
- "morph_acc":0.9532993525,
307
- "morph_micro_p":0.9702239789,
308
- "morph_micro_r":0.9619070945,
309
- "morph_micro_f":0.9660476366,
310
  "morph_per_feat":{
311
  "Definite":{
312
- "p":0.974126035,
313
- "r":0.9607576273,
314
- "f":0.9673956489
315
  },
316
  "Gender":{
317
- "p":0.9403884796,
318
- "r":0.9321824908,
319
- "f":0.936267505
320
  },
321
  "Number":{
322
- "p":0.9702808864,
323
- "r":0.9591911495,
324
- "f":0.9647041486
325
  },
326
  "Mood":{
327
- "p":0.9797348011,
328
- "r":0.9792448112,
329
- "f":0.9794897449
330
  },
331
  "Tense":{
332
- "p":0.9803674805,
333
- "r":0.980861244,
334
- "f":0.9806143001
335
  },
336
  "VerbForm":{
337
- "p":0.9705207992,
338
- "r":0.9657757497,
339
- "f":0.9681424604
340
  },
341
  "Degree":{
342
- "p":0.9571675302,
343
- "r":0.9519065613,
344
- "f":0.9545297968
345
  },
346
  "PronType":{
347
- "p":0.9897937025,
348
- "r":0.983175151,
349
- "f":0.9864733254
350
  },
351
  "Poss":{
352
- "p":0.9920948617,
353
  "r":0.9920948617,
354
- "f":0.9920948617
355
  },
356
  "Case":{
357
- "p":0.9949776786,
358
- "r":0.9872646733,
359
- "f":0.9911061701
360
  },
361
  "Reflex":{
362
  "p":1.0,
@@ -374,186 +375,181 @@
374
  "f":1.0
375
  },
376
  "Person":{
377
- "p":0.9895536562,
378
- "r":0.9890840057,
379
- "f":0.9893187752
380
  },
381
  "Animacy":{
382
- "p":0.9982949702,
383
- "r":0.9974446337,
384
- "f":0.9978696208
385
  },
386
  "Voice":{
387
- "p":0.9424460432,
388
- "r":0.9492753623,
389
- "f":0.9458483755
390
  },
391
  "Abbr":{
392
- "p":0.9708029197,
393
  "r":0.83125,
394
- "f":0.8956228956
395
  }
396
  },
397
- "sents_p":0.9219071106,
398
- "sents_r":0.9310917393,
399
- "sents_f":0.9264766625,
400
- "dep_uas":0.8826525829,
401
- "dep_las":0.84903125,
402
  "dep_las_per_type":{
403
  "nmod":{
404
- "p":0.7744391026,
405
- "r":0.7931883463,
406
- "f":0.7837016015
407
  },
408
  "nsubj":{
409
- "p":0.8860443334,
410
- "r":0.8745762712,
411
- "f":0.8802729529
412
  },
413
  "flat:name":{
414
- "p":0.8867313916,
415
- "r":0.8824476651,
416
- "f":0.8845843422
417
  },
418
  "root":{
419
- "p":0.8939267887,
420
- "r":0.8920713989,
421
- "f":0.8929981301
422
  },
423
  "advmod":{
424
- "p":0.8216682646,
425
- "r":0.8224568138,
426
- "f":0.8220623501
427
  },
428
  "mark":{
429
- "p":0.9113573407,
430
- "r":0.9149054505,
431
- "f":0.9131279489
432
  },
433
  "advcl":{
434
- "p":0.6785079929,
435
- "r":0.6552315609,
436
- "f":0.6666666667
437
  },
438
  "obj":{
439
- "p":0.8656898657,
440
- "r":0.8796526055,
441
- "f":0.8726153846
442
  },
443
  "case":{
444
- "p":0.9318299637,
445
- "r":0.9277419355,
446
- "f":0.9297814561
447
  },
448
  "det":{
449
- "p":0.9564393939,
450
- "r":0.9588607595,
451
- "f":0.9576485461
452
  },
453
  "obl":{
454
- "p":0.7561669829,
455
- "r":0.7212669683,
456
- "f":0.7383047707
457
  },
458
  "aux":{
459
- "p":0.9432234432,
460
- "r":0.9321266968,
461
- "f":0.9376422394
462
  },
463
  "acl:relcl":{
464
- "p":0.7780269058,
465
- "r":0.7815315315,
466
- "f":0.7797752809
467
  },
468
  "iobj":{
469
- "p":0.8024691358,
470
- "r":0.7386363636,
471
- "f":0.7692307692
472
  },
473
  "xcomp":{
474
- "p":0.6777041943,
475
- "r":0.6961451247,
476
- "f":0.6868008949
477
  },
478
  "cc":{
479
- "p":0.9162790698,
480
- "r":0.9113338473,
481
- "f":0.9137997681
482
  },
483
  "conj":{
484
- "p":0.6964410328,
485
- "r":0.7247639797,
486
- "f":0.7103202847
487
  },
488
  "amod":{
489
- "p":0.9262644729,
490
- "r":0.920654149,
491
- "f":0.9234507898
492
  },
493
  "nummod":{
494
- "p":0.9143968872,
495
- "r":0.9591836735,
496
- "f":0.9362549801
497
  },
498
  "compound:prt":{
499
- "p":0.803030303,
500
- "r":0.7653429603,
501
- "f":0.7837338262
502
  },
503
  "cop":{
504
- "p":0.856812933,
505
- "r":0.884386174,
506
- "f":0.8703812317
507
  },
508
  "appos":{
509
- "p":0.2794117647,
510
- "r":0.19,
511
- "f":0.2261904762
512
  },
513
  "ccomp":{
514
- "p":0.7955390335,
515
- "r":0.842519685,
516
- "f":0.8183556405
517
- },
518
- "expl":{
519
- "p":0.7128463476,
520
- "r":0.7648648649,
521
- "f":0.7379400261
522
  },
523
  "acl":{
524
- "p":0.658008658,
525
- "r":0.6129032258,
526
- "f":0.6346555324
527
  },
528
  "csubj":{
529
- "p":0.7230769231,
530
- "r":0.6861313869,
531
- "f":0.7041198502
 
 
 
 
 
532
  },
533
  "nsubj:pass":{
534
- "p":0.862244898,
535
- "r":0.7824074074,
536
- "f":0.8203883495
537
  },
538
  "aux:pass":{
539
- "p":0.9464285714,
540
- "r":0.8833333333,
541
- "f":0.9137931034
542
- },
543
- "parataxis":{
544
- "p":0.8255033557,
545
- "r":0.6542553191,
546
- "f":0.7299703264
547
  },
548
  "acl:cleft":{
549
- "p":0.4333333333,
550
- "r":0.4814814815,
551
- "f":0.4561403509
552
  },
553
  "orphan":{
554
- "p":0.1428571429,
555
- "r":0.0384615385,
556
- "f":0.0606060606
557
  },
558
  "dep":{
559
  "p":0.0,
@@ -565,20 +561,25 @@
565
  "r":0.0,
566
  "f":0.0
567
  },
568
- "flat:foreign":{
569
- "p":0.2,
570
- "r":0.1612903226,
571
- "f":0.1785714286
572
  },
573
  "compound":{
574
- "p":0.9285714286,
575
- "r":0.3170731707,
576
- "f":0.4727272727
 
 
 
 
 
577
  },
578
  "discourse":{
579
- "p":0.7272727273,
580
- "r":0.347826087,
581
- "f":0.4705882353
582
  },
583
  "csubj:pass":{
584
  "p":0.0,
@@ -586,54 +587,54 @@
586
  "f":0.0
587
  }
588
  },
589
- "lemma_acc":0.9686243182,
590
- "tag_acc":0.9671340808,
591
- "ents_p":0.7655003069,
592
- "ents_r":0.7387440758,
593
- "ents_f":0.7518842327,
594
  "ents_per_type":{
595
  "PER":{
596
- "p":0.8068739771,
597
- "r":0.8068739771,
598
- "f":0.8068739771
599
  },
600
- "ORG":{
601
- "p":0.7772511848,
602
- "r":0.8118811881,
603
- "f":0.794188862
604
  },
605
  "GPE_LOC":{
606
- "p":0.7546468401,
607
- "r":0.7837837838,
608
- "f":0.7689393939
609
  },
610
- "PROD":{
611
- "p":0.65625,
612
- "r":0.5185185185,
613
- "f":0.5793103448
614
- },
615
- "DRV":{
616
- "p":0.7692307692,
617
- "r":0.7594936709,
618
- "f":0.7643312102
619
  },
620
  "LOC":{
621
- "p":0.652173913,
622
- "r":0.4128440367,
623
- "f":0.5056179775
 
 
 
 
 
624
  },
625
  "GPE_ORG":{
626
- "p":0.7142857143,
627
- "r":0.5454545455,
628
- "f":0.618556701
629
  },
630
  "EVT":{
631
- "p":0.4,
632
  "r":0.4444444444,
633
- "f":0.4210526316
634
  }
635
  },
636
- "speed":10943.0978477171
637
  },
638
  "sources":[
639
  {
 
1
  {
2
  "lang":"nb",
3
  "name":"core_news_sm",
4
+ "version":"3.4.0",
5
  "description":"Norwegian (Bokm\u00e5l) pipeline optimized for CPU. Components: tok2vec, morphologizer, parser, lemmatizer (trainable_lemmatizer), senter, ner, attribute_ruler.",
6
  "author":"Explosion",
7
  "email":"contact@explosion.ai",
8
  "url":"https://explosion.ai",
9
  "license":"MIT",
10
+ "spacy_version":">=3.4.0,<3.5.0",
11
+ "spacy_git_version":"dd038b536",
12
  "vectors":{
13
  "width":0,
14
  "vectors":0,
 
142
  "Definite=Ind|Gender=Masc|Number=Sing|POS=DET|PronType=Dem",
143
  "Case=Gen|Definite=Def|Gender=Fem|Number=Plur|POS=NOUN",
144
  "Case=Gen|Gender=Neut|Number=Sing|POS=DET|PronType=Dem",
145
+ "POS=SPACE",
146
  "Animacy=Hum|Number=Sing|POS=PRON|PronType=Art,Prs",
147
  "Mood=Imp|POS=AUX|VerbForm=Fin",
148
  "Number=Plur|POS=PRON|Person=3|PronType=Prs,Tot",
 
303
  "token_p":0.997080292,
304
  "token_r":0.9953256895,
305
  "token_f":0.9962022181,
306
+ "pos_acc":0.9676832796,
307
+ "morph_acc":0.9535447607,
308
+ "morph_micro_p":0.9699474698,
309
+ "morph_micro_r":0.9617438158,
310
+ "morph_micro_f":0.9658282229,
311
  "morph_per_feat":{
312
  "Definite":{
313
+ "p":0.973768983,
314
+ "r":0.9599637065,
315
+ "f":0.9668170655
316
  },
317
  "Gender":{
318
+ "p":0.9396139882,
319
+ "r":0.9327515887,
320
+ "f":0.9361702128
321
  },
322
  "Number":{
323
+ "p":0.9708716276,
324
+ "r":0.9597040076,
325
+ "f":0.9652555175
326
  },
327
  "Mood":{
328
+ "p":0.979197995,
329
+ "r":0.9769942486,
330
+ "f":0.9780948805
331
  },
332
  "Tense":{
333
+ "p":0.9801057668,
334
+ "r":0.9801057668,
335
+ "f":0.9801057668
336
  },
337
  "VerbForm":{
338
+ "p":0.9670096358,
339
+ "r":0.9649608866,
340
+ "f":0.9659841749
341
  },
342
  "Degree":{
343
+ "p":0.9647592463,
344
+ "r":0.9498454139,
345
+ "f":0.9572442444
346
  },
347
  "PronType":{
348
+ "p":0.9887323944,
349
+ "r":0.984253667,
350
+ "f":0.9864879472
351
  },
352
  "Poss":{
353
+ "p":0.996031746,
354
  "r":0.9920948617,
355
+ "f":0.9940594059
356
  },
357
  "Case":{
358
+ "p":0.9933184855,
359
+ "r":0.9878183832,
360
+ "f":0.9905607996
361
  },
362
  "Reflex":{
363
  "p":1.0,
 
375
  "f":1.0
376
  },
377
  "Person":{
378
+ "p":0.9886201991,
379
+ "r":0.9895586141,
380
+ "f":0.9890891841
381
  },
382
  "Animacy":{
383
+ "p":0.996592845,
384
+ "r":0.996592845,
385
+ "f":0.996592845
386
  },
387
  "Voice":{
388
+ "p":0.9361702128,
389
+ "r":0.9565217391,
390
+ "f":0.9462365591
391
  },
392
  "Abbr":{
393
+ "p":0.9779411765,
394
  "r":0.83125,
395
+ "f":0.8986486486
396
  }
397
  },
398
+ "sents_p":0.9325331126,
399
+ "sents_r":0.9352428394,
400
+ "sents_f":0.9338860104,
401
+ "dep_uas":0.8828806301,
402
+ "dep_las":0.8486771164,
403
  "dep_las_per_type":{
404
  "nmod":{
405
+ "p":0.7644,
406
+ "r":0.7841608535,
407
+ "f":0.7741543447
408
  },
409
  "nsubj":{
410
+ "p":0.8836848635,
411
+ "r":0.8779661017,
412
+ "f":0.8808162003
413
  },
414
  "flat:name":{
415
+ "p":0.856466877,
416
+ "r":0.8743961353,
417
+ "f":0.8653386454
418
  },
419
  "root":{
420
+ "p":0.8972118186,
421
+ "r":0.8949771689,
422
+ "f":0.8960931006
423
  },
424
  "advmod":{
425
+ "p":0.8163950144,
426
+ "r":0.8171785029,
427
+ "f":0.8167865707
428
  },
429
  "mark":{
430
+ "p":0.9122905028,
431
+ "r":0.9082313682,
432
+ "f":0.9102564103
433
  },
434
  "advcl":{
435
+ "p":0.6868327402,
436
+ "r":0.6620926244,
437
+ "f":0.6742358079
438
  },
439
  "obj":{
440
+ "p":0.8679588128,
441
+ "r":0.8889578164,
442
+ "f":0.8783328226
443
  },
444
  "case":{
445
+ "p":0.9327817994,
446
+ "r":0.9310967742,
447
+ "f":0.9319385251
448
  },
449
  "det":{
450
+ "p":0.9608091024,
451
+ "r":0.9620253165,
452
+ "f":0.9614168248
453
  },
454
  "obl":{
455
+ "p":0.7551117451,
456
+ "r":0.7185520362,
457
+ "f":0.7363783909
458
  },
459
  "aux":{
460
+ "p":0.9340560072,
461
+ "r":0.9357466063,
462
+ "f":0.9349005425
463
  },
464
  "acl:relcl":{
465
+ "p":0.8148148148,
466
+ "r":0.7927927928,
467
+ "f":0.803652968
468
  },
469
  "iobj":{
470
+ "p":0.7313432836,
471
+ "r":0.5568181818,
472
+ "f":0.6322580645
473
  },
474
  "xcomp":{
475
+ "p":0.6907894737,
476
+ "r":0.7142857143,
477
+ "f":0.7023411371
478
  },
479
  "cc":{
480
+ "p":0.9068322981,
481
+ "r":0.900539707,
482
+ "f":0.9036750484
483
  },
484
  "conj":{
485
+ "p":0.7009873061,
486
+ "r":0.721859114,
487
+ "f":0.7112701252
488
  },
489
  "amod":{
490
+ "p":0.9233110164,
491
+ "r":0.9188370684,
492
+ "f":0.9210686096
493
  },
494
  "nummod":{
495
+ "p":0.8996138996,
496
+ "r":0.9510204082,
497
+ "f":0.9246031746
498
  },
499
  "compound:prt":{
500
+ "p":0.8429118774,
501
+ "r":0.7942238267,
502
+ "f":0.8178438662
503
  },
504
  "cop":{
505
+ "p":0.858974359,
506
+ "r":0.8784266985,
507
+ "f":0.8685916323
508
  },
509
  "appos":{
510
+ "p":0.4242424242,
511
+ "r":0.28,
512
+ "f":0.3373493976
513
  },
514
  "ccomp":{
515
+ "p":0.8028673835,
516
+ "r":0.8818897638,
517
+ "f":0.8405253283
 
 
 
 
 
518
  },
519
  "acl":{
520
+ "p":0.6394849785,
521
+ "r":0.6008064516,
522
+ "f":0.6195426195
523
  },
524
  "csubj":{
525
+ "p":0.7307692308,
526
+ "r":0.6934306569,
527
+ "f":0.7116104869
528
+ },
529
+ "expl":{
530
+ "p":0.694235589,
531
+ "r":0.7486486486,
532
+ "f":0.7204161248
533
  },
534
  "nsubj:pass":{
535
+ "p":0.8316831683,
536
+ "r":0.7777777778,
537
+ "f":0.8038277512
538
  },
539
  "aux:pass":{
540
+ "p":0.9203539823,
541
+ "r":0.8666666667,
542
+ "f":0.8927038627
 
 
 
 
 
543
  },
544
  "acl:cleft":{
545
+ "p":0.4615384615,
546
+ "r":0.4444444444,
547
+ "f":0.4528301887
548
  },
549
  "orphan":{
550
+ "p":0.0,
551
+ "r":0.0,
552
+ "f":0.0
553
  },
554
  "dep":{
555
  "p":0.0,
 
561
  "r":0.0,
562
  "f":0.0
563
  },
564
+ "parataxis":{
565
+ "p":0.8243243243,
566
+ "r":0.6489361702,
567
+ "f":0.7261904762
568
  },
569
  "compound":{
570
+ "p":0.9,
571
+ "r":0.2195121951,
572
+ "f":0.3529411765
573
+ },
574
+ "flat:foreign":{
575
+ "p":0.3888888889,
576
+ "r":0.2258064516,
577
+ "f":0.2857142857
578
  },
579
  "discourse":{
580
+ "p":0.6923076923,
581
+ "r":0.3913043478,
582
+ "f":0.5
583
  },
584
  "csubj:pass":{
585
  "p":0.0,
 
587
  "f":0.0
588
  }
589
  },
590
+ "lemma_acc":0.9687620517,
591
+ "tag_acc":0.9676832796,
592
+ "ents_p":0.7702786378,
593
+ "ents_r":0.7369668246,
594
+ "ents_f":0.753254617,
595
  "ents_per_type":{
596
  "PER":{
597
+ "p":0.8344262295,
598
+ "r":0.8330605565,
599
+ "f":0.8337428337
600
  },
601
+ "PROD":{
602
+ "p":0.6240601504,
603
+ "r":0.512345679,
604
+ "f":0.5627118644
605
  },
606
  "GPE_LOC":{
607
+ "p":0.7791164659,
608
+ "r":0.749034749,
609
+ "f":0.7637795276
610
  },
611
+ "ORG":{
612
+ "p":0.7772397094,
613
+ "r":0.7945544554,
614
+ "f":0.7858017136
 
 
 
 
 
615
  },
616
  "LOC":{
617
+ "p":0.5208333333,
618
+ "r":0.4587155963,
619
+ "f":0.487804878
620
+ },
621
+ "DRV":{
622
+ "p":0.7866666667,
623
+ "r":0.746835443,
624
+ "f":0.7662337662
625
  },
626
  "GPE_ORG":{
627
+ "p":0.7058823529,
628
+ "r":0.4363636364,
629
+ "f":0.5393258427
630
  },
631
  "EVT":{
632
+ "p":0.8,
633
  "r":0.4444444444,
634
+ "f":0.5714285714
635
  }
636
  },
637
+ "speed":13912.0236342851
638
  },
639
  "sources":[
640
  {
morphologizer/cfg CHANGED
@@ -123,6 +123,7 @@
123
  "Definite=Ind|Gender=Masc|Number=Sing|POS=DET|PronType=Dem":"Definite=Ind|Gender=Masc|Number=Sing|PronType=Dem",
124
  "Case=Gen|Definite=Def|Gender=Fem|Number=Plur|POS=NOUN":"Case=Gen|Definite=Def|Gender=Fem|Number=Plur",
125
  "Case=Gen|Gender=Neut|Number=Sing|POS=DET|PronType=Dem":"Case=Gen|Gender=Neut|Number=Sing|PronType=Dem",
 
126
  "Animacy=Hum|Number=Sing|POS=PRON|PronType=Art,Prs":"Animacy=Hum|Number=Sing|PronType=Art,Prs",
127
  "Mood=Imp|POS=AUX|VerbForm=Fin":"Mood=Imp|VerbForm=Fin",
128
  "Number=Plur|POS=PRON|Person=3|PronType=Prs,Tot":"Number=Plur|Person=3|PronType=Prs,Tot",
@@ -328,6 +329,7 @@
328
  "Definite=Ind|Gender=Masc|Number=Sing|POS=DET|PronType=Dem":90,
329
  "Case=Gen|Definite=Def|Gender=Fem|Number=Plur|POS=NOUN":92,
330
  "Case=Gen|Gender=Neut|Number=Sing|POS=DET|PronType=Dem":90,
 
331
  "Animacy=Hum|Number=Sing|POS=PRON|PronType=Art,Prs":95,
332
  "Mood=Imp|POS=AUX|VerbForm=Fin":87,
333
  "Number=Plur|POS=PRON|Person=3|PronType=Prs,Tot":95,
 
123
  "Definite=Ind|Gender=Masc|Number=Sing|POS=DET|PronType=Dem":"Definite=Ind|Gender=Masc|Number=Sing|PronType=Dem",
124
  "Case=Gen|Definite=Def|Gender=Fem|Number=Plur|POS=NOUN":"Case=Gen|Definite=Def|Gender=Fem|Number=Plur",
125
  "Case=Gen|Gender=Neut|Number=Sing|POS=DET|PronType=Dem":"Case=Gen|Gender=Neut|Number=Sing|PronType=Dem",
126
+ "POS=SPACE":"",
127
  "Animacy=Hum|Number=Sing|POS=PRON|PronType=Art,Prs":"Animacy=Hum|Number=Sing|PronType=Art,Prs",
128
  "Mood=Imp|POS=AUX|VerbForm=Fin":"Mood=Imp|VerbForm=Fin",
129
  "Number=Plur|POS=PRON|Person=3|PronType=Prs,Tot":"Number=Plur|Person=3|PronType=Prs,Tot",
 
329
  "Definite=Ind|Gender=Masc|Number=Sing|POS=DET|PronType=Dem":90,
330
  "Case=Gen|Definite=Def|Gender=Fem|Number=Plur|POS=NOUN":92,
331
  "Case=Gen|Gender=Neut|Number=Sing|POS=DET|PronType=Dem":90,
332
+ "POS=SPACE":103,
333
  "Animacy=Hum|Number=Sing|POS=PRON|PronType=Art,Prs":95,
334
  "Mood=Imp|POS=AUX|VerbForm=Fin":87,
335
  "Number=Plur|POS=PRON|Person=3|PronType=Prs,Tot":95,
morphologizer/model CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b5ce9e33d7eb0476ac53bb10d9dcb951c6ad0c4b67b5956c354e7f52e4f307a0
3
- size 79201
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:17cfb00cce8099991f07c5fb940f69fab2eb623f7c5a961e38e780a86bdcff78
3
+ size 79589
nb_core_news_sm-any-py3-none-any.whl CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:bf8c67018ce5509e0cb1d405b2475db1ff20dab59db89c5e1ca3a455aec9898a
3
- size 12489487
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ae9747927cef239565a8d1c454b0df4f4d7698599eba1bc92d1f4a50dd0baa85
3
+ size 12474334
ner/model CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c3bb3a7a0f649ee154d87380396c29ca90c33527cb9097b0d6f558521753f5af
3
  size 6275402
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:027ef8651b9eebebc9f90826a79a37f6329139b961cb77ecdac9bfd827b9fe86
3
  size 6275402
ner/moves CHANGED
@@ -1 +1 @@
1
- ��moves��{"0":{},"1":{"PER":6378,"ORG":3793,"GPE_LOC":2278,"PROD":1284,"LOC":842,"DRV":640,"GPE_ORG":410,"EVT":201,"MISC":12},"2":{"PER":6378,"ORG":3793,"GPE_LOC":2278,"PROD":1284,"LOC":842,"DRV":640,"GPE_ORG":410,"EVT":201,"MISC":12},"3":{"PER":6378,"ORG":3793,"GPE_LOC":2278,"PROD":1284,"LOC":842,"DRV":640,"GPE_ORG":410,"EVT":201,"MISC":12},"4":{"PER":6378,"ORG":3793,"GPE_LOC":2278,"PROD":1284,"LOC":842,"DRV":640,"GPE_ORG":410,"EVT":201,"MISC":12,"":1},"5":{"":1}}�cfg��neg_key�
 
1
+ ��moves��{"0":{},"1":{"PER":6387,"ORG":3797,"GPE_LOC":2281,"PROD":1286,"LOC":842,"DRV":641,"GPE_ORG":410,"EVT":201,"MISC":12},"2":{"PER":6387,"ORG":3797,"GPE_LOC":2281,"PROD":1286,"LOC":842,"DRV":641,"GPE_ORG":410,"EVT":201,"MISC":12},"3":{"PER":6387,"ORG":3797,"GPE_LOC":2281,"PROD":1286,"LOC":842,"DRV":641,"GPE_ORG":410,"EVT":201,"MISC":12},"4":{"PER":6387,"ORG":3797,"GPE_LOC":2281,"PROD":1286,"LOC":842,"DRV":641,"GPE_ORG":410,"EVT":201,"MISC":12,"":1},"5":{"":1}}�cfg��neg_key�
parser/model CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:727ffbff43f25594eed8339baabc402b762c7ee505c02de03406f79e05e6a005
3
  size 308989
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b78f8cbf6ffc4149c6b99d03f5e288944f0843218ee5b68840ee9c64f6c90ca9
3
  size 308989
parser/moves CHANGED
@@ -1 +1 @@
1
- ��moves�~{"0":{"":134900},"1":{"":93292},"2":{"case":25334,"nsubj":18615,"mark":12192,"amod":10711,"det":10563,"punct":10025,"advmod":9967,"cc":8383,"aux":6803,"cop":5514,"nmod":5449,"obl":2945,"expl":2092,"nummod":1827,"nsubj:pass":1366,"aux:pass":862,"advcl":759,"obj":572,"compound":239,"discourse":89,"csubj":88,"compound:prt":83,"iobj":77,"xcomp":53,"acl||nsubj":51,"dep":0},"3":{"punct":19146,"obl":11656,"obj":10276,"nmod":10154,"conj":9408,"advmod":4274,"flat:name":4150,"nsubj":3717,"advcl":3241,"xcomp":3108,"acl:relcl":3075,"compound:prt":1947,"ccomp":1749,"acl":1257,"parataxis":1103,"csubj":693,"appos":637,"iobj":469,"expl":457,"flat:foreign":365,"amod":328,"acl:cleft":255,"cop":192,"det":179,"orphan":163,"advcl||advmod":161,"acl||nsubj":161,"case||obl":129,"obl||advmod":87,"nsubj:pass":81,"obl||amod":65,"obl||det":56,"appos||nsubj":38,"acl||nsubj:pass":34,"dep":0},"4":{"ROOT":15696}}�cfg��neg_key�
 
1
+ ��moves��{"0":{"":134903},"1":{"":94491},"2":{"case":25334,"nsubj":18615,"mark":12192,"amod":10711,"det":10563,"punct":10025,"advmod":9967,"cc":8383,"aux":6803,"cop":5514,"nmod":5449,"obl":2945,"expl":2092,"nummod":1827,"nsubj:pass":1366,"aux:pass":862,"advcl":759,"obj":572,"compound":239,"discourse":89,"csubj":88,"compound:prt":83,"iobj":77,"xcomp":53,"acl||nsubj":51,"dep":0},"3":{"punct":19146,"obl":11656,"obj":10276,"nmod":10154,"conj":9408,"advmod":4274,"flat:name":4150,"nsubj":3717,"advcl":3241,"xcomp":3108,"acl:relcl":3075,"compound:prt":1947,"ccomp":1749,"acl":1257,"dep":1199,"parataxis":1103,"csubj":693,"appos":637,"iobj":469,"expl":457,"flat:foreign":365,"amod":328,"acl:cleft":255,"cop":192,"det":179,"orphan":163,"advcl||advmod":161,"acl||nsubj":161,"case||obl":129,"obl||advmod":87,"nsubj:pass":81,"obl||amod":65,"obl||det":56,"appos||nsubj":38,"acl||nsubj:pass":34},"4":{"ROOT":15696}}�cfg��neg_key�
senter/model CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5516bc7097f3fa3a7281019aca23473ed9fb29a60f582dd0fd59ff8b72589e02
3
  size 197089
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a4a6e9d55ce6a3a0f205d0bea15eaae04712ab41340a16978644eb66fa3e9bd9
3
  size 197089
tok2vec/model CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b74769b286263e8cc4468b3e892808486256c343d2bd411042b672a5782d77d6
3
  size 6139229
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:361abf51a0166a31fe77592903ca6850e76c22a420076dbc3b395f56c5e4523d
3
  size 6139229
vocab/strings.json CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f50f0a72c6e46876bddbc301881c4f9436e3000b94c82e7c3ac46ab20edc4eaf
3
- size 813963
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:52eadd082fbac7de5c607eabb89a5afb92facf888acb7c85c34ea98b492c57e1
3
+ size 821451