firqaaa committed on
Commit
968e575
1 Parent(s): 355be29

Update spaCy pipeline

Browse files
README.md CHANGED
@@ -13,68 +13,68 @@ model-index:
13
  metrics:
14
  - name: NER Precision
15
  type: precision
16
- value: 0.0
17
  - name: NER Recall
18
  type: recall
19
- value: 0.0
20
  - name: NER F Score
21
  type: f_score
22
- value: 0.0
23
  - task:
24
  name: TAG
25
  type: token-classification
26
  metrics:
27
  - name: TAG (XPOS) Accuracy
28
  type: accuracy
29
- value: 0.9058429775
30
  - task:
31
  name: POS
32
  type: token-classification
33
  metrics:
34
  - name: POS (UPOS) Accuracy
35
  type: accuracy
36
- value: 0.911077953
37
  - task:
38
  name: MORPH
39
  type: token-classification
40
  metrics:
41
  - name: Morph (UFeats) Accuracy
42
  type: accuracy
43
- value: 0.924529063
44
  - task:
45
  name: LEMMA
46
  type: token-classification
47
  metrics:
48
  - name: Lemma Accuracy
49
  type: accuracy
50
- value: 0.9356240444
51
  - task:
52
  name: UNLABELED_DEPENDENCIES
53
  type: token-classification
54
  metrics:
55
  - name: Unlabeled Attachment Score (UAS)
56
  type: f_score
57
- value: 0.779082277
58
  - task:
59
  name: LABELED_DEPENDENCIES
60
  type: token-classification
61
  metrics:
62
  - name: Labeled Attachment Score (LAS)
63
  type: f_score
64
- value: 0.6971807939
65
  - task:
66
  name: SENTS
67
  type: token-classification
68
  metrics:
69
  - name: Sentences F-Score
70
  type: f_score
71
- value: 0.9099018733
72
  ---
73
  | Feature | Description |
74
  | --- | --- |
75
  | **Name** | `id_core_news_sm` |
76
- | **Version** | `0.0.2` |
77
- | **spaCy** | `>=3.7.4,<3.8.0` |
78
  | **Default Pipeline** | `tok2vec`, `ner`, `tagger`, `morphologizer`, `trainable_lemmatizer`, `parser` |
79
  | **Components** | `tok2vec`, `ner`, `tagger`, `morphologizer`, `trainable_lemmatizer`, `parser` |
80
  | **Vectors** | 0 keys, 0 unique vectors (0 dimensions) |
@@ -86,13 +86,14 @@ model-index:
86
 
87
  <details>
88
 
89
- <summary>View label scheme (166 labels for 3 components)</summary>
90
 
91
  | Component | Labels |
92
  | --- | --- |
93
- | **`tagger`** | `APP`, `ASP`, `ASP+PS3`, `ASS`, `B--`, `B--+PS3`, `CC-`, `CCONJ`, `CD-`, `CO-`, `D--`, `D--+PS3`, `F--`, `F--+PS2`, `G--`, `G--+PS3`, `H--`, `I--`, `M--`, `M--+PS3`, `NOUN`, `NPD`, `NSD`, `NSD+PS3`, `NSF`, `NSM`, `NUM`, `O--`, `PP1`, `PP2`, `PP3`, `PROPN`, `PS1`, `PS1+VSA`, `PS2`, `PS3`, `R--`, `R--+PS3`, `S--`, `SYM`, `T--`, `VERB`, `VPA`, `VSA`, `VSA+PS2`, `VSA+PS3`, `VSP`, `W--`, `X--`, `Z--` |
94
- | **`morphologizer`** | `POS=PROPN`, `POS=AUX`, `Definite=Ind\|POS=DET\|PronType=Art`, `Number=Sing\|POS=NOUN`, `POS=PRON\|PronType=Rel`, `Mood=Ind\|POS=VERB\|Voice=Pass`, `POS=ADP`, `POS=PUNCT`, `POS=NOUN`, `POS=ADV`, `POS=CCONJ`, `POS=SCONJ`, `Mood=Ind\|POS=VERB\|Voice=Act`, `POS=VERB`, `POS=DET\|PronType=Tot`, `Number=Sing\|POS=PRON\|Person=3\|PronType=Prs`, `Number=Plur\|POS=PRON\|Person=3\|PronType=Prs`, `POS=PRON\|PronType=Prs\|Reflex=Yes`, `POS=DET\|PronType=Dem`, `NumType=Card\|POS=NUM`, `POS=ADJ`, `Number=Plur\|POS=DET\|PronType=Ind`, `NumType=Card\|POS=NUM\|PronType=Tot`, `POS=PART\|Polarity=Neg`, `POS=PRON\|PronType=Int`, `NumType=Ord\|POS=ADJ`, `POS=PART`, `POS=PRON\|PronType=Dem`, `POS=DET\|PronType=Ind`, `Number=Plur\|POS=NOUN`, `Number=Sing\|POS=PRON\|Person=1\|Polite=Form\|PronType=Prs`, `POS=ADV\|PronType=Int`, `Clusivity=In\|Number=Plur\|POS=PRON\|Person=1\|PronType=Prs`, `Definite=Def\|POS=DET\|PronType=Art`, `POS=SYM`, `Degree=Sup\|POS=ADJ`, `POS=INTJ`, `Number=Sing\|POS=PRON\|Person=2\|Polite=Infm\|PronType=Prs`, `POS=ADV\|PronType=Ind`, `Number=Sing\|POS=PRON\|Person=3\|Polite=Form\|PronType=Prs`, `Number=Sing\|POS=PRON\|Person=1\|Polite=Infm\|PronType=Prs`, `Number=Sing\|POS=PRON\|PronType=Ind`, `POS=VERB\|Voice=Act`, `POS=DET\|PronType=Emp`, `POS=VERB\|Voice=Pass`, `POS=ADV\|PronType=Dem`, `POS=NOUN\|Typo=Yes`, `POS=ADP\|Typo=Yes`, `Number=Plur\|POS=PRON\|PronType=Ind`, `POS=VERB\|Typo=Yes\|Voice=Pass`, `POS=X`, `POS=PRON\|PronType=Tot`, `POS=SCONJ\|Typo=Yes`, `Number=Plur\|POS=PRON\|Person=2\|Polite=Infm\|PronType=Prs`, `NumType=Card\|POS=NUM\|Typo=Yes`, `Clusivity=Ex\|Number=Plur\|POS=PRON\|Person=1\|PronType=Prs`, `Number=Sing\|POS=PRON\|Person=2\|Polite=Form\|PronType=Prs`, `Foreign=Yes\|POS=X`, `POS=ADV\|PronType=Rel`, `Mood=Imp\|POS=VERB\|Voice=Act`, `Number=Sing\|POS=NOUN\|Typo=Yes`, `POS=PROPN\|Typo=Yes`, `POS=DET`, `Number=Sing\|POS=DET\|PronType=Ind`, `POS=DET\|PronType=Ind\|Typo=Yes`, `Abbr=Yes\|POS=DET\|PronType=Dem`, 
`POS=PRON\|PronType=Ind`, `POS=VERB\|Typo=Yes`, `Abbr=Yes\|POS=PROPN`, `Abbr=Yes\|POS=PRON\|PronType=Rel`, `Number=Plur\|POS=PRON\|PronType=Int`, `Abbr=Yes\|POS=PART\|Polarity=Neg`, `POS=ADV\|PronType=Tot`, `Abbr=Yes\|POS=ADV`, `POS=ADV\|Typo=Yes`, `POS=X\|Typo=Yes`, `Number=Sing\|POS=PRON\|Person=2\|PronType=Prs`, `POS=ADV\|PronType=Int\|Typo=Yes`, `NumType=Ord\|POS=ADJ\|Typo=Yes` |
95
- | **`parser`** | `ROOT`, `acl`, `acl:relcl`, `advcl`, `advmod`, `advmod:emph`, `amod`, `appos`, `aux`, `case`, `case:adv`, `cc`, `ccomp`, `compound`, `conj`, `cop`, `dep`, `det`, `fixed`, `flat`, `flat:foreign`, `flat:name`, `mark`, `nmod`, `nmod:lmod`, `nmod:poss`, `nmod:tmod`, `nsubj`, `nsubj:pass`, `nummod`, `obj`, `obl`, `obl:agent`, `obl:tmod`, `parataxis`, `punct`, `xcomp` |
 
96
 
97
  </details>
98
 
@@ -100,22 +101,21 @@ model-index:
100
 
101
  | Type | Score |
102
  | --- | --- |
103
- | `ENTS_F` | 0.00 |
104
- | `ENTS_P` | 0.00 |
105
- | `ENTS_R` | 0.00 |
106
- | `ENTS_PER_TYPE` | 0.00 |
107
- | `TAG_ACC` | 90.58 |
108
- | `POS_ACC` | 91.11 |
109
- | `MORPH_ACC` | 92.45 |
110
- | `LEMMA_ACC` | 93.56 |
111
- | `DEP_UAS` | 77.91 |
112
- | `DEP_LAS` | 69.72 |
113
- | `SENTS_P` | 90.75 |
114
- | `SENTS_R` | 91.23 |
115
- | `SENTS_F` | 90.99 |
116
- | `TOK2VEC_LOSS` | 834213.16 |
117
- | `NER_LOSS` | 0.00 |
118
- | `TAGGER_LOSS` | 57215.06 |
119
- | `MORPHOLOGIZER_LOSS` | 124661.48 |
120
- | `TRAINABLE_LEMMATIZER_LOSS` | 24560.71 |
121
- | `PARSER_LOSS` | 882915.56 |
 
13
  metrics:
14
  - name: NER Precision
15
  type: precision
16
+ value: 0.7083118224
17
  - name: NER Recall
18
  type: recall
19
+ value: 0.7101449275
20
  - name: NER F Score
21
  type: f_score
22
+ value: 0.7092271905
23
  - task:
24
  name: TAG
25
  type: token-classification
26
  metrics:
27
  - name: TAG (XPOS) Accuracy
28
  type: accuracy
29
+ value: 0.924552227
30
  - task:
31
  name: POS
32
  type: token-classification
33
  metrics:
34
  - name: POS (UPOS) Accuracy
35
  type: accuracy
36
+ value: 0.9237476221
37
  - task:
38
  name: MORPH
39
  type: token-classification
40
  metrics:
41
  - name: Morph (UFeats) Accuracy
42
  type: accuracy
43
+ value: 0.9444730688
44
  - task:
45
  name: LEMMA
46
  type: token-classification
47
  metrics:
48
  - name: Lemma Accuracy
49
  type: accuracy
50
+ value: 0.9719515094
51
  - task:
52
  name: UNLABELED_DEPENDENCIES
53
  type: token-classification
54
  metrics:
55
  - name: Unlabeled Attachment Score (UAS)
56
  type: f_score
57
+ value: 0.817370892
58
  - task:
59
  name: LABELED_DEPENDENCIES
60
  type: token-classification
61
  metrics:
62
  - name: Labeled Attachment Score (LAS)
63
  type: f_score
64
+ value: 0.7299441393
65
  - task:
66
  name: SENTS
67
  type: token-classification
68
  metrics:
69
  - name: Sentences F-Score
70
  type: f_score
71
+ value: 0.8908450704
72
  ---
73
  | Feature | Description |
74
  | --- | --- |
75
  | **Name** | `id_core_news_sm` |
76
+ | **Version** | `0.0.3` |
77
+ | **spaCy** | `>=3.7.0,<3.8.0` |
78
  | **Default Pipeline** | `tok2vec`, `ner`, `tagger`, `morphologizer`, `trainable_lemmatizer`, `parser` |
79
  | **Components** | `tok2vec`, `ner`, `tagger`, `morphologizer`, `trainable_lemmatizer`, `parser` |
80
  | **Vectors** | 0 keys, 0 unique vectors (0 dimensions) |
 
86
 
87
  <details>
88
 
89
+ <summary>View label scheme (321 labels for 4 components)</summary>
90
 
91
  | Component | Labels |
92
  | --- | --- |
93
+ | **`ner`** | `CARDINAL`, `DATE`, `EVENT`, `FAC`, `GPE`, `LANGUAGE`, `LAW`, `LOC`, `MONEY`, `NORP`, `ORDINAL`, `ORG`, `PERCENT`, `PERSON`, `PRODUCT`, `QUANTITY`, `TIME`, `WORK_OF_ART` |
94
+ | **`tagger`** | `APP`, `ASP`, `ASP+PS2`, `ASP+PS3`, `ASP+T--`, `ASS`, `ASS+PS3`, `B--`, `B--+PS3`, `B--+T--`, `CC-`, `CC-+PS3`, `CC-+T--`, `CD-`, `CD-+PS3`, `CO-`, `CO-+PS3`, `D--`, `D--+PS2`, `D--+PS3`, `D--+T--`, `F--`, `F--+PS1`, `F--+PS2`, `F--+PS3`, `F--+T--`, `G--`, `G--+PS3`, `G--+T--`, `H--`, `H--+T--`, `I--`, `M--`, `M--+PS3`, `M--+T--`, `NOUN`, `NPD`, `NPD+PS2`, `NPD+PS3`, `NSD`, `NSD+PS1`, `NSD+PS2`, `NSD+PS3`, `NSD+T--`, `NSF`, `NSM`, `NSM+PS3`, `NUM`, `O--`, `PP1`, `PP1+T--`, `PP2`, `PP3`, `PP3+T--`, `PROPN`, `PS1`, `PS1+VSA`, `PS1+VSA+T--`, `PS2`, `PS2+VSA`, `PS3`, `PUNCT`, `R--`, `R--+PS1`, `R--+PS2`, `R--+PS3`, `S--`, `S--+PS3`, `T--`, `VERB`, `VPA`, `VSA`, `VSA+PS1`, `VSA+PS2`, `VSA+PS3`, `VSA+T--`, `VSP`, `VSP+PS3`, `VSP+T--`, `W--`, `W--+T--`, `X`, `X--`, `Z--` |
95
+ | **`morphologizer`** | `POS=PROPN`, `POS=AUX`, `POS=DET\|PronType=Ind`, `Number=Sing\|POS=NOUN`, `POS=PRON\|PronType=Rel`, `Number=Sing\|POS=VERB\|Voice=Pass`, `POS=ADP`, `POS=PUNCT`, `Number=Sing\|POS=PROPN`, `POS=NOUN`, `POS=ADV`, `POS=CCONJ`, `Number=Sing\|POS=VERB\|Voice=Act`, `POS=VERB`, `POS=DET\|PronType=Tot`, `Number=Sing\|Number[psor]=Sing\|POS=NOUN\|Person[psor]=3`, `POS=SCONJ`, `Number=Plur\|POS=PRON\|Person=3\|PronType=Prs`, `POS=DET\|PronType=Dem`, `NumType=Card\|POS=NUM`, `Degree=Pos\|Number=Sing\|POS=NOUN`, `Degree=Pos\|Number=Sing\|POS=ADJ`, `NumType=Card\|POS=DET\|PronType=Ind`, `Degree=Pos\|Number=Sing\|POS=ADP`, `Number[psor]=Sing\|POS=NOUN\|Person[psor]=3`, `Number=Sing\|POS=VERB`, `POS=PRON\|PronType=Int`, `Number=Sing\|POS=ADV\|Voice=Act`, `Number=Sing\|Number[psor]=Sing\|POS=VERB\|Person[psor]=3\|Voice=Act`, `Number=Sing\|POS=ADP\|Voice=Act`, `POS=ADJ`, `Number[psor]=Sing\|POS=ADP\|Person[psor]=3`, `Degree=Pos\|Number=Sing\|POS=DET`, `Degree=Pos\|Number=Sing\|POS=VERB`, `POS=PRON\|PronType=Dem`, `POS=PART\|Polarity=Neg`, `Degree=Pos\|Number=Sing\|Number[psor]=Sing\|POS=NOUN\|Person[psor]=3`, `Number=Sing\|POS=PRON\|Person=1\|Polite=Form\|PronType=Prs`, `Number=Sing\|POS=ADJ`, `Number=Sing\|POS=PRON\|Person=3\|PronType=Prs`, `POS=SYM`, `POS=ADV\|PronType=Int`, `Clusivity=In\|Number=Plur\|POS=PRON\|Person=1\|PronType=Prs`, `Number=Sing\|POS=ADJ\|Voice=Act`, `Degree=Pos\|Number=Sing\|POS=PROPN`, `Degree=Pos\|Number=Sing\|POS=ADV`, `Number=Sing\|Number[psor]=Sing\|POS=VERB\|Person[psor]=3\|Voice=Pass`, `Number=Sing\|Number[psor]=Sing\|POS=NOUN\|Person[psor]=3\|Voice=Act`, `Number=Sing\|POS=PROPN\|Voice=Act`, `Number=Sing\|POS=NOUN\|Voice=Act`, `POS=DET`, `Number=Sing\|POS=DET\|Voice=Act`, `NumType=Card\|POS=PRON\|PronType=Ind`, `Number=Sing\|Number[psor]=Sing\|POS=ADV\|Person[psor]=3`, `Number=Sing\|POS=DET`, `Number=Sing\|POS=ADJ\|Voice=Pass`, `POS=CCONJ\|PronType=Dem`, `Number=Sing\|POS=ADP`, `Number=Sing\|POS=ADV`, 
`Number=Sing\|POS=PRON\|Person=2\|Polite=Infm\|PronType=Prs`, `Number[psor]=Sing\|POS=NOUN\|Person[psor]=2`, `Number=Plur\|Number[psor]=Sing\|POS=NOUN\|Person[psor]=2`, `Number=Sing\|POS=PRON`, `POS=PRON`, `NumType=Card\|POS=ADV\|PronType=Ind`, `NumType=Card\|Number[psor]=Sing\|POS=NUM\|Person[psor]=3`, `Number=Sing\|POS=PRON\|Person=3\|Polite=Form\|PronType=Prs`, `POS=DET\|PronType=Int`, `Number=Sing\|Number[psor]=Sing\|POS=PROPN\|Person[psor]=3`, `Number=Sing\|Number[psor]=Sing\|POS=PROPN\|Person[psor]=1`, `Degree=Pos\|Number=Sing\|POS=SCONJ`, `POS=PRON\|PronType=Ind`, `Number=Sing\|Number[psor]=Sing\|POS=NOUN\|Person[psor]=3\|Voice=Pass`, `POS=VERB\|PronType=Ind`, `Degree=Pos\|Number=Sing\|Number[psor]=Sing\|POS=ADJ\|Person[psor]=3`, `Number=Sing\|POS=SCONJ`, `Degree=Sup\|Number=Sing\|Number[psor]=Sing\|POS=ADJ\|Person[psor]=3`, `Degree=Pos\|Number=Sing\|Number[psor]=Sing\|POS=ADP\|Person[psor]=3`, `Number=Plur\|Number[psor]=Sing\|POS=NOUN\|Person[psor]=3`, `Number=Plur\|POS=NOUN`, `POS=ADV\|PronType=Dem`, `Number=Sing\|POS=VERB\|Person=1\|Voice=Act`, `Degree=Sup\|Number=Sing\|POS=ADJ`, `Number=Sing\|POS=ADP\|Voice=Pass`, `Number[psor]=Sing\|POS=PART\|Person[psor]=3`, `Number=Sing\|POS=NOUN\|Voice=Pass`, `Degree=Pos\|Number=Sing\|Number[psor]=Sing\|POS=CCONJ\|Person[psor]=3`, `POS=PART`, `Number=Sing\|Number[psor]=Sing\|POS=PART\|Person[psor]=3\|Voice=Pass`, `Degree=Sup\|Number=Sing\|POS=ADV`, `Number=Sing\|POS=PRON\|Voice=Act`, `Number=Sing\|Number[psor]=Sing\|POS=PROPN\|Person[psor]=3\|Voice=Act`, `Gender=Masc\|Number=Sing\|POS=PROPN`, `Number[psor]=Sing\|POS=PRON\|Person[psor]=3\|PronType=Tot`, `Degree=Pos\|Number=Sing\|POS=X`, `POS=PRON\|PronType=Tot`, `Degree=Pos\|Number=Sing\|Number[psor]=Sing\|POS=ADV\|Person[psor]=3`, `Degree=Pos\|Number=Sing\|Number[psor]=Sing\|POS=VERB\|Person[psor]=3`, `Number=Sing\|Number[psor]=Sing\|POS=ADP\|Person[psor]=3`, `Number=Sing\|Number[psor]=Sing\|POS=NOUN\|Person[psor]=2`, `POS=SCONJ\|PronType=Int`, 
`Number=Plur\|POS=PRON\|Person=2\|PronType=Prs`, `Number=Sing\|Number[psor]=Sing\|POS=VERB\|Person[psor]=1\|Voice=Act`, `Number[psor]=Sing\|POS=DET\|Person[psor]=3`, `Number=Sing\|Number[psor]=Sing\|POS=PRON\|Person[psor]=3`, `Clusivity=Ex\|Number=Plur\|POS=PRON\|Person=1\|PronType=Prs`, `Number=Plur\|POS=VERB\|Voice=Act`, `Number=Sing\|Number[psor]=Sing\|POS=ADV\|Person[psor]=3\|Voice=Act`, `Degree=Pos\|Number=Sing\|POS=NOUN\|Polarity=Neg`, `POS=X`, `Number[psor]=Sing\|POS=ADJ\|Person[psor]=3`, `Number=Sing\|Number[psor]=Sing\|POS=VERB\|Person[psor]=3`, `Number=Sing\|POS=PRON\|Person=2\|Polite=Form\|PronType=Prs`, `Number=Sing\|POS=PRON\|Person=1\|Polite=Infm\|PronType=Prs`, `Number=Sing\|POS=PROPN\|Voice=Pass`, `POS=ADV\|Polarity=Neg`, `NumType=Card\|Number=Sing\|POS=NUM`, `Number[psor]=Sing\|POS=ADV\|Person[psor]=2`, `Number[psor]=Sing\|POS=ADV\|Person[psor]=3`, `Degree=Sup\|Number=Sing\|POS=PROPN`, `POS=PROPN\|Polarity=Neg`, `Number=Sing\|Number[psor]=Sing\|POS=VERB\|Person[psor]=2\|Voice=Act`, `Number=Sing\|POS=PROPN\|Person=1\|Voice=Act`, `POS=SCONJ\|PronType=Dem`, `Number=Sing\|Number[psor]=Sing\|POS=ADV\|Person[psor]=2\|Voice=Act`, `Number=Sing\|POS=CCONJ`, `Degree=Sup\|Number=Sing\|POS=VERB`, `Number=Sing\|Number[psor]=Sing\|POS=ADJ\|Person[psor]=3`, `Number=Sing\|Number[psor]=Sing\|POS=ADJ\|Person[psor]=3\|Voice=Act`, `Degree=Pos\|Number=Sing\|POS=PRON`, `Number=Sing\|POS=ADV\|Voice=Pass`, `Number[psor]=Sing\|POS=ADP\|Person[psor]=2`, `Number=Sing\|POS=SYM`, `POS=ADJ\|Polarity=Neg`, `Degree=Pos\|NumType=Card\|Number=Sing\|POS=NUM`, `Number=Sing\|Number[psor]=Sing\|POS=SCONJ\|Person[psor]=3`, `Degree=Pos\|Number=Sing\|POS=CCONJ`, `Number[psor]=Sing\|POS=NOUN\|Person[psor]=1`, `Number=Sing\|POS=CCONJ\|Voice=Act`, `Gender=Masc\|Number=Sing\|POS=NOUN`, `Number=Sing\|Number[psor]=Sing\|POS=ADP\|Person[psor]=3\|Voice=Pass`, `Gender=Fem\|Number=Sing\|POS=PROPN`, `POS=VERB\|PronType=Dem`, `Number=Sing\|POS=PRON\|Person=2\|PronType=Prs`, 
`Gender=Masc\|Number=Sing\|Number[psor]=Sing\|POS=NOUN\|Person[psor]=3`, `Number=Sing\|POS=PART\|Voice=Act`, `Degree=Sup\|Number=Sing\|Number[psor]=Sing\|POS=NOUN\|Person[psor]=3`, `POS=ADP\|PronType=Int`, `Number[psor]=Sing\|POS=VERB\|Person[psor]=3`, `Number[psor]=Sing\|POS=PRON\|Person[psor]=3\|PronType=Rel`, `Degree=Pos\|Number=Sing\|POS=AUX`, `Number=Sing\|Number[psor]=Sing\|POS=NOUN\|Person[psor]=1`, `Number=Sing\|POS=SCONJ\|Voice=Pass`, `Degree=Sup\|Number=Sing\|POS=ADP`, `Number=Sing\|POS=SCONJ\|Voice=Act`, `NumType=Card\|POS=DET\|PronType=Int`, `Degree=Pos\|Number=Sing\|POS=PART\|Polarity=Neg`, `Degree=Sup\|Number=Sing\|POS=SCONJ`, `Number=Sing\|Number[psor]=Sing\|POS=NOUN\|Person[psor]=1\|Voice=Act`, `Number=Plur\|POS=ADJ`, `POS=VERB\|PronType=Int`, `Number=Sing\|POS=VERB\|Person=2\|Voice=Act`, `Degree=Pos\|Number=Sing\|Number[psor]=Sing\|POS=ADJ\|Person[psor]=2`, `Gender=Masc\|Number=Sing\|POS=ADJ`, `Number[psor]=Sing\|POS=ADV\|Person[psor]=3\|PronType=Tot`, `POS=DET\|PronType=Rel`, `Number=Sing\|POS=NOUN\|Polarity=Neg`, `Number=Sing\|Number[psor]=Sing\|POS=PROPN\|Person[psor]=2`, `NumType=Card\|Number=Sing\|POS=NUM\|Voice=Act`, `Degree=Pos\|Number=Plur\|POS=ADJ`, `Number[psor]=Sing\|POS=DET\|Person[psor]=3\|PronType=Tot`, `Number[psor]=Sing\|POS=PROPN\|Person[psor]=1`, `Gender=Fem\|Number=Sing\|POS=NOUN`, `Number=Sing\|POS=VERB\|Person=1`, `Degree=Pos\|Number=Sing\|Number[psor]=Sing\|POS=PROPN\|Person[psor]=3`, `NumType=Card\|Number[psor]=Sing\|POS=DET\|Person[psor]=3\|PronType=Ind`, `POS=ADV\|PronType=Tot`, `Degree=Pos\|Number=Plur\|POS=ADV`, `Number=Plur\|POS=ADV\|Voice=Act`, `POS=CCONJ\|PronType=Int`, `Degree=Pos\|Number=Sing\|POS=PART`, `Number[psor]=Sing\|POS=PRON\|Person[psor]=2`, `Number=Plur\|POS=VERB`, `Number=Sing\|Number[psor]=Sing\|POS=ADJ\|Person[psor]=3\|Voice=Pass`, `Degree=Pos\|Number=Sing\|POS=PUNCT`, `Number[psor]=Sing\|POS=ADP\|Person[psor]=1`, `Degree=Sup\|Number=Sing\|POS=NOUN`, 
`Number[psor]=Sing\|POS=PART\|Person[psor]=3\|Polarity=Neg`, `Number=Sing\|Number[psor]=Sing\|POS=ADP\|Person[psor]=3\|Voice=Act`, `POS=NOUN\|Polarity=Neg`, `Number[psor]=Sing\|POS=PROPN\|Person[psor]=2`, `Number=Sing\|Number[psor]=Sing\|POS=NOUN\|Person[psor]=2\|Voice=Act` |
96
+ | **`parser`** | `ROOT`, `acl`, `advcl`, `advmod`, `amod`, `appos`, `case`, `cc`, `ccomp`, `compound`, `compound:plur`, `conj`, `cop`, `dep`, `det`, `fixed`, `flat`, `mark`, `nmod`, `nsubj`, `nsubj:pass`, `nummod`, `obj`, `obl`, `parataxis`, `punct`, `xcomp` |
97
 
98
  </details>
99
 
 
101
 
102
  | Type | Score |
103
  | --- | --- |
104
+ | `ENTS_F` | 70.92 |
105
+ | `ENTS_P` | 70.83 |
106
+ | `ENTS_R` | 71.01 |
107
+ | `TAG_ACC` | 92.46 |
108
+ | `POS_ACC` | 92.37 |
109
+ | `MORPH_ACC` | 94.45 |
110
+ | `LEMMA_ACC` | 97.20 |
111
+ | `DEP_UAS` | 81.74 |
112
+ | `DEP_LAS` | 72.99 |
113
+ | `SENTS_P` | 87.69 |
114
+ | `SENTS_R` | 90.52 |
115
+ | `SENTS_F` | 89.08 |
116
+ | `TOK2VEC_LOSS` | 1297727.43 |
117
+ | `NER_LOSS` | 96670.57 |
118
+ | `TAGGER_LOSS` | 56378.18 |
119
+ | `MORPHOLOGIZER_LOSS` | 164858.35 |
120
+ | `TRAINABLE_LEMMATIZER_LOSS` | 16646.19 |
121
+ | `PARSER_LOSS` | 930045.93 |
 
config.cfg CHANGED
@@ -1,6 +1,6 @@
1
  [paths]
2
- train = "./id_gsd-ud-train.spacy"
3
- dev = "./id_gsd-ud-dev.spacy"
4
  vectors = null
5
  init_tok2vec = null
6
 
 
1
  [paths]
2
+ train = "./output-train.spacy"
3
+ dev = "./output-dev.spacy"
4
  vectors = null
5
  init_tok2vec = null
6
 
id_core_news_sm-any-py3-none-any.whl CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6c89d501e10ca94b399fb58b812f28a8d55848c6c8f3b58ed0d8f06465957d91
3
- size 34239071
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:72bac69325eb27405bbaa6256001a173a762fc1759b080061ed65e2aa88242e3
3
+ size 34294361
meta.json CHANGED
@@ -1,14 +1,14 @@
1
  {
2
  "lang":"id",
3
  "name":"core_news_sm",
4
- "version":"0.0.2",
5
  "description":"",
6
  "author":"",
7
  "email":"",
8
  "url":"",
9
  "license":"",
10
- "spacy_version":">=3.7.4,<3.8.0",
11
- "spacy_git_version":"bff8725f4",
12
  "vectors":{
13
  "width":0,
14
  "vectors":0,
@@ -20,176 +20,330 @@
20
 
21
  ],
22
  "ner":[
23
-
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
24
  ],
25
  "tagger":[
26
  "APP",
27
  "ASP",
 
28
  "ASP+PS3",
 
29
  "ASS",
 
30
  "B--",
31
  "B--+PS3",
 
32
  "CC-",
33
- "CCONJ",
 
34
  "CD-",
 
35
  "CO-",
 
36
  "D--",
 
37
  "D--+PS3",
 
38
  "F--",
 
39
  "F--+PS2",
 
 
40
  "G--",
41
  "G--+PS3",
 
42
  "H--",
 
43
  "I--",
44
  "M--",
45
  "M--+PS3",
 
46
  "NOUN",
47
  "NPD",
 
 
48
  "NSD",
 
 
49
  "NSD+PS3",
 
50
  "NSF",
51
  "NSM",
 
52
  "NUM",
53
  "O--",
54
  "PP1",
 
55
  "PP2",
56
  "PP3",
 
57
  "PROPN",
58
  "PS1",
59
  "PS1+VSA",
 
60
  "PS2",
 
61
  "PS3",
 
62
  "R--",
 
 
63
  "R--+PS3",
64
  "S--",
65
- "SYM",
66
  "T--",
67
  "VERB",
68
  "VPA",
69
  "VSA",
 
70
  "VSA+PS2",
71
  "VSA+PS3",
 
72
  "VSP",
 
 
73
  "W--",
 
 
74
  "X--",
75
  "Z--"
76
  ],
77
  "morphologizer":[
78
  "POS=PROPN",
79
  "POS=AUX",
80
- "Definite=Ind|POS=DET|PronType=Art",
81
  "Number=Sing|POS=NOUN",
82
  "POS=PRON|PronType=Rel",
83
- "Mood=Ind|POS=VERB|Voice=Pass",
84
  "POS=ADP",
85
  "POS=PUNCT",
 
86
  "POS=NOUN",
87
  "POS=ADV",
88
  "POS=CCONJ",
89
- "POS=SCONJ",
90
- "Mood=Ind|POS=VERB|Voice=Act",
91
  "POS=VERB",
92
  "POS=DET|PronType=Tot",
93
- "Number=Sing|POS=PRON|Person=3|PronType=Prs",
 
94
  "Number=Plur|POS=PRON|Person=3|PronType=Prs",
95
- "POS=PRON|PronType=Prs|Reflex=Yes",
96
  "POS=DET|PronType=Dem",
97
  "NumType=Card|POS=NUM",
98
- "POS=ADJ",
99
- "Number=Plur|POS=DET|PronType=Ind",
100
- "NumType=Card|POS=NUM|PronType=Tot",
101
- "POS=PART|Polarity=Neg",
 
 
102
  "POS=PRON|PronType=Int",
103
- "NumType=Ord|POS=ADJ",
104
- "POS=PART",
 
 
 
 
 
105
  "POS=PRON|PronType=Dem",
106
- "POS=DET|PronType=Ind",
107
- "Number=Plur|POS=NOUN",
108
  "Number=Sing|POS=PRON|Person=1|Polite=Form|PronType=Prs",
 
 
 
109
  "POS=ADV|PronType=Int",
110
  "Clusivity=In|Number=Plur|POS=PRON|Person=1|PronType=Prs",
111
- "Definite=Def|POS=DET|PronType=Art",
112
- "POS=SYM",
113
- "Degree=Sup|POS=ADJ",
114
- "POS=INTJ",
 
 
 
 
 
 
 
 
 
 
 
 
115
  "Number=Sing|POS=PRON|Person=2|Polite=Infm|PronType=Prs",
116
- "POS=ADV|PronType=Ind",
 
 
 
 
 
117
  "Number=Sing|POS=PRON|Person=3|Polite=Form|PronType=Prs",
118
- "Number=Sing|POS=PRON|Person=1|Polite=Infm|PronType=Prs",
119
- "Number=Sing|POS=PRON|PronType=Ind",
120
- "POS=VERB|Voice=Act",
121
- "POS=DET|PronType=Emp",
122
- "POS=VERB|Voice=Pass",
 
 
 
 
 
 
 
 
123
  "POS=ADV|PronType=Dem",
124
- "POS=NOUN|Typo=Yes",
125
- "POS=ADP|Typo=Yes",
126
- "Number=Plur|POS=PRON|PronType=Ind",
127
- "POS=VERB|Typo=Yes|Voice=Pass",
128
- "POS=X",
 
 
 
 
 
 
 
 
 
129
  "POS=PRON|PronType=Tot",
130
- "POS=SCONJ|Typo=Yes",
131
- "Number=Plur|POS=PRON|Person=2|Polite=Infm|PronType=Prs",
132
- "NumType=Card|POS=NUM|Typo=Yes",
 
 
 
 
 
 
133
  "Clusivity=Ex|Number=Plur|POS=PRON|Person=1|PronType=Prs",
 
 
 
 
 
 
134
  "Number=Sing|POS=PRON|Person=2|Polite=Form|PronType=Prs",
135
- "Foreign=Yes|POS=X",
136
- "POS=ADV|PronType=Rel",
137
- "Mood=Imp|POS=VERB|Voice=Act",
138
- "Number=Sing|POS=NOUN|Typo=Yes",
139
- "POS=PROPN|Typo=Yes",
140
- "POS=DET",
141
- "Number=Sing|POS=DET|PronType=Ind",
142
- "POS=DET|PronType=Ind|Typo=Yes",
143
- "Abbr=Yes|POS=DET|PronType=Dem",
144
- "POS=PRON|PronType=Ind",
145
- "POS=VERB|Typo=Yes",
146
- "Abbr=Yes|POS=PROPN",
147
- "Abbr=Yes|POS=PRON|PronType=Rel",
148
- "Number=Plur|POS=PRON|PronType=Int",
149
- "Abbr=Yes|POS=PART|Polarity=Neg",
150
- "POS=ADV|PronType=Tot",
151
- "Abbr=Yes|POS=ADV",
152
- "POS=ADV|Typo=Yes",
153
- "POS=X|Typo=Yes",
 
 
 
 
 
 
 
 
 
 
 
154
  "Number=Sing|POS=PRON|Person=2|PronType=Prs",
155
- "POS=ADV|PronType=Int|Typo=Yes",
156
- "NumType=Ord|POS=ADJ|Typo=Yes"
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
157
  ],
158
  "parser":[
159
  "ROOT",
160
  "acl",
161
- "acl:relcl",
162
  "advcl",
163
  "advmod",
164
- "advmod:emph",
165
  "amod",
166
  "appos",
167
- "aux",
168
  "case",
169
- "case:adv",
170
  "cc",
171
  "ccomp",
172
  "compound",
 
173
  "conj",
174
  "cop",
175
  "dep",
176
  "det",
177
  "fixed",
178
  "flat",
179
- "flat:foreign",
180
- "flat:name",
181
  "mark",
182
  "nmod",
183
- "nmod:lmod",
184
- "nmod:poss",
185
- "nmod:tmod",
186
  "nsubj",
187
  "nsubj:pass",
188
  "nummod",
189
  "obj",
190
  "obl",
191
- "obl:agent",
192
- "obl:tmod",
193
  "parataxis",
194
  "punct",
195
  "xcomp"
@@ -215,268 +369,299 @@
215
 
216
  ],
217
  "performance":{
218
- "ents_f":0.0,
219
- "ents_p":0.0,
220
- "ents_r":0.0,
221
- "ents_per_type":0.0,
222
- "tag_acc":0.9058429775,
223
- "pos_acc":0.911077953,
224
- "morph_acc":0.924529063,
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
225
  "morph_per_feat":{
226
  "Number":{
227
- "p":0.978250591,
228
- "r":0.8123282293,
229
- "f":0.8876018876
230
- },
231
- "Mood":{
232
- "p":0.9941520468,
233
- "r":0.9147982063,
234
- "f":0.9528257823
235
  },
236
  "Voice":{
237
- "p":0.9902723735,
238
- "r":0.9113697404,
239
- "f":0.9491841492
240
  },
241
  "PronType":{
242
- "p":0.991576414,
243
- "r":0.7795648061,
244
- "f":0.8728813559
245
  },
246
  "Polarity":{
247
  "p":1.0,
248
- "r":0.862745098,
249
- "f":0.9263157895
250
  },
251
- "Person":{
252
- "p":1.0,
253
- "r":0.3973509934,
254
- "f":0.5687203791
255
  },
256
  "NumType":{
257
- "p":0.9952718676,
258
- "r":0.9503386005,
259
- "f":0.9722863741
260
  },
261
- "Typo":{
262
  "p":1.0,
263
- "r":0.4666666667,
264
- "f":0.6363636364
265
  },
266
- "Definite":{
267
- "p":0.9838709677,
268
- "r":0.7922077922,
269
- "f":0.8776978417
 
 
 
 
 
270
  },
271
  "Polite":{
272
  "p":1.0,
273
- "r":0.65625,
274
- "f":0.7924528302
275
  },
276
- "Reflex":{
277
  "p":1.0,
278
- "r":0.5,
279
- "f":0.6666666667
280
- },
281
- "Degree":{
282
- "p":0.9375,
283
- "r":0.8823529412,
284
- "f":0.9090909091
285
- },
286
- "Foreign":{
287
- "p":0.0,
288
- "r":0.0,
289
- "f":0.0
290
  },
291
  "Clusivity":{
292
  "p":1.0,
293
  "r":1.0,
294
  "f":1.0
295
- },
296
- "Abbr":{
297
- "p":1.0,
298
- "r":0.2,
299
- "f":0.3333333333
300
  }
301
  },
302
- "lemma_acc":0.9356240444,
303
- "dep_uas":0.779082277,
304
- "dep_las":0.6971807939,
305
  "dep_las_per_type":{
306
  "nsubj":{
307
- "p":0.8022759602,
308
- "r":0.7621621622,
309
- "f":0.7817047817
310
  },
311
  "compound":{
312
- "p":0.6970849176,
313
- "r":0.6988564168,
314
- "f":0.6979695431
315
  },
316
  "root":{
317
- "p":0.8139963168,
318
- "r":0.7906976744,
319
- "f":0.8021778584
320
  },
321
  "obj":{
322
- "p":0.8152985075,
323
- "r":0.7613240418,
324
- "f":0.7873873874
325
  },
326
  "case":{
327
- "p":0.9104609929,
328
- "r":0.8868739206,
329
- "f":0.8985126859
330
  },
331
  "obl":{
332
- "p":0.7344322344,
333
- "r":0.6178736518,
334
- "f":0.6711297071
335
  },
336
  "amod":{
337
- "p":0.6195899772,
338
- "r":0.590021692,
339
- "f":0.6044444444
340
  },
341
  "conj":{
342
- "p":0.5868263473,
343
- "r":0.5485074627,
344
- "f":0.5670202507
345
  },
346
  "cc":{
347
- "p":0.880239521,
348
- "r":0.8376068376,
349
- "f":0.8583941606
350
  },
351
- "acl:relcl":{
352
- "p":0.7262357414,
353
- "r":0.6821428571,
354
- "f":0.7034990792
355
  },
356
- "flat:name":{
357
- "p":0.7844036697,
358
- "r":0.8123515439,
359
- "f":0.7981330222
360
  },
361
  "advmod":{
362
- "p":0.7588075881,
363
- "r":0.6982543641,
364
- "f":0.7272727273
365
  },
366
  "nmod":{
367
- "p":0.613836478,
368
- "r":0.5816448153,
369
- "f":0.5973072215
370
  },
371
  "nsubj:pass":{
372
- "p":0.7100840336,
373
- "r":0.7824074074,
374
- "f":0.7444933921
375
  },
376
  "det":{
377
- "p":0.8545454545,
378
- "r":0.7943661972,
379
- "f":0.8233576642
380
- },
381
- "aux":{
382
- "p":0.9461538462,
383
- "r":0.9179104478,
384
- "f":0.9318181818
385
- },
386
- "nmod:poss":{
387
- "p":0.8235294118,
388
- "r":0.0848484848,
389
- "f":0.1538461538
390
  },
391
  "dep":{
392
- "p":0.2394366197,
393
- "r":0.3035714286,
394
- "f":0.2677165354
 
 
 
 
 
395
  },
396
  "mark":{
397
- "p":0.8018018018,
398
- "r":0.7542372881,
399
- "f":0.7772925764
400
  },
401
  "cop":{
402
- "p":0.9607843137,
403
  "r":0.9423076923,
404
- "f":0.9514563107
405
- },
406
- "acl":{
407
- "p":0.3048780488,
408
- "r":0.2232142857,
409
- "f":0.2577319588
410
  },
411
  "nummod":{
412
- "p":0.7768817204,
413
- "r":0.7747989276,
414
- "f":0.7758389262
415
  },
416
  "appos":{
417
- "p":0.6460176991,
418
- "r":0.553030303,
419
- "f":0.5959183673
420
  },
421
  "xcomp":{
422
- "p":0.4495412844,
423
- "r":0.392,
424
- "f":0.4188034188
425
  },
426
  "ccomp":{
427
- "p":0.4571428571,
428
- "r":0.3265306122,
429
- "f":0.380952381
430
- },
431
- "obl:tmod":{
432
- "p":0.6029411765,
433
- "r":0.6721311475,
434
- "f":0.6356589147
435
  },
436
  "advcl":{
437
- "p":0.268907563,
438
- "r":0.2269503546,
439
- "f":0.2461538462
440
- },
441
- "advmod:emph":{
442
- "p":1.0,
443
- "r":0.0434782609,
444
- "f":0.0833333333
445
- },
446
- "case:adv":{
447
- "p":0.7272727273,
448
- "r":0.6153846154,
449
- "f":0.6666666667
450
- },
451
- "obl:agent":{
452
- "p":0.0,
453
- "r":0.0,
454
- "f":0.0
455
  },
456
- "flat":{
457
- "p":0.4375,
458
- "r":0.3255813953,
459
- "f":0.3733333333
460
  },
461
  "parataxis":{
462
- "p":0.2253521127,
463
- "r":0.3265306122,
464
- "f":0.2666666667
465
- },
466
- "nmod:lmod":{
467
- "p":1.0,
468
- "r":0.0769230769,
469
- "f":0.1428571429
470
- },
471
- "flat:foreign":{
472
- "p":0.0,
473
- "r":0.0,
474
- "f":0.0
475
- },
476
- "nmod:tmod":{
477
- "p":0.3333333333,
478
- "r":0.2727272727,
479
- "f":0.3
480
  },
481
  "iobj":{
482
  "p":0.0,
@@ -487,37 +672,17 @@
487
  "p":0.0,
488
  "r":0.0,
489
  "f":0.0
490
- },
491
- "fixed":{
492
- "p":0.6,
493
- "r":0.3461538462,
494
- "f":0.4390243902
495
- },
496
- "discourse":{
497
- "p":0.0,
498
- "r":0.0,
499
- "f":0.0
500
- },
501
- "cc:preconj":{
502
- "p":0.0,
503
- "r":0.0,
504
- "f":0.0
505
- },
506
- "compound:a":{
507
- "p":0.0,
508
- "r":0.0,
509
- "f":0.0
510
  }
511
  },
512
- "sents_p":0.9074733096,
513
- "sents_r":0.9123434705,
514
- "sents_f":0.9099018733,
515
- "tok2vec_loss":8342.1316462817,
516
- "ner_loss":0.0,
517
- "tagger_loss":572.1505841613,
518
- "morphologizer_loss":1246.6148492694,
519
- "trainable_lemmatizer_loss":245.6071262917,
520
- "parser_loss":8829.155590333
521
  },
522
  "requirements":[
523
 
 
1
  {
2
  "lang":"id",
3
  "name":"core_news_sm",
4
+ "version":"0.0.3",
5
  "description":"",
6
  "author":"",
7
  "email":"",
8
  "url":"",
9
  "license":"",
10
+ "spacy_version":">=3.7.0,<3.8.0",
11
+ "spacy_git_version":"160e61772",
12
  "vectors":{
13
  "width":0,
14
  "vectors":0,
 
20
 
21
  ],
22
  "ner":[
23
+ "CARDINAL",
24
+ "DATE",
25
+ "EVENT",
26
+ "FAC",
27
+ "GPE",
28
+ "LANGUAGE",
29
+ "LAW",
30
+ "LOC",
31
+ "MONEY",
32
+ "NORP",
33
+ "ORDINAL",
34
+ "ORG",
35
+ "PERCENT",
36
+ "PERSON",
37
+ "PRODUCT",
38
+ "QUANTITY",
39
+ "TIME",
40
+ "WORK_OF_ART"
41
  ],
42
  "tagger":[
43
  "APP",
44
  "ASP",
45
+ "ASP+PS2",
46
  "ASP+PS3",
47
+ "ASP+T--",
48
  "ASS",
49
+ "ASS+PS3",
50
  "B--",
51
  "B--+PS3",
52
+ "B--+T--",
53
  "CC-",
54
+ "CC-+PS3",
55
+ "CC-+T--",
56
  "CD-",
57
+ "CD-+PS3",
58
  "CO-",
59
+ "CO-+PS3",
60
  "D--",
61
+ "D--+PS2",
62
  "D--+PS3",
63
+ "D--+T--",
64
  "F--",
65
+ "F--+PS1",
66
  "F--+PS2",
67
+ "F--+PS3",
68
+ "F--+T--",
69
  "G--",
70
  "G--+PS3",
71
+ "G--+T--",
72
  "H--",
73
+ "H--+T--",
74
  "I--",
75
  "M--",
76
  "M--+PS3",
77
+ "M--+T--",
78
  "NOUN",
79
  "NPD",
80
+ "NPD+PS2",
81
+ "NPD+PS3",
82
  "NSD",
83
+ "NSD+PS1",
84
+ "NSD+PS2",
85
  "NSD+PS3",
86
+ "NSD+T--",
87
  "NSF",
88
  "NSM",
89
+ "NSM+PS3",
90
  "NUM",
91
  "O--",
92
  "PP1",
93
+ "PP1+T--",
94
  "PP2",
95
  "PP3",
96
+ "PP3+T--",
97
  "PROPN",
98
  "PS1",
99
  "PS1+VSA",
100
+ "PS1+VSA+T--",
101
  "PS2",
102
+ "PS2+VSA",
103
  "PS3",
104
+ "PUNCT",
105
  "R--",
106
+ "R--+PS1",
107
+ "R--+PS2",
108
  "R--+PS3",
109
  "S--",
110
+ "S--+PS3",
111
  "T--",
112
  "VERB",
113
  "VPA",
114
  "VSA",
115
+ "VSA+PS1",
116
  "VSA+PS2",
117
  "VSA+PS3",
118
+ "VSA+T--",
119
  "VSP",
120
+ "VSP+PS3",
121
+ "VSP+T--",
122
  "W--",
123
+ "W--+T--",
124
+ "X",
125
  "X--",
126
  "Z--"
127
  ],
128
  "morphologizer":[
129
  "POS=PROPN",
130
  "POS=AUX",
131
+ "POS=DET|PronType=Ind",
132
  "Number=Sing|POS=NOUN",
133
  "POS=PRON|PronType=Rel",
134
+ "Number=Sing|POS=VERB|Voice=Pass",
135
  "POS=ADP",
136
  "POS=PUNCT",
137
+ "Number=Sing|POS=PROPN",
138
  "POS=NOUN",
139
  "POS=ADV",
140
  "POS=CCONJ",
141
+ "Number=Sing|POS=VERB|Voice=Act",
 
142
  "POS=VERB",
143
  "POS=DET|PronType=Tot",
144
+ "Number=Sing|Number[psor]=Sing|POS=NOUN|Person[psor]=3",
145
+ "POS=SCONJ",
146
  "Number=Plur|POS=PRON|Person=3|PronType=Prs",
 
147
  "POS=DET|PronType=Dem",
148
  "NumType=Card|POS=NUM",
149
+ "Degree=Pos|Number=Sing|POS=NOUN",
150
+ "Degree=Pos|Number=Sing|POS=ADJ",
151
+ "NumType=Card|POS=DET|PronType=Ind",
152
+ "Degree=Pos|Number=Sing|POS=ADP",
153
+ "Number[psor]=Sing|POS=NOUN|Person[psor]=3",
154
+ "Number=Sing|POS=VERB",
155
  "POS=PRON|PronType=Int",
156
+ "Number=Sing|POS=ADV|Voice=Act",
157
+ "Number=Sing|Number[psor]=Sing|POS=VERB|Person[psor]=3|Voice=Act",
158
+ "Number=Sing|POS=ADP|Voice=Act",
159
+ "POS=ADJ",
160
+ "Number[psor]=Sing|POS=ADP|Person[psor]=3",
161
+ "Degree=Pos|Number=Sing|POS=DET",
162
+ "Degree=Pos|Number=Sing|POS=VERB",
163
  "POS=PRON|PronType=Dem",
164
+ "POS=PART|Polarity=Neg",
165
+ "Degree=Pos|Number=Sing|Number[psor]=Sing|POS=NOUN|Person[psor]=3",
166
  "Number=Sing|POS=PRON|Person=1|Polite=Form|PronType=Prs",
167
+ "Number=Sing|POS=ADJ",
168
+ "Number=Sing|POS=PRON|Person=3|PronType=Prs",
169
+ "POS=SYM",
170
  "POS=ADV|PronType=Int",
171
  "Clusivity=In|Number=Plur|POS=PRON|Person=1|PronType=Prs",
172
+ "Number=Sing|POS=ADJ|Voice=Act",
173
+ "Degree=Pos|Number=Sing|POS=PROPN",
174
+ "Degree=Pos|Number=Sing|POS=ADV",
175
+ "Number=Sing|Number[psor]=Sing|POS=VERB|Person[psor]=3|Voice=Pass",
176
+ "Number=Sing|Number[psor]=Sing|POS=NOUN|Person[psor]=3|Voice=Act",
177
+ "Number=Sing|POS=PROPN|Voice=Act",
178
+ "Number=Sing|POS=NOUN|Voice=Act",
179
+ "POS=DET",
180
+ "Number=Sing|POS=DET|Voice=Act",
181
+ "NumType=Card|POS=PRON|PronType=Ind",
182
+ "Number=Sing|Number[psor]=Sing|POS=ADV|Person[psor]=3",
183
+ "Number=Sing|POS=DET",
184
+ "Number=Sing|POS=ADJ|Voice=Pass",
185
+ "POS=CCONJ|PronType=Dem",
186
+ "Number=Sing|POS=ADP",
187
+ "Number=Sing|POS=ADV",
188
  "Number=Sing|POS=PRON|Person=2|Polite=Infm|PronType=Prs",
189
+ "Number[psor]=Sing|POS=NOUN|Person[psor]=2",
190
+ "Number=Plur|Number[psor]=Sing|POS=NOUN|Person[psor]=2",
191
+ "Number=Sing|POS=PRON",
192
+ "POS=PRON",
193
+ "NumType=Card|POS=ADV|PronType=Ind",
194
+ "NumType=Card|Number[psor]=Sing|POS=NUM|Person[psor]=3",
195
  "Number=Sing|POS=PRON|Person=3|Polite=Form|PronType=Prs",
196
+ "POS=DET|PronType=Int",
197
+ "Number=Sing|Number[psor]=Sing|POS=PROPN|Person[psor]=3",
198
+ "Number=Sing|Number[psor]=Sing|POS=PROPN|Person[psor]=1",
199
+ "Degree=Pos|Number=Sing|POS=SCONJ",
200
+ "POS=PRON|PronType=Ind",
201
+ "Number=Sing|Number[psor]=Sing|POS=NOUN|Person[psor]=3|Voice=Pass",
202
+ "POS=VERB|PronType=Ind",
203
+ "Degree=Pos|Number=Sing|Number[psor]=Sing|POS=ADJ|Person[psor]=3",
204
+ "Number=Sing|POS=SCONJ",
205
+ "Degree=Sup|Number=Sing|Number[psor]=Sing|POS=ADJ|Person[psor]=3",
206
+ "Degree=Pos|Number=Sing|Number[psor]=Sing|POS=ADP|Person[psor]=3",
207
+ "Number=Plur|Number[psor]=Sing|POS=NOUN|Person[psor]=3",
208
+ "Number=Plur|POS=NOUN",
209
  "POS=ADV|PronType=Dem",
210
+ "Number=Sing|POS=VERB|Person=1|Voice=Act",
211
+ "Degree=Sup|Number=Sing|POS=ADJ",
212
+ "Number=Sing|POS=ADP|Voice=Pass",
213
+ "Number[psor]=Sing|POS=PART|Person[psor]=3",
214
+ "Number=Sing|POS=NOUN|Voice=Pass",
215
+ "Degree=Pos|Number=Sing|Number[psor]=Sing|POS=CCONJ|Person[psor]=3",
216
+ "POS=PART",
217
+ "Number=Sing|Number[psor]=Sing|POS=PART|Person[psor]=3|Voice=Pass",
218
+ "Degree=Sup|Number=Sing|POS=ADV",
219
+ "Number=Sing|POS=PRON|Voice=Act",
220
+ "Number=Sing|Number[psor]=Sing|POS=PROPN|Person[psor]=3|Voice=Act",
221
+ "Gender=Masc|Number=Sing|POS=PROPN",
222
+ "Number[psor]=Sing|POS=PRON|Person[psor]=3|PronType=Tot",
223
+ "Degree=Pos|Number=Sing|POS=X",
224
  "POS=PRON|PronType=Tot",
225
+ "Degree=Pos|Number=Sing|Number[psor]=Sing|POS=ADV|Person[psor]=3",
226
+ "Degree=Pos|Number=Sing|Number[psor]=Sing|POS=VERB|Person[psor]=3",
227
+ "Number=Sing|Number[psor]=Sing|POS=ADP|Person[psor]=3",
228
+ "Number=Sing|Number[psor]=Sing|POS=NOUN|Person[psor]=2",
229
+ "POS=SCONJ|PronType=Int",
230
+ "Number=Plur|POS=PRON|Person=2|PronType=Prs",
231
+ "Number=Sing|Number[psor]=Sing|POS=VERB|Person[psor]=1|Voice=Act",
232
+ "Number[psor]=Sing|POS=DET|Person[psor]=3",
233
+ "Number=Sing|Number[psor]=Sing|POS=PRON|Person[psor]=3",
234
  "Clusivity=Ex|Number=Plur|POS=PRON|Person=1|PronType=Prs",
235
+ "Number=Plur|POS=VERB|Voice=Act",
236
+ "Number=Sing|Number[psor]=Sing|POS=ADV|Person[psor]=3|Voice=Act",
237
+ "Degree=Pos|Number=Sing|POS=NOUN|Polarity=Neg",
238
+ "POS=X",
239
+ "Number[psor]=Sing|POS=ADJ|Person[psor]=3",
240
+ "Number=Sing|Number[psor]=Sing|POS=VERB|Person[psor]=3",
241
  "Number=Sing|POS=PRON|Person=2|Polite=Form|PronType=Prs",
242
+ "Number=Sing|POS=PRON|Person=1|Polite=Infm|PronType=Prs",
243
+ "Number=Sing|POS=PROPN|Voice=Pass",
244
+ "POS=ADV|Polarity=Neg",
245
+ "NumType=Card|Number=Sing|POS=NUM",
246
+ "Number[psor]=Sing|POS=ADV|Person[psor]=2",
247
+ "Number[psor]=Sing|POS=ADV|Person[psor]=3",
248
+ "Degree=Sup|Number=Sing|POS=PROPN",
249
+ "POS=PROPN|Polarity=Neg",
250
+ "Number=Sing|Number[psor]=Sing|POS=VERB|Person[psor]=2|Voice=Act",
251
+ "Number=Sing|POS=PROPN|Person=1|Voice=Act",
252
+ "POS=SCONJ|PronType=Dem",
253
+ "Number=Sing|Number[psor]=Sing|POS=ADV|Person[psor]=2|Voice=Act",
254
+ "Number=Sing|POS=CCONJ",
255
+ "Degree=Sup|Number=Sing|POS=VERB",
256
+ "Number=Sing|Number[psor]=Sing|POS=ADJ|Person[psor]=3",
257
+ "Number=Sing|Number[psor]=Sing|POS=ADJ|Person[psor]=3|Voice=Act",
258
+ "Degree=Pos|Number=Sing|POS=PRON",
259
+ "Number=Sing|POS=ADV|Voice=Pass",
260
+ "Number[psor]=Sing|POS=ADP|Person[psor]=2",
261
+ "Number=Sing|POS=SYM",
262
+ "POS=ADJ|Polarity=Neg",
263
+ "Degree=Pos|NumType=Card|Number=Sing|POS=NUM",
264
+ "Number=Sing|Number[psor]=Sing|POS=SCONJ|Person[psor]=3",
265
+ "Degree=Pos|Number=Sing|POS=CCONJ",
266
+ "Number[psor]=Sing|POS=NOUN|Person[psor]=1",
267
+ "Number=Sing|POS=CCONJ|Voice=Act",
268
+ "Gender=Masc|Number=Sing|POS=NOUN",
269
+ "Number=Sing|Number[psor]=Sing|POS=ADP|Person[psor]=3|Voice=Pass",
270
+ "Gender=Fem|Number=Sing|POS=PROPN",
271
+ "POS=VERB|PronType=Dem",
272
  "Number=Sing|POS=PRON|Person=2|PronType=Prs",
273
+ "Gender=Masc|Number=Sing|Number[psor]=Sing|POS=NOUN|Person[psor]=3",
274
+ "Number=Sing|POS=PART|Voice=Act",
275
+ "Degree=Sup|Number=Sing|Number[psor]=Sing|POS=NOUN|Person[psor]=3",
276
+ "POS=ADP|PronType=Int",
277
+ "Number[psor]=Sing|POS=VERB|Person[psor]=3",
278
+ "Number[psor]=Sing|POS=PRON|Person[psor]=3|PronType=Rel",
279
+ "Degree=Pos|Number=Sing|POS=AUX",
280
+ "Number=Sing|Number[psor]=Sing|POS=NOUN|Person[psor]=1",
281
+ "Number=Sing|POS=SCONJ|Voice=Pass",
282
+ "Degree=Sup|Number=Sing|POS=ADP",
283
+ "Number=Sing|POS=SCONJ|Voice=Act",
284
+ "NumType=Card|POS=DET|PronType=Int",
285
+ "Degree=Pos|Number=Sing|POS=PART|Polarity=Neg",
286
+ "Degree=Sup|Number=Sing|POS=SCONJ",
287
+ "Number=Sing|Number[psor]=Sing|POS=NOUN|Person[psor]=1|Voice=Act",
288
+ "Number=Plur|POS=ADJ",
289
+ "POS=VERB|PronType=Int",
290
+ "Number=Sing|POS=VERB|Person=2|Voice=Act",
291
+ "Degree=Pos|Number=Sing|Number[psor]=Sing|POS=ADJ|Person[psor]=2",
292
+ "Gender=Masc|Number=Sing|POS=ADJ",
293
+ "Number[psor]=Sing|POS=ADV|Person[psor]=3|PronType=Tot",
294
+ "POS=DET|PronType=Rel",
295
+ "Number=Sing|POS=NOUN|Polarity=Neg",
296
+ "Number=Sing|Number[psor]=Sing|POS=PROPN|Person[psor]=2",
297
+ "NumType=Card|Number=Sing|POS=NUM|Voice=Act",
298
+ "Degree=Pos|Number=Plur|POS=ADJ",
299
+ "Number[psor]=Sing|POS=DET|Person[psor]=3|PronType=Tot",
300
+ "Number[psor]=Sing|POS=PROPN|Person[psor]=1",
301
+ "Gender=Fem|Number=Sing|POS=NOUN",
302
+ "Number=Sing|POS=VERB|Person=1",
303
+ "Degree=Pos|Number=Sing|Number[psor]=Sing|POS=PROPN|Person[psor]=3",
304
+ "NumType=Card|Number[psor]=Sing|POS=DET|Person[psor]=3|PronType=Ind",
305
+ "POS=ADV|PronType=Tot",
306
+ "Degree=Pos|Number=Plur|POS=ADV",
307
+ "Number=Plur|POS=ADV|Voice=Act",
308
+ "POS=CCONJ|PronType=Int",
309
+ "Degree=Pos|Number=Sing|POS=PART",
310
+ "Number[psor]=Sing|POS=PRON|Person[psor]=2",
311
+ "Number=Plur|POS=VERB",
312
+ "Number=Sing|Number[psor]=Sing|POS=ADJ|Person[psor]=3|Voice=Pass",
313
+ "Degree=Pos|Number=Sing|POS=PUNCT",
314
+ "Number[psor]=Sing|POS=ADP|Person[psor]=1",
315
+ "Degree=Sup|Number=Sing|POS=NOUN",
316
+ "Number[psor]=Sing|POS=PART|Person[psor]=3|Polarity=Neg",
317
+ "Number=Sing|Number[psor]=Sing|POS=ADP|Person[psor]=3|Voice=Act",
318
+ "POS=NOUN|Polarity=Neg",
319
+ "Number[psor]=Sing|POS=PROPN|Person[psor]=2",
320
+ "Number=Sing|Number[psor]=Sing|POS=NOUN|Person[psor]=2|Voice=Act"
321
  ],
322
  "parser":[
323
  "ROOT",
324
  "acl",
 
325
  "advcl",
326
  "advmod",
 
327
  "amod",
328
  "appos",
 
329
  "case",
 
330
  "cc",
331
  "ccomp",
332
  "compound",
333
+ "compound:plur",
334
  "conj",
335
  "cop",
336
  "dep",
337
  "det",
338
  "fixed",
339
  "flat",
 
 
340
  "mark",
341
  "nmod",
 
 
 
342
  "nsubj",
343
  "nsubj:pass",
344
  "nummod",
345
  "obj",
346
  "obl",
 
 
347
  "parataxis",
348
  "punct",
349
  "xcomp"
 
369
 
370
  ],
371
  "performance":{
372
+ "ents_f":0.7092271905,
373
+ "ents_p":0.7083118224,
374
+ "ents_r":0.7101449275,
375
+ "ents_per_type":{
376
+ "PRODUCT":{
377
+ "p":0.5909090909,
378
+ "r":0.4482758621,
379
+ "f":0.5098039216
380
+ },
381
+ "GPE":{
382
+ "p":0.8341968912,
383
+ "r":0.8363636364,
384
+ "f":0.8352788586
385
+ },
386
+ "FAC":{
387
+ "p":0.5,
388
+ "r":0.4259259259,
389
+ "f":0.46
390
+ },
391
+ "PERSON":{
392
+ "p":0.6575,
393
+ "r":0.6902887139,
394
+ "f":0.6734955186
395
+ },
396
+ "ORG":{
397
+ "p":0.609929078,
398
+ "r":0.4699453552,
399
+ "f":0.5308641975
400
+ },
401
+ "WORK_OF_ART":{
402
+ "p":0.2181818182,
403
+ "r":0.375,
404
+ "f":0.275862069
405
+ },
406
+ "LAW":{
407
+ "p":0.5555555556,
408
+ "r":0.6730769231,
409
+ "f":0.6086956522
410
+ },
411
+ "DATE":{
412
+ "p":0.8333333333,
413
+ "r":0.8387096774,
414
+ "f":0.8360128617
415
+ },
416
+ "ORDINAL":{
417
+ "p":0.9429824561,
418
+ "r":0.9684684685,
419
+ "f":0.9555555556
420
+ },
421
+ "CARDINAL":{
422
+ "p":0.8,
423
+ "r":0.8717948718,
424
+ "f":0.8343558282
425
+ },
426
+ "EVENT":{
427
+ "p":0.4155844156,
428
+ "r":0.4705882353,
429
+ "f":0.4413793103
430
+ },
431
+ "QUANTITY":{
432
+ "p":0.4347826087,
433
+ "r":0.5263157895,
434
+ "f":0.4761904762
435
+ },
436
+ "LOC":{
437
+ "p":0.564516129,
438
+ "r":0.5737704918,
439
+ "f":0.5691056911
440
+ },
441
+ "NORP":{
442
+ "p":0.7746478873,
443
+ "r":0.7236842105,
444
+ "f":0.7482993197
445
+ },
446
+ "PERCENT":{
447
+ "p":0.7777777778,
448
+ "r":0.7777777778,
449
+ "f":0.7777777778
450
+ },
451
+ "TIME":{
452
+ "p":0.6666666667,
453
+ "r":0.6666666667,
454
+ "f":0.6666666667
455
+ },
456
+ "LANGUAGE":{
457
+ "p":0.75,
458
+ "r":0.7894736842,
459
+ "f":0.7692307692
460
+ },
461
+ "MONEY":{
462
+ "p":0.0,
463
+ "r":0.0,
464
+ "f":0.0
465
+ }
466
+ },
467
+ "tag_acc":0.924552227,
468
+ "pos_acc":0.9237476221,
469
+ "morph_acc":0.9444730688,
470
  "morph_per_feat":{
471
  "Number":{
472
+ "p":0.9930514195,
473
+ "r":0.9632197189,
474
+ "f":0.9779081134
 
 
 
 
 
475
  },
476
  "Voice":{
477
+ "p":0.9679230152,
478
+ "r":0.9414976599,
479
+ "f":0.9545274812
480
  },
481
  "PronType":{
482
+ "p":0.9815498155,
483
+ "r":0.9602888087,
484
+ "f":0.9708029197
485
  },
486
  "Polarity":{
487
  "p":1.0,
488
+ "r":0.8846153846,
489
+ "f":0.9387755102
490
  },
491
+ "Degree":{
492
+ "p":0.9647435897,
493
+ "r":0.8478873239,
494
+ "f":0.9025487256
495
  },
496
  "NumType":{
497
+ "p":0.9622641509,
498
+ "r":0.9293849658,
499
+ "f":0.9455388181
500
  },
501
+ "Person":{
502
  "p":1.0,
503
+ "r":0.9193548387,
504
+ "f":0.9579831933
505
  },
506
+ "Number[psor]":{
507
+ "p":0.9946524064,
508
+ "r":0.9441624365,
509
+ "f":0.96875
510
+ },
511
+ "Person[psor]":{
512
+ "p":0.9893048128,
513
+ "r":0.9390862944,
514
+ "f":0.9635416667
515
  },
516
  "Polite":{
517
  "p":1.0,
518
+ "r":0.9090909091,
519
+ "f":0.9523809524
520
  },
521
+ "Gender":{
522
  "p":1.0,
523
+ "r":0.75,
524
+ "f":0.8571428571
 
 
 
 
 
 
 
 
 
 
525
  },
526
  "Clusivity":{
527
  "p":1.0,
528
  "r":1.0,
529
  "f":1.0
 
 
 
 
 
530
  }
531
  },
532
+ "lemma_acc":0.9719515094,
533
+ "dep_uas":0.817370892,
534
+ "dep_las":0.7299441393,
535
  "dep_las_per_type":{
536
  "nsubj":{
537
+ "p":0.7940780619,
538
+ "r":0.7898259705,
539
+ "f":0.7919463087
540
  },
541
  "compound":{
542
+ "p":0.6948356808,
543
+ "r":0.7390761548,
544
+ "f":0.7162734422
545
  },
546
  "root":{
547
+ "p":0.7902946274,
548
+ "r":0.8157423971,
549
+ "f":0.8028169014
550
  },
551
  "obj":{
552
+ "p":0.796460177,
553
+ "r":0.7908611599,
554
+ "f":0.7936507937
555
  },
556
  "case":{
557
+ "p":0.9110751819,
558
+ "r":0.9103392569,
559
+ "f":0.9107070707
560
  },
561
  "obl":{
562
+ "p":0.6636713736,
563
+ "r":0.7762762763,
564
+ "f":0.7155709343
565
  },
566
  "amod":{
567
+ "p":0.6194174757,
568
+ "r":0.6392785571,
569
+ "f":0.6291913215
570
  },
571
  "conj":{
572
+ "p":0.5516528926,
573
+ "r":0.5095419847,
574
+ "f":0.5297619048
575
  },
576
  "cc":{
577
+ "p":0.8366762178,
578
+ "r":0.8156424581,
579
+ "f":0.8260254597
580
  },
581
+ "acl":{
582
+ "p":0.6510791367,
583
+ "r":0.5307917889,
584
+ "f":0.5848142165
585
  },
586
+ "flat":{
587
+ "p":0.7840909091,
588
+ "r":0.8284734134,
589
+ "f":0.8056713928
590
  },
591
  "advmod":{
592
+ "p":0.770398482,
593
+ "r":0.7883495146,
594
+ "f":0.7792706334
595
  },
596
  "nmod":{
597
+ "p":0.5913978495,
598
+ "r":0.4782608696,
599
+ "f":0.5288461538
600
  },
601
  "nsubj:pass":{
602
+ "p":0.736318408,
603
+ "r":0.6820276498,
604
+ "f":0.7081339713
605
  },
606
  "det":{
607
+ "p":0.8005050505,
608
+ "r":0.7171945701,
609
+ "f":0.7565632458
 
 
 
 
 
 
 
 
 
 
610
  },
611
  "dep":{
612
+ "p":0.2790697674,
613
+ "r":0.1935483871,
614
+ "f":0.2285714286
615
+ },
616
+ "fixed":{
617
+ "p":0.6888888889,
618
+ "r":0.5438596491,
619
+ "f":0.6078431373
620
  },
621
  "mark":{
622
+ "p":0.6585365854,
623
+ "r":0.6315789474,
624
+ "f":0.6447761194
625
  },
626
  "cop":{
627
+ "p":0.9423076923,
628
  "r":0.9423076923,
629
+ "f":0.9423076923
 
 
 
 
 
630
  },
631
  "nummod":{
632
+ "p":0.7443438914,
633
+ "r":0.7615740741,
634
+ "f":0.7528604119
635
  },
636
  "appos":{
637
+ "p":0.5243055556,
638
+ "r":0.5634328358,
639
+ "f":0.5431654676
640
  },
641
  "xcomp":{
642
+ "p":0.465648855,
643
+ "r":0.4692307692,
644
+ "f":0.4674329502
645
  },
646
  "ccomp":{
647
+ "p":0.3529411765,
648
+ "r":0.1132075472,
649
+ "f":0.1714285714
 
 
 
 
 
650
  },
651
  "advcl":{
652
+ "p":0.3109756098,
653
+ "r":0.3541666667,
654
+ "f":0.3311688312
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
655
  },
656
+ "compound:plur":{
657
+ "p":0.8823529412,
658
+ "r":0.8695652174,
659
+ "f":0.8759124088
660
  },
661
  "parataxis":{
662
+ "p":0.2380952381,
663
+ "r":0.4255319149,
664
+ "f":0.3053435115
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
665
  },
666
  "iobj":{
667
  "p":0.0,
 
672
  "p":0.0,
673
  "r":0.0,
674
  "f":0.0
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
675
  }
676
  },
677
+ "sents_p":0.87694974,
678
+ "sents_r":0.9051878354,
679
+ "sents_f":0.8908450704,
680
+ "tok2vec_loss":12977.2743123164,
681
+ "ner_loss":966.7057275135,
682
+ "tagger_loss":563.7818157673,
683
+ "morphologizer_loss":1648.5834716558,
684
+ "trainable_lemmatizer_loss":166.4619438377,
685
+ "parser_loss":9300.4593325223
686
  },
687
  "requirements":[
688
 
morphologizer/cfg CHANGED
@@ -4,164 +4,390 @@
4
  "labels_morph":{
5
  "POS=PROPN":"",
6
  "POS=AUX":"",
7
- "Definite=Ind|POS=DET|PronType=Art":"Definite=Ind|PronType=Art",
8
  "Number=Sing|POS=NOUN":"Number=Sing",
9
  "POS=PRON|PronType=Rel":"PronType=Rel",
10
- "Mood=Ind|POS=VERB|Voice=Pass":"Mood=Ind|Voice=Pass",
11
  "POS=ADP":"",
12
  "POS=PUNCT":"",
 
13
  "POS=NOUN":"",
14
  "POS=ADV":"",
15
  "POS=CCONJ":"",
16
- "POS=SCONJ":"",
17
- "Mood=Ind|POS=VERB|Voice=Act":"Mood=Ind|Voice=Act",
18
  "POS=VERB":"",
19
  "POS=DET|PronType=Tot":"PronType=Tot",
20
- "Number=Sing|POS=PRON|Person=3|PronType=Prs":"Number=Sing|Person=3|PronType=Prs",
 
21
  "Number=Plur|POS=PRON|Person=3|PronType=Prs":"Number=Plur|Person=3|PronType=Prs",
22
- "POS=PRON|PronType=Prs|Reflex=Yes":"PronType=Prs|Reflex=Yes",
23
  "POS=DET|PronType=Dem":"PronType=Dem",
24
  "NumType=Card|POS=NUM":"NumType=Card",
25
- "POS=ADJ":"",
26
- "Number=Plur|POS=DET|PronType=Ind":"Number=Plur|PronType=Ind",
27
- "NumType=Card|POS=NUM|PronType=Tot":"NumType=Card|PronType=Tot",
28
- "POS=PART|Polarity=Neg":"Polarity=Neg",
 
 
29
  "POS=PRON|PronType=Int":"PronType=Int",
30
- "NumType=Ord|POS=ADJ":"NumType=Ord",
31
- "POS=PART":"",
 
 
 
 
 
32
  "POS=PRON|PronType=Dem":"PronType=Dem",
33
- "POS=DET|PronType=Ind":"PronType=Ind",
34
- "Number=Plur|POS=NOUN":"Number=Plur",
35
  "Number=Sing|POS=PRON|Person=1|Polite=Form|PronType=Prs":"Number=Sing|Person=1|Polite=Form|PronType=Prs",
 
 
 
36
  "POS=ADV|PronType=Int":"PronType=Int",
37
  "Clusivity=In|Number=Plur|POS=PRON|Person=1|PronType=Prs":"Clusivity=In|Number=Plur|Person=1|PronType=Prs",
38
- "Definite=Def|POS=DET|PronType=Art":"Definite=Def|PronType=Art",
39
- "POS=SYM":"",
40
- "Degree=Sup|POS=ADJ":"Degree=Sup",
41
- "POS=INTJ":"",
 
 
 
 
 
 
 
 
 
 
 
 
42
  "Number=Sing|POS=PRON|Person=2|Polite=Infm|PronType=Prs":"Number=Sing|Person=2|Polite=Infm|PronType=Prs",
43
- "POS=ADV|PronType=Ind":"PronType=Ind",
 
 
 
 
 
44
  "Number=Sing|POS=PRON|Person=3|Polite=Form|PronType=Prs":"Number=Sing|Person=3|Polite=Form|PronType=Prs",
45
- "Number=Sing|POS=PRON|Person=1|Polite=Infm|PronType=Prs":"Number=Sing|Person=1|Polite=Infm|PronType=Prs",
46
- "Number=Sing|POS=PRON|PronType=Ind":"Number=Sing|PronType=Ind",
47
- "POS=VERB|Voice=Act":"Voice=Act",
48
- "POS=DET|PronType=Emp":"PronType=Emp",
49
- "POS=VERB|Voice=Pass":"Voice=Pass",
 
 
 
 
 
 
 
 
50
  "POS=ADV|PronType=Dem":"PronType=Dem",
51
- "POS=NOUN|Typo=Yes":"Typo=Yes",
52
- "POS=ADP|Typo=Yes":"Typo=Yes",
53
- "Number=Plur|POS=PRON|PronType=Ind":"Number=Plur|PronType=Ind",
54
- "POS=VERB|Typo=Yes|Voice=Pass":"Typo=Yes|Voice=Pass",
55
- "POS=X":"",
 
 
 
 
 
 
 
 
 
56
  "POS=PRON|PronType=Tot":"PronType=Tot",
57
- "POS=SCONJ|Typo=Yes":"Typo=Yes",
58
- "Number=Plur|POS=PRON|Person=2|Polite=Infm|PronType=Prs":"Number=Plur|Person=2|Polite=Infm|PronType=Prs",
59
- "NumType=Card|POS=NUM|Typo=Yes":"NumType=Card|Typo=Yes",
 
 
 
 
 
 
60
  "Clusivity=Ex|Number=Plur|POS=PRON|Person=1|PronType=Prs":"Clusivity=Ex|Number=Plur|Person=1|PronType=Prs",
 
 
 
 
 
 
61
  "Number=Sing|POS=PRON|Person=2|Polite=Form|PronType=Prs":"Number=Sing|Person=2|Polite=Form|PronType=Prs",
62
- "Foreign=Yes|POS=X":"Foreign=Yes",
63
- "POS=ADV|PronType=Rel":"PronType=Rel",
64
- "Mood=Imp|POS=VERB|Voice=Act":"Mood=Imp|Voice=Act",
65
- "Number=Sing|POS=NOUN|Typo=Yes":"Number=Sing|Typo=Yes",
66
- "POS=PROPN|Typo=Yes":"Typo=Yes",
67
- "POS=DET":"",
68
- "Number=Sing|POS=DET|PronType=Ind":"Number=Sing|PronType=Ind",
69
- "POS=DET|PronType=Ind|Typo=Yes":"PronType=Ind|Typo=Yes",
70
- "Abbr=Yes|POS=DET|PronType=Dem":"Abbr=Yes|PronType=Dem",
71
- "POS=PRON|PronType=Ind":"PronType=Ind",
72
- "POS=VERB|Typo=Yes":"Typo=Yes",
73
- "Abbr=Yes|POS=PROPN":"Abbr=Yes",
74
- "Abbr=Yes|POS=PRON|PronType=Rel":"Abbr=Yes|PronType=Rel",
75
- "Number=Plur|POS=PRON|PronType=Int":"Number=Plur|PronType=Int",
76
- "Abbr=Yes|POS=PART|Polarity=Neg":"Abbr=Yes|Polarity=Neg",
77
- "POS=ADV|PronType=Tot":"PronType=Tot",
78
- "Abbr=Yes|POS=ADV":"Abbr=Yes",
79
- "POS=ADV|Typo=Yes":"Typo=Yes",
80
- "POS=X|Typo=Yes":"Typo=Yes",
 
 
 
 
 
 
 
 
 
 
 
81
  "Number=Sing|POS=PRON|Person=2|PronType=Prs":"Number=Sing|Person=2|PronType=Prs",
82
- "POS=ADV|PronType=Int|Typo=Yes":"PronType=Int|Typo=Yes",
83
- "NumType=Ord|POS=ADJ|Typo=Yes":"NumType=Ord|Typo=Yes"
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
84
  },
85
  "labels_pos":{
86
  "POS=PROPN":96,
87
  "POS=AUX":87,
88
- "Definite=Ind|POS=DET|PronType=Art":90,
89
  "Number=Sing|POS=NOUN":92,
90
  "POS=PRON|PronType=Rel":95,
91
- "Mood=Ind|POS=VERB|Voice=Pass":100,
92
  "POS=ADP":85,
93
  "POS=PUNCT":97,
 
94
  "POS=NOUN":92,
95
  "POS=ADV":86,
96
  "POS=CCONJ":89,
97
- "POS=SCONJ":98,
98
- "Mood=Ind|POS=VERB|Voice=Act":100,
99
  "POS=VERB":100,
100
  "POS=DET|PronType=Tot":90,
101
- "Number=Sing|POS=PRON|Person=3|PronType=Prs":95,
 
102
  "Number=Plur|POS=PRON|Person=3|PronType=Prs":95,
103
- "POS=PRON|PronType=Prs|Reflex=Yes":95,
104
  "POS=DET|PronType=Dem":90,
105
  "NumType=Card|POS=NUM":93,
106
- "POS=ADJ":84,
107
- "Number=Plur|POS=DET|PronType=Ind":90,
108
- "NumType=Card|POS=NUM|PronType=Tot":93,
109
- "POS=PART|Polarity=Neg":94,
 
 
110
  "POS=PRON|PronType=Int":95,
111
- "NumType=Ord|POS=ADJ":84,
112
- "POS=PART":94,
 
 
 
 
 
113
  "POS=PRON|PronType=Dem":95,
114
- "POS=DET|PronType=Ind":90,
115
- "Number=Plur|POS=NOUN":92,
116
  "Number=Sing|POS=PRON|Person=1|Polite=Form|PronType=Prs":95,
 
 
 
117
  "POS=ADV|PronType=Int":86,
118
  "Clusivity=In|Number=Plur|POS=PRON|Person=1|PronType=Prs":95,
119
- "Definite=Def|POS=DET|PronType=Art":90,
120
- "POS=SYM":99,
121
- "Degree=Sup|POS=ADJ":84,
122
- "POS=INTJ":91,
 
 
 
 
 
 
 
 
 
 
 
 
123
  "Number=Sing|POS=PRON|Person=2|Polite=Infm|PronType=Prs":95,
124
- "POS=ADV|PronType=Ind":86,
 
 
 
 
 
125
  "Number=Sing|POS=PRON|Person=3|Polite=Form|PronType=Prs":95,
126
- "Number=Sing|POS=PRON|Person=1|Polite=Infm|PronType=Prs":95,
127
- "Number=Sing|POS=PRON|PronType=Ind":95,
128
- "POS=VERB|Voice=Act":100,
129
- "POS=DET|PronType=Emp":90,
130
- "POS=VERB|Voice=Pass":100,
 
 
 
 
 
 
 
 
131
  "POS=ADV|PronType=Dem":86,
132
- "POS=NOUN|Typo=Yes":92,
133
- "POS=ADP|Typo=Yes":85,
134
- "Number=Plur|POS=PRON|PronType=Ind":95,
135
- "POS=VERB|Typo=Yes|Voice=Pass":100,
136
- "POS=X":101,
 
 
 
 
 
 
 
 
 
137
  "POS=PRON|PronType=Tot":95,
138
- "POS=SCONJ|Typo=Yes":98,
139
- "Number=Plur|POS=PRON|Person=2|Polite=Infm|PronType=Prs":95,
140
- "NumType=Card|POS=NUM|Typo=Yes":93,
 
 
 
 
 
 
141
  "Clusivity=Ex|Number=Plur|POS=PRON|Person=1|PronType=Prs":95,
 
 
 
 
 
 
142
  "Number=Sing|POS=PRON|Person=2|Polite=Form|PronType=Prs":95,
143
- "Foreign=Yes|POS=X":101,
144
- "POS=ADV|PronType=Rel":86,
145
- "Mood=Imp|POS=VERB|Voice=Act":100,
146
- "Number=Sing|POS=NOUN|Typo=Yes":92,
147
- "POS=PROPN|Typo=Yes":96,
148
- "POS=DET":90,
149
- "Number=Sing|POS=DET|PronType=Ind":90,
150
- "POS=DET|PronType=Ind|Typo=Yes":90,
151
- "Abbr=Yes|POS=DET|PronType=Dem":90,
152
- "POS=PRON|PronType=Ind":95,
153
- "POS=VERB|Typo=Yes":100,
154
- "Abbr=Yes|POS=PROPN":96,
155
- "Abbr=Yes|POS=PRON|PronType=Rel":95,
156
- "Number=Plur|POS=PRON|PronType=Int":95,
157
- "Abbr=Yes|POS=PART|Polarity=Neg":94,
158
- "POS=ADV|PronType=Tot":86,
159
- "Abbr=Yes|POS=ADV":86,
160
- "POS=ADV|Typo=Yes":86,
161
- "POS=X|Typo=Yes":101,
 
 
 
 
 
 
 
 
 
 
 
162
  "Number=Sing|POS=PRON|Person=2|PronType=Prs":95,
163
- "POS=ADV|PronType=Int|Typo=Yes":86,
164
- "NumType=Ord|POS=ADJ|Typo=Yes":84
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
165
  },
166
  "overwrite":true
167
  }
 
4
  "labels_morph":{
5
  "POS=PROPN":"",
6
  "POS=AUX":"",
7
+ "POS=DET|PronType=Ind":"PronType=Ind",
8
  "Number=Sing|POS=NOUN":"Number=Sing",
9
  "POS=PRON|PronType=Rel":"PronType=Rel",
10
+ "Number=Sing|POS=VERB|Voice=Pass":"Number=Sing|Voice=Pass",
11
  "POS=ADP":"",
12
  "POS=PUNCT":"",
13
+ "Number=Sing|POS=PROPN":"Number=Sing",
14
  "POS=NOUN":"",
15
  "POS=ADV":"",
16
  "POS=CCONJ":"",
17
+ "Number=Sing|POS=VERB|Voice=Act":"Number=Sing|Voice=Act",
 
18
  "POS=VERB":"",
19
  "POS=DET|PronType=Tot":"PronType=Tot",
20
+ "Number=Sing|Number[psor]=Sing|POS=NOUN|Person[psor]=3":"Number=Sing|Number[psor]=Sing|Person[psor]=3",
21
+ "POS=SCONJ":"",
22
  "Number=Plur|POS=PRON|Person=3|PronType=Prs":"Number=Plur|Person=3|PronType=Prs",
 
23
  "POS=DET|PronType=Dem":"PronType=Dem",
24
  "NumType=Card|POS=NUM":"NumType=Card",
25
+ "Degree=Pos|Number=Sing|POS=NOUN":"Degree=Pos|Number=Sing",
26
+ "Degree=Pos|Number=Sing|POS=ADJ":"Degree=Pos|Number=Sing",
27
+ "NumType=Card|POS=DET|PronType=Ind":"NumType=Card|PronType=Ind",
28
+ "Degree=Pos|Number=Sing|POS=ADP":"Degree=Pos|Number=Sing",
29
+ "Number[psor]=Sing|POS=NOUN|Person[psor]=3":"Number[psor]=Sing|Person[psor]=3",
30
+ "Number=Sing|POS=VERB":"Number=Sing",
31
  "POS=PRON|PronType=Int":"PronType=Int",
32
+ "Number=Sing|POS=ADV|Voice=Act":"Number=Sing|Voice=Act",
33
+ "Number=Sing|Number[psor]=Sing|POS=VERB|Person[psor]=3|Voice=Act":"Number=Sing|Number[psor]=Sing|Person[psor]=3|Voice=Act",
34
+ "Number=Sing|POS=ADP|Voice=Act":"Number=Sing|Voice=Act",
35
+ "POS=ADJ":"",
36
+ "Number[psor]=Sing|POS=ADP|Person[psor]=3":"Number[psor]=Sing|Person[psor]=3",
37
+ "Degree=Pos|Number=Sing|POS=DET":"Degree=Pos|Number=Sing",
38
+ "Degree=Pos|Number=Sing|POS=VERB":"Degree=Pos|Number=Sing",
39
  "POS=PRON|PronType=Dem":"PronType=Dem",
40
+ "POS=PART|Polarity=Neg":"Polarity=Neg",
41
+ "Degree=Pos|Number=Sing|Number[psor]=Sing|POS=NOUN|Person[psor]=3":"Degree=Pos|Number=Sing|Number[psor]=Sing|Person[psor]=3",
42
  "Number=Sing|POS=PRON|Person=1|Polite=Form|PronType=Prs":"Number=Sing|Person=1|Polite=Form|PronType=Prs",
43
+ "Number=Sing|POS=ADJ":"Number=Sing",
44
+ "Number=Sing|POS=PRON|Person=3|PronType=Prs":"Number=Sing|Person=3|PronType=Prs",
45
+ "POS=SYM":"",
46
  "POS=ADV|PronType=Int":"PronType=Int",
47
  "Clusivity=In|Number=Plur|POS=PRON|Person=1|PronType=Prs":"Clusivity=In|Number=Plur|Person=1|PronType=Prs",
48
+ "Number=Sing|POS=ADJ|Voice=Act":"Number=Sing|Voice=Act",
49
+ "Degree=Pos|Number=Sing|POS=PROPN":"Degree=Pos|Number=Sing",
50
+ "Degree=Pos|Number=Sing|POS=ADV":"Degree=Pos|Number=Sing",
51
+ "Number=Sing|Number[psor]=Sing|POS=VERB|Person[psor]=3|Voice=Pass":"Number=Sing|Number[psor]=Sing|Person[psor]=3|Voice=Pass",
52
+ "Number=Sing|Number[psor]=Sing|POS=NOUN|Person[psor]=3|Voice=Act":"Number=Sing|Number[psor]=Sing|Person[psor]=3|Voice=Act",
53
+ "Number=Sing|POS=PROPN|Voice=Act":"Number=Sing|Voice=Act",
54
+ "Number=Sing|POS=NOUN|Voice=Act":"Number=Sing|Voice=Act",
55
+ "POS=DET":"",
56
+ "Number=Sing|POS=DET|Voice=Act":"Number=Sing|Voice=Act",
57
+ "NumType=Card|POS=PRON|PronType=Ind":"NumType=Card|PronType=Ind",
58
+ "Number=Sing|Number[psor]=Sing|POS=ADV|Person[psor]=3":"Number=Sing|Number[psor]=Sing|Person[psor]=3",
59
+ "Number=Sing|POS=DET":"Number=Sing",
60
+ "Number=Sing|POS=ADJ|Voice=Pass":"Number=Sing|Voice=Pass",
61
+ "POS=CCONJ|PronType=Dem":"PronType=Dem",
62
+ "Number=Sing|POS=ADP":"Number=Sing",
63
+ "Number=Sing|POS=ADV":"Number=Sing",
64
  "Number=Sing|POS=PRON|Person=2|Polite=Infm|PronType=Prs":"Number=Sing|Person=2|Polite=Infm|PronType=Prs",
65
+ "Number[psor]=Sing|POS=NOUN|Person[psor]=2":"Number[psor]=Sing|Person[psor]=2",
66
+ "Number=Plur|Number[psor]=Sing|POS=NOUN|Person[psor]=2":"Number=Plur|Number[psor]=Sing|Person[psor]=2",
67
+ "Number=Sing|POS=PRON":"Number=Sing",
68
+ "POS=PRON":"",
69
+ "NumType=Card|POS=ADV|PronType=Ind":"NumType=Card|PronType=Ind",
70
+ "NumType=Card|Number[psor]=Sing|POS=NUM|Person[psor]=3":"NumType=Card|Number[psor]=Sing|Person[psor]=3",
71
  "Number=Sing|POS=PRON|Person=3|Polite=Form|PronType=Prs":"Number=Sing|Person=3|Polite=Form|PronType=Prs",
72
+ "POS=DET|PronType=Int":"PronType=Int",
73
+ "Number=Sing|Number[psor]=Sing|POS=PROPN|Person[psor]=3":"Number=Sing|Number[psor]=Sing|Person[psor]=3",
74
+ "Number=Sing|Number[psor]=Sing|POS=PROPN|Person[psor]=1":"Number=Sing|Number[psor]=Sing|Person[psor]=1",
75
+ "Degree=Pos|Number=Sing|POS=SCONJ":"Degree=Pos|Number=Sing",
76
+ "POS=PRON|PronType=Ind":"PronType=Ind",
77
+ "Number=Sing|Number[psor]=Sing|POS=NOUN|Person[psor]=3|Voice=Pass":"Number=Sing|Number[psor]=Sing|Person[psor]=3|Voice=Pass",
78
+ "POS=VERB|PronType=Ind":"PronType=Ind",
79
+ "Degree=Pos|Number=Sing|Number[psor]=Sing|POS=ADJ|Person[psor]=3":"Degree=Pos|Number=Sing|Number[psor]=Sing|Person[psor]=3",
80
+ "Number=Sing|POS=SCONJ":"Number=Sing",
81
+ "Degree=Sup|Number=Sing|Number[psor]=Sing|POS=ADJ|Person[psor]=3":"Degree=Sup|Number=Sing|Number[psor]=Sing|Person[psor]=3",
82
+ "Degree=Pos|Number=Sing|Number[psor]=Sing|POS=ADP|Person[psor]=3":"Degree=Pos|Number=Sing|Number[psor]=Sing|Person[psor]=3",
83
+ "Number=Plur|Number[psor]=Sing|POS=NOUN|Person[psor]=3":"Number=Plur|Number[psor]=Sing|Person[psor]=3",
84
+ "Number=Plur|POS=NOUN":"Number=Plur",
85
  "POS=ADV|PronType=Dem":"PronType=Dem",
86
+ "Number=Sing|POS=VERB|Person=1|Voice=Act":"Number=Sing|Person=1|Voice=Act",
87
+ "Degree=Sup|Number=Sing|POS=ADJ":"Degree=Sup|Number=Sing",
88
+ "Number=Sing|POS=ADP|Voice=Pass":"Number=Sing|Voice=Pass",
89
+ "Number[psor]=Sing|POS=PART|Person[psor]=3":"Number[psor]=Sing|Person[psor]=3",
90
+ "Number=Sing|POS=NOUN|Voice=Pass":"Number=Sing|Voice=Pass",
91
+ "Degree=Pos|Number=Sing|Number[psor]=Sing|POS=CCONJ|Person[psor]=3":"Degree=Pos|Number=Sing|Number[psor]=Sing|Person[psor]=3",
92
+ "POS=PART":"",
93
+ "Number=Sing|Number[psor]=Sing|POS=PART|Person[psor]=3|Voice=Pass":"Number=Sing|Number[psor]=Sing|Person[psor]=3|Voice=Pass",
94
+ "Degree=Sup|Number=Sing|POS=ADV":"Degree=Sup|Number=Sing",
95
+ "Number=Sing|POS=PRON|Voice=Act":"Number=Sing|Voice=Act",
96
+ "Number=Sing|Number[psor]=Sing|POS=PROPN|Person[psor]=3|Voice=Act":"Number=Sing|Number[psor]=Sing|Person[psor]=3|Voice=Act",
97
+ "Gender=Masc|Number=Sing|POS=PROPN":"Gender=Masc|Number=Sing",
98
+ "Number[psor]=Sing|POS=PRON|Person[psor]=3|PronType=Tot":"Number[psor]=Sing|Person[psor]=3|PronType=Tot",
99
+ "Degree=Pos|Number=Sing|POS=X":"Degree=Pos|Number=Sing",
100
  "POS=PRON|PronType=Tot":"PronType=Tot",
101
+ "Degree=Pos|Number=Sing|Number[psor]=Sing|POS=ADV|Person[psor]=3":"Degree=Pos|Number=Sing|Number[psor]=Sing|Person[psor]=3",
102
+ "Degree=Pos|Number=Sing|Number[psor]=Sing|POS=VERB|Person[psor]=3":"Degree=Pos|Number=Sing|Number[psor]=Sing|Person[psor]=3",
103
+ "Number=Sing|Number[psor]=Sing|POS=ADP|Person[psor]=3":"Number=Sing|Number[psor]=Sing|Person[psor]=3",
104
+ "Number=Sing|Number[psor]=Sing|POS=NOUN|Person[psor]=2":"Number=Sing|Number[psor]=Sing|Person[psor]=2",
105
+ "POS=SCONJ|PronType=Int":"PronType=Int",
106
+ "Number=Plur|POS=PRON|Person=2|PronType=Prs":"Number=Plur|Person=2|PronType=Prs",
107
+ "Number=Sing|Number[psor]=Sing|POS=VERB|Person[psor]=1|Voice=Act":"Number=Sing|Number[psor]=Sing|Person[psor]=1|Voice=Act",
108
+ "Number[psor]=Sing|POS=DET|Person[psor]=3":"Number[psor]=Sing|Person[psor]=3",
109
+ "Number=Sing|Number[psor]=Sing|POS=PRON|Person[psor]=3":"Number=Sing|Number[psor]=Sing|Person[psor]=3",
110
  "Clusivity=Ex|Number=Plur|POS=PRON|Person=1|PronType=Prs":"Clusivity=Ex|Number=Plur|Person=1|PronType=Prs",
111
+ "Number=Plur|POS=VERB|Voice=Act":"Number=Plur|Voice=Act",
112
+ "Number=Sing|Number[psor]=Sing|POS=ADV|Person[psor]=3|Voice=Act":"Number=Sing|Number[psor]=Sing|Person[psor]=3|Voice=Act",
113
+ "Degree=Pos|Number=Sing|POS=NOUN|Polarity=Neg":"Degree=Pos|Number=Sing|Polarity=Neg",
114
+ "POS=X":"",
115
+ "Number[psor]=Sing|POS=ADJ|Person[psor]=3":"Number[psor]=Sing|Person[psor]=3",
116
+ "Number=Sing|Number[psor]=Sing|POS=VERB|Person[psor]=3":"Number=Sing|Number[psor]=Sing|Person[psor]=3",
117
  "Number=Sing|POS=PRON|Person=2|Polite=Form|PronType=Prs":"Number=Sing|Person=2|Polite=Form|PronType=Prs",
118
+ "Number=Sing|POS=PRON|Person=1|Polite=Infm|PronType=Prs":"Number=Sing|Person=1|Polite=Infm|PronType=Prs",
119
+ "Number=Sing|POS=PROPN|Voice=Pass":"Number=Sing|Voice=Pass",
120
+ "POS=ADV|Polarity=Neg":"Polarity=Neg",
121
+ "NumType=Card|Number=Sing|POS=NUM":"NumType=Card|Number=Sing",
122
+ "Number[psor]=Sing|POS=ADV|Person[psor]=2":"Number[psor]=Sing|Person[psor]=2",
123
+ "Number[psor]=Sing|POS=ADV|Person[psor]=3":"Number[psor]=Sing|Person[psor]=3",
124
+ "Degree=Sup|Number=Sing|POS=PROPN":"Degree=Sup|Number=Sing",
125
+ "POS=PROPN|Polarity=Neg":"Polarity=Neg",
126
+ "Number=Sing|Number[psor]=Sing|POS=VERB|Person[psor]=2|Voice=Act":"Number=Sing|Number[psor]=Sing|Person[psor]=2|Voice=Act",
127
+ "Number=Sing|POS=PROPN|Person=1|Voice=Act":"Number=Sing|Person=1|Voice=Act",
128
+ "POS=SCONJ|PronType=Dem":"PronType=Dem",
129
+ "Number=Sing|Number[psor]=Sing|POS=ADV|Person[psor]=2|Voice=Act":"Number=Sing|Number[psor]=Sing|Person[psor]=2|Voice=Act",
130
+ "Number=Sing|POS=CCONJ":"Number=Sing",
131
+ "Degree=Sup|Number=Sing|POS=VERB":"Degree=Sup|Number=Sing",
132
+ "Number=Sing|Number[psor]=Sing|POS=ADJ|Person[psor]=3":"Number=Sing|Number[psor]=Sing|Person[psor]=3",
133
+ "Number=Sing|Number[psor]=Sing|POS=ADJ|Person[psor]=3|Voice=Act":"Number=Sing|Number[psor]=Sing|Person[psor]=3|Voice=Act",
134
+ "Degree=Pos|Number=Sing|POS=PRON":"Degree=Pos|Number=Sing",
135
+ "Number=Sing|POS=ADV|Voice=Pass":"Number=Sing|Voice=Pass",
136
+ "Number[psor]=Sing|POS=ADP|Person[psor]=2":"Number[psor]=Sing|Person[psor]=2",
137
+ "Number=Sing|POS=SYM":"Number=Sing",
138
+ "POS=ADJ|Polarity=Neg":"Polarity=Neg",
139
+ "Degree=Pos|NumType=Card|Number=Sing|POS=NUM":"Degree=Pos|NumType=Card|Number=Sing",
140
+ "Number=Sing|Number[psor]=Sing|POS=SCONJ|Person[psor]=3":"Number=Sing|Number[psor]=Sing|Person[psor]=3",
141
+ "Degree=Pos|Number=Sing|POS=CCONJ":"Degree=Pos|Number=Sing",
142
+ "Number[psor]=Sing|POS=NOUN|Person[psor]=1":"Number[psor]=Sing|Person[psor]=1",
143
+ "Number=Sing|POS=CCONJ|Voice=Act":"Number=Sing|Voice=Act",
144
+ "Gender=Masc|Number=Sing|POS=NOUN":"Gender=Masc|Number=Sing",
145
+ "Number=Sing|Number[psor]=Sing|POS=ADP|Person[psor]=3|Voice=Pass":"Number=Sing|Number[psor]=Sing|Person[psor]=3|Voice=Pass",
146
+ "Gender=Fem|Number=Sing|POS=PROPN":"Gender=Fem|Number=Sing",
147
+ "POS=VERB|PronType=Dem":"PronType=Dem",
148
  "Number=Sing|POS=PRON|Person=2|PronType=Prs":"Number=Sing|Person=2|PronType=Prs",
149
+ "Gender=Masc|Number=Sing|Number[psor]=Sing|POS=NOUN|Person[psor]=3":"Gender=Masc|Number=Sing|Number[psor]=Sing|Person[psor]=3",
150
+ "Number=Sing|POS=PART|Voice=Act":"Number=Sing|Voice=Act",
151
+ "Degree=Sup|Number=Sing|Number[psor]=Sing|POS=NOUN|Person[psor]=3":"Degree=Sup|Number=Sing|Number[psor]=Sing|Person[psor]=3",
152
+ "POS=ADP|PronType=Int":"PronType=Int",
153
+ "Number[psor]=Sing|POS=VERB|Person[psor]=3":"Number[psor]=Sing|Person[psor]=3",
154
+ "Number[psor]=Sing|POS=PRON|Person[psor]=3|PronType=Rel":"Number[psor]=Sing|Person[psor]=3|PronType=Rel",
155
+ "Degree=Pos|Number=Sing|POS=AUX":"Degree=Pos|Number=Sing",
156
+ "Number=Sing|Number[psor]=Sing|POS=NOUN|Person[psor]=1":"Number=Sing|Number[psor]=Sing|Person[psor]=1",
157
+ "Number=Sing|POS=SCONJ|Voice=Pass":"Number=Sing|Voice=Pass",
158
+ "Degree=Sup|Number=Sing|POS=ADP":"Degree=Sup|Number=Sing",
159
+ "Number=Sing|POS=SCONJ|Voice=Act":"Number=Sing|Voice=Act",
160
+ "NumType=Card|POS=DET|PronType=Int":"NumType=Card|PronType=Int",
161
+ "Degree=Pos|Number=Sing|POS=PART|Polarity=Neg":"Degree=Pos|Number=Sing|Polarity=Neg",
162
+ "Degree=Sup|Number=Sing|POS=SCONJ":"Degree=Sup|Number=Sing",
163
+ "Number=Sing|Number[psor]=Sing|POS=NOUN|Person[psor]=1|Voice=Act":"Number=Sing|Number[psor]=Sing|Person[psor]=1|Voice=Act",
164
+ "Number=Plur|POS=ADJ":"Number=Plur",
165
+ "POS=VERB|PronType=Int":"PronType=Int",
166
+ "Number=Sing|POS=VERB|Person=2|Voice=Act":"Number=Sing|Person=2|Voice=Act",
167
+ "Degree=Pos|Number=Sing|Number[psor]=Sing|POS=ADJ|Person[psor]=2":"Degree=Pos|Number=Sing|Number[psor]=Sing|Person[psor]=2",
168
+ "Gender=Masc|Number=Sing|POS=ADJ":"Gender=Masc|Number=Sing",
169
+ "Number[psor]=Sing|POS=ADV|Person[psor]=3|PronType=Tot":"Number[psor]=Sing|Person[psor]=3|PronType=Tot",
170
+ "POS=DET|PronType=Rel":"PronType=Rel",
171
+ "Number=Sing|POS=NOUN|Polarity=Neg":"Number=Sing|Polarity=Neg",
172
+ "Number=Sing|Number[psor]=Sing|POS=PROPN|Person[psor]=2":"Number=Sing|Number[psor]=Sing|Person[psor]=2",
173
+ "NumType=Card|Number=Sing|POS=NUM|Voice=Act":"NumType=Card|Number=Sing|Voice=Act",
174
+ "Degree=Pos|Number=Plur|POS=ADJ":"Degree=Pos|Number=Plur",
175
+ "Number[psor]=Sing|POS=DET|Person[psor]=3|PronType=Tot":"Number[psor]=Sing|Person[psor]=3|PronType=Tot",
176
+ "Number[psor]=Sing|POS=PROPN|Person[psor]=1":"Number[psor]=Sing|Person[psor]=1",
177
+ "Gender=Fem|Number=Sing|POS=NOUN":"Gender=Fem|Number=Sing",
178
+ "Number=Sing|POS=VERB|Person=1":"Number=Sing|Person=1",
179
+ "Degree=Pos|Number=Sing|Number[psor]=Sing|POS=PROPN|Person[psor]=3":"Degree=Pos|Number=Sing|Number[psor]=Sing|Person[psor]=3",
180
+ "NumType=Card|Number[psor]=Sing|POS=DET|Person[psor]=3|PronType=Ind":"NumType=Card|Number[psor]=Sing|Person[psor]=3|PronType=Ind",
181
+ "POS=ADV|PronType=Tot":"PronType=Tot",
182
+ "Degree=Pos|Number=Plur|POS=ADV":"Degree=Pos|Number=Plur",
183
+ "Number=Plur|POS=ADV|Voice=Act":"Number=Plur|Voice=Act",
184
+ "POS=CCONJ|PronType=Int":"PronType=Int",
185
+ "Degree=Pos|Number=Sing|POS=PART":"Degree=Pos|Number=Sing",
186
+ "Number[psor]=Sing|POS=PRON|Person[psor]=2":"Number[psor]=Sing|Person[psor]=2",
187
+ "Number=Plur|POS=VERB":"Number=Plur",
188
+ "Number=Sing|Number[psor]=Sing|POS=ADJ|Person[psor]=3|Voice=Pass":"Number=Sing|Number[psor]=Sing|Person[psor]=3|Voice=Pass",
189
+ "Degree=Pos|Number=Sing|POS=PUNCT":"Degree=Pos|Number=Sing",
190
+ "Number[psor]=Sing|POS=ADP|Person[psor]=1":"Number[psor]=Sing|Person[psor]=1",
191
+ "Degree=Sup|Number=Sing|POS=NOUN":"Degree=Sup|Number=Sing",
192
+ "Number[psor]=Sing|POS=PART|Person[psor]=3|Polarity=Neg":"Number[psor]=Sing|Person[psor]=3|Polarity=Neg",
193
+ "Number=Sing|Number[psor]=Sing|POS=ADP|Person[psor]=3|Voice=Act":"Number=Sing|Number[psor]=Sing|Person[psor]=3|Voice=Act",
194
+ "POS=NOUN|Polarity=Neg":"Polarity=Neg",
195
+ "Number[psor]=Sing|POS=PROPN|Person[psor]=2":"Number[psor]=Sing|Person[psor]=2",
196
+ "Number=Sing|Number[psor]=Sing|POS=NOUN|Person[psor]=2|Voice=Act":"Number=Sing|Number[psor]=Sing|Person[psor]=2|Voice=Act"
197
  },
198
  "labels_pos":{
199
  "POS=PROPN":96,
200
  "POS=AUX":87,
201
+ "POS=DET|PronType=Ind":90,
202
  "Number=Sing|POS=NOUN":92,
203
  "POS=PRON|PronType=Rel":95,
204
+ "Number=Sing|POS=VERB|Voice=Pass":100,
205
  "POS=ADP":85,
206
  "POS=PUNCT":97,
207
+ "Number=Sing|POS=PROPN":96,
208
  "POS=NOUN":92,
209
  "POS=ADV":86,
210
  "POS=CCONJ":89,
211
+ "Number=Sing|POS=VERB|Voice=Act":100,
 
212
  "POS=VERB":100,
213
  "POS=DET|PronType=Tot":90,
214
+ "Number=Sing|Number[psor]=Sing|POS=NOUN|Person[psor]=3":92,
215
+ "POS=SCONJ":98,
216
  "Number=Plur|POS=PRON|Person=3|PronType=Prs":95,
 
217
  "POS=DET|PronType=Dem":90,
218
  "NumType=Card|POS=NUM":93,
219
+ "Degree=Pos|Number=Sing|POS=NOUN":92,
220
+ "Degree=Pos|Number=Sing|POS=ADJ":84,
221
+ "NumType=Card|POS=DET|PronType=Ind":90,
222
+ "Degree=Pos|Number=Sing|POS=ADP":85,
223
+ "Number[psor]=Sing|POS=NOUN|Person[psor]=3":92,
224
+ "Number=Sing|POS=VERB":100,
225
  "POS=PRON|PronType=Int":95,
226
+ "Number=Sing|POS=ADV|Voice=Act":86,
227
+ "Number=Sing|Number[psor]=Sing|POS=VERB|Person[psor]=3|Voice=Act":100,
228
+ "Number=Sing|POS=ADP|Voice=Act":85,
229
+ "POS=ADJ":84,
230
+ "Number[psor]=Sing|POS=ADP|Person[psor]=3":85,
231
+ "Degree=Pos|Number=Sing|POS=DET":90,
232
+ "Degree=Pos|Number=Sing|POS=VERB":100,
233
  "POS=PRON|PronType=Dem":95,
234
+ "POS=PART|Polarity=Neg":94,
235
+ "Degree=Pos|Number=Sing|Number[psor]=Sing|POS=NOUN|Person[psor]=3":92,
236
  "Number=Sing|POS=PRON|Person=1|Polite=Form|PronType=Prs":95,
237
+ "Number=Sing|POS=ADJ":84,
238
+ "Number=Sing|POS=PRON|Person=3|PronType=Prs":95,
239
+ "POS=SYM":99,
240
  "POS=ADV|PronType=Int":86,
241
  "Clusivity=In|Number=Plur|POS=PRON|Person=1|PronType=Prs":95,
242
+ "Number=Sing|POS=ADJ|Voice=Act":84,
243
+ "Degree=Pos|Number=Sing|POS=PROPN":96,
244
+ "Degree=Pos|Number=Sing|POS=ADV":86,
245
+ "Number=Sing|Number[psor]=Sing|POS=VERB|Person[psor]=3|Voice=Pass":100,
246
+ "Number=Sing|Number[psor]=Sing|POS=NOUN|Person[psor]=3|Voice=Act":92,
247
+ "Number=Sing|POS=PROPN|Voice=Act":96,
248
+ "Number=Sing|POS=NOUN|Voice=Act":92,
249
+ "POS=DET":90,
250
+ "Number=Sing|POS=DET|Voice=Act":90,
251
+ "NumType=Card|POS=PRON|PronType=Ind":95,
252
+ "Number=Sing|Number[psor]=Sing|POS=ADV|Person[psor]=3":86,
253
+ "Number=Sing|POS=DET":90,
254
+ "Number=Sing|POS=ADJ|Voice=Pass":84,
255
+ "POS=CCONJ|PronType=Dem":89,
256
+ "Number=Sing|POS=ADP":85,
257
+ "Number=Sing|POS=ADV":86,
258
  "Number=Sing|POS=PRON|Person=2|Polite=Infm|PronType=Prs":95,
259
+ "Number[psor]=Sing|POS=NOUN|Person[psor]=2":92,
260
+ "Number=Plur|Number[psor]=Sing|POS=NOUN|Person[psor]=2":92,
261
+ "Number=Sing|POS=PRON":95,
262
+ "POS=PRON":95,
263
+ "NumType=Card|POS=ADV|PronType=Ind":86,
264
+ "NumType=Card|Number[psor]=Sing|POS=NUM|Person[psor]=3":93,
265
  "Number=Sing|POS=PRON|Person=3|Polite=Form|PronType=Prs":95,
266
+ "POS=DET|PronType=Int":90,
267
+ "Number=Sing|Number[psor]=Sing|POS=PROPN|Person[psor]=3":96,
268
+ "Number=Sing|Number[psor]=Sing|POS=PROPN|Person[psor]=1":96,
269
+ "Degree=Pos|Number=Sing|POS=SCONJ":98,
270
+ "POS=PRON|PronType=Ind":95,
271
+ "Number=Sing|Number[psor]=Sing|POS=NOUN|Person[psor]=3|Voice=Pass":92,
272
+ "POS=VERB|PronType=Ind":100,
273
+ "Degree=Pos|Number=Sing|Number[psor]=Sing|POS=ADJ|Person[psor]=3":84,
274
+ "Number=Sing|POS=SCONJ":98,
275
+ "Degree=Sup|Number=Sing|Number[psor]=Sing|POS=ADJ|Person[psor]=3":84,
276
+ "Degree=Pos|Number=Sing|Number[psor]=Sing|POS=ADP|Person[psor]=3":85,
277
+ "Number=Plur|Number[psor]=Sing|POS=NOUN|Person[psor]=3":92,
278
+ "Number=Plur|POS=NOUN":92,
279
  "POS=ADV|PronType=Dem":86,
280
+ "Number=Sing|POS=VERB|Person=1|Voice=Act":100,
281
+ "Degree=Sup|Number=Sing|POS=ADJ":84,
282
+ "Number=Sing|POS=ADP|Voice=Pass":85,
283
+ "Number[psor]=Sing|POS=PART|Person[psor]=3":94,
284
+ "Number=Sing|POS=NOUN|Voice=Pass":92,
285
+ "Degree=Pos|Number=Sing|Number[psor]=Sing|POS=CCONJ|Person[psor]=3":89,
286
+ "POS=PART":94,
287
+ "Number=Sing|Number[psor]=Sing|POS=PART|Person[psor]=3|Voice=Pass":94,
288
+ "Degree=Sup|Number=Sing|POS=ADV":86,
289
+ "Number=Sing|POS=PRON|Voice=Act":95,
290
+ "Number=Sing|Number[psor]=Sing|POS=PROPN|Person[psor]=3|Voice=Act":96,
291
+ "Gender=Masc|Number=Sing|POS=PROPN":96,
292
+ "Number[psor]=Sing|POS=PRON|Person[psor]=3|PronType=Tot":95,
293
+ "Degree=Pos|Number=Sing|POS=X":101,
294
  "POS=PRON|PronType=Tot":95,
295
+ "Degree=Pos|Number=Sing|Number[psor]=Sing|POS=ADV|Person[psor]=3":86,
296
+ "Degree=Pos|Number=Sing|Number[psor]=Sing|POS=VERB|Person[psor]=3":100,
297
+ "Number=Sing|Number[psor]=Sing|POS=ADP|Person[psor]=3":85,
298
+ "Number=Sing|Number[psor]=Sing|POS=NOUN|Person[psor]=2":92,
299
+ "POS=SCONJ|PronType=Int":98,
300
+ "Number=Plur|POS=PRON|Person=2|PronType=Prs":95,
301
+ "Number=Sing|Number[psor]=Sing|POS=VERB|Person[psor]=1|Voice=Act":100,
302
+ "Number[psor]=Sing|POS=DET|Person[psor]=3":90,
303
+ "Number=Sing|Number[psor]=Sing|POS=PRON|Person[psor]=3":95,
304
  "Clusivity=Ex|Number=Plur|POS=PRON|Person=1|PronType=Prs":95,
305
+ "Number=Plur|POS=VERB|Voice=Act":100,
306
+ "Number=Sing|Number[psor]=Sing|POS=ADV|Person[psor]=3|Voice=Act":86,
307
+ "Degree=Pos|Number=Sing|POS=NOUN|Polarity=Neg":92,
308
+ "POS=X":101,
309
+ "Number[psor]=Sing|POS=ADJ|Person[psor]=3":84,
310
+ "Number=Sing|Number[psor]=Sing|POS=VERB|Person[psor]=3":100,
311
  "Number=Sing|POS=PRON|Person=2|Polite=Form|PronType=Prs":95,
312
+ "Number=Sing|POS=PRON|Person=1|Polite=Infm|PronType=Prs":95,
313
+ "Number=Sing|POS=PROPN|Voice=Pass":96,
314
+ "POS=ADV|Polarity=Neg":86,
315
+ "NumType=Card|Number=Sing|POS=NUM":93,
316
+ "Number[psor]=Sing|POS=ADV|Person[psor]=2":86,
317
+ "Number[psor]=Sing|POS=ADV|Person[psor]=3":86,
318
+ "Degree=Sup|Number=Sing|POS=PROPN":96,
319
+ "POS=PROPN|Polarity=Neg":96,
320
+ "Number=Sing|Number[psor]=Sing|POS=VERB|Person[psor]=2|Voice=Act":100,
321
+ "Number=Sing|POS=PROPN|Person=1|Voice=Act":96,
322
+ "POS=SCONJ|PronType=Dem":98,
323
+ "Number=Sing|Number[psor]=Sing|POS=ADV|Person[psor]=2|Voice=Act":86,
324
+ "Number=Sing|POS=CCONJ":89,
325
+ "Degree=Sup|Number=Sing|POS=VERB":100,
326
+ "Number=Sing|Number[psor]=Sing|POS=ADJ|Person[psor]=3":84,
327
+ "Number=Sing|Number[psor]=Sing|POS=ADJ|Person[psor]=3|Voice=Act":84,
328
+ "Degree=Pos|Number=Sing|POS=PRON":95,
329
+ "Number=Sing|POS=ADV|Voice=Pass":86,
330
+ "Number[psor]=Sing|POS=ADP|Person[psor]=2":85,
331
+ "Number=Sing|POS=SYM":99,
332
+ "POS=ADJ|Polarity=Neg":84,
333
+ "Degree=Pos|NumType=Card|Number=Sing|POS=NUM":93,
334
+ "Number=Sing|Number[psor]=Sing|POS=SCONJ|Person[psor]=3":98,
335
+ "Degree=Pos|Number=Sing|POS=CCONJ":89,
336
+ "Number[psor]=Sing|POS=NOUN|Person[psor]=1":92,
337
+ "Number=Sing|POS=CCONJ|Voice=Act":89,
338
+ "Gender=Masc|Number=Sing|POS=NOUN":92,
339
+ "Number=Sing|Number[psor]=Sing|POS=ADP|Person[psor]=3|Voice=Pass":85,
340
+ "Gender=Fem|Number=Sing|POS=PROPN":96,
341
+ "POS=VERB|PronType=Dem":100,
342
  "Number=Sing|POS=PRON|Person=2|PronType=Prs":95,
343
+ "Gender=Masc|Number=Sing|Number[psor]=Sing|POS=NOUN|Person[psor]=3":92,
344
+ "Number=Sing|POS=PART|Voice=Act":94,
345
+ "Degree=Sup|Number=Sing|Number[psor]=Sing|POS=NOUN|Person[psor]=3":92,
346
+ "POS=ADP|PronType=Int":85,
347
+ "Number[psor]=Sing|POS=VERB|Person[psor]=3":100,
348
+ "Number[psor]=Sing|POS=PRON|Person[psor]=3|PronType=Rel":95,
349
+ "Degree=Pos|Number=Sing|POS=AUX":87,
350
+ "Number=Sing|Number[psor]=Sing|POS=NOUN|Person[psor]=1":92,
351
+ "Number=Sing|POS=SCONJ|Voice=Pass":98,
352
+ "Degree=Sup|Number=Sing|POS=ADP":85,
353
+ "Number=Sing|POS=SCONJ|Voice=Act":98,
354
+ "NumType=Card|POS=DET|PronType=Int":90,
355
+ "Degree=Pos|Number=Sing|POS=PART|Polarity=Neg":94,
356
+ "Degree=Sup|Number=Sing|POS=SCONJ":98,
357
+ "Number=Sing|Number[psor]=Sing|POS=NOUN|Person[psor]=1|Voice=Act":92,
358
+ "Number=Plur|POS=ADJ":84,
359
+ "POS=VERB|PronType=Int":100,
360
+ "Number=Sing|POS=VERB|Person=2|Voice=Act":100,
361
+ "Degree=Pos|Number=Sing|Number[psor]=Sing|POS=ADJ|Person[psor]=2":84,
362
+ "Gender=Masc|Number=Sing|POS=ADJ":84,
363
+ "Number[psor]=Sing|POS=ADV|Person[psor]=3|PronType=Tot":86,
364
+ "POS=DET|PronType=Rel":90,
365
+ "Number=Sing|POS=NOUN|Polarity=Neg":92,
366
+ "Number=Sing|Number[psor]=Sing|POS=PROPN|Person[psor]=2":96,
367
+ "NumType=Card|Number=Sing|POS=NUM|Voice=Act":93,
368
+ "Degree=Pos|Number=Plur|POS=ADJ":84,
369
+ "Number[psor]=Sing|POS=DET|Person[psor]=3|PronType=Tot":90,
370
+ "Number[psor]=Sing|POS=PROPN|Person[psor]=1":96,
371
+ "Gender=Fem|Number=Sing|POS=NOUN":92,
372
+ "Number=Sing|POS=VERB|Person=1":100,
373
+ "Degree=Pos|Number=Sing|Number[psor]=Sing|POS=PROPN|Person[psor]=3":96,
374
+ "NumType=Card|Number[psor]=Sing|POS=DET|Person[psor]=3|PronType=Ind":90,
375
+ "POS=ADV|PronType=Tot":86,
376
+ "Degree=Pos|Number=Plur|POS=ADV":86,
377
+ "Number=Plur|POS=ADV|Voice=Act":86,
378
+ "POS=CCONJ|PronType=Int":89,
379
+ "Degree=Pos|Number=Sing|POS=PART":94,
380
+ "Number[psor]=Sing|POS=PRON|Person[psor]=2":95,
381
+ "Number=Plur|POS=VERB":100,
382
+ "Number=Sing|Number[psor]=Sing|POS=ADJ|Person[psor]=3|Voice=Pass":84,
383
+ "Degree=Pos|Number=Sing|POS=PUNCT":97,
384
+ "Number[psor]=Sing|POS=ADP|Person[psor]=1":85,
385
+ "Degree=Sup|Number=Sing|POS=NOUN":92,
386
+ "Number[psor]=Sing|POS=PART|Person[psor]=3|Polarity=Neg":94,
387
+ "Number=Sing|Number[psor]=Sing|POS=ADP|Person[psor]=3|Voice=Act":85,
388
+ "POS=NOUN|Polarity=Neg":92,
389
+ "Number[psor]=Sing|POS=PROPN|Person[psor]=2":96,
390
+ "Number=Sing|Number[psor]=Sing|POS=NOUN|Person[psor]=2|Voice=Act":92
391
  },
392
  "overwrite":true
393
  }
morphologizer/model CHANGED
Binary files a/morphologizer/model and b/morphologizer/model differ
 
ner/model CHANGED
Binary files a/ner/model and b/ner/model differ
 
ner/moves CHANGED
@@ -1 +1 @@
1
- ��moves�3{"0":{},"1":{},"2":{},"3":{},"4":{"":1},"5":{"":1}}�cfg��neg_key�
 
1
+ ��moves��{"0":{},"1":{"GPE":4114,"PERSON":3450,"ORG":1984,"ORDINAL":1951,"DATE":1679,"PRODUCT":907,"CARDINAL":725,"WORK_OF_ART":649,"LOC":619,"EVENT":616,"FAC":602,"NORP":486,"QUANTITY":370,"LAW":314,"PERCENT":138,"LANGUAGE":133,"TIME":50,"MONEY":45},"2":{"GPE":4114,"PERSON":3450,"ORG":1984,"ORDINAL":1951,"DATE":1679,"PRODUCT":907,"CARDINAL":725,"WORK_OF_ART":649,"LOC":619,"EVENT":616,"FAC":602,"NORP":486,"QUANTITY":370,"LAW":314,"PERCENT":138,"LANGUAGE":133,"TIME":50,"MONEY":45},"3":{"GPE":4114,"PERSON":3450,"ORG":1984,"ORDINAL":1951,"DATE":1679,"PRODUCT":907,"CARDINAL":725,"WORK_OF_ART":649,"LOC":619,"EVENT":616,"FAC":602,"NORP":486,"QUANTITY":370,"LAW":314,"PERCENT":138,"LANGUAGE":133,"TIME":50,"MONEY":45},"4":{"GPE":4114,"PERSON":3450,"ORG":1984,"ORDINAL":1951,"DATE":1679,"PRODUCT":907,"CARDINAL":725,"WORK_OF_ART":649,"LOC":619,"EVENT":616,"FAC":602,"NORP":486,"QUANTITY":370,"LAW":314,"PERCENT":138,"LANGUAGE":133,"TIME":50,"MONEY":45,"":1},"5":{"":1}}�cfg��neg_key�
parser/model CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b2738f320e714bbe52de113a1eeb00ac1cb55706a794cb67b6fc3442a29ec0e0
3
- size 1750016
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e6b7fcac65a90ba54bf257ff22140821ddd9958db2447df85a934e57924243e7
3
+ size 1744340
parser/moves CHANGED
@@ -1 +1 @@
1
- ��moves�{"0":{"":36809},"1":{"":56313},"2":{"case":8690,"punct":6049,"nsubj":5534,"advmod":2999,"cc":2690,"nsubj:pass":1726,"mark":1658,"nummod":1525,"det":1313,"aux":921,"obl":852,"cop":845,"amod":398,"obj":251,"advcl":250,"nmod":217,"obl:tmod":211,"compound":124,"xcomp":112,"case:adv":72,"advmod:emph":57,"acl":51,"parataxis":42,"dep":41,"nmod:lmod":37},"3":{"punct":7872,"flat:name":6453,"nmod":6282,"compound":5703,"obj":4488,"obl":3927,"conj":3876,"amod":2949,"acl:relcl":2164,"appos":2119,"det":1663,"nummod":1602,"nmod:poss":1139,"xcomp":1014,"acl":923,"advcl":798,"advmod":400,"dep":359,"ccomp":336,"obl:tmod":319,"flat":305,"advmod:emph":292,"parataxis":274,"fixed":237,"case":174,"cc":134,"nmod:tmod":83,"nsubj":74,"mark":70,"obl:agent":45,"flat:foreign":41,"nsubj:pass":40},"4":{"ROOT":4482}}�cfg��neg_key�
 
1
+ ��moves�z{"0":{"":34155},"1":{"":58901},"2":{"case":9174,"nsubj":5567,"advmod":3739,"punct":3606,"cc":2671,"nsubj:pass":1730,"det":1659,"nummod":1496,"mark":1215,"obl":965,"cop":843,"amod":408,"obj":261,"advcl":219,"compound":131,"xcomp":112,"nmod":109,"acl":53,"parataxis":44,"dep":43,"appos":34},"3":{"punct":10991,"flat":9150,"compound":5814,"obj":4390,"obl":4093,"conj":3757,"nmod":3449,"amod":3231,"acl":2622,"appos":2127,"nummod":1988,"det":1957,"xcomp":995,"advcl":837,"compound:plur":530,"fixed":496,"advmod":487,"dep":400,"ccomp":357,"case":340,"parataxis":276,"punct||conj":159,"cc":158,"nsubj":87,"nsubj:pass":39},"4":{"ROOT":4477}}�cfg��neg_key�
tagger/cfg CHANGED
@@ -3,52 +3,86 @@
3
  "labels":[
4
  "APP",
5
  "ASP",
 
6
  "ASP+PS3",
 
7
  "ASS",
 
8
  "B--",
9
  "B--+PS3",
 
10
  "CC-",
11
- "CCONJ",
 
12
  "CD-",
 
13
  "CO-",
 
14
  "D--",
 
15
  "D--+PS3",
 
16
  "F--",
 
17
  "F--+PS2",
 
 
18
  "G--",
19
  "G--+PS3",
 
20
  "H--",
 
21
  "I--",
22
  "M--",
23
  "M--+PS3",
 
24
  "NOUN",
25
  "NPD",
 
 
26
  "NSD",
 
 
27
  "NSD+PS3",
 
28
  "NSF",
29
  "NSM",
 
30
  "NUM",
31
  "O--",
32
  "PP1",
 
33
  "PP2",
34
  "PP3",
 
35
  "PROPN",
36
  "PS1",
37
  "PS1+VSA",
 
38
  "PS2",
 
39
  "PS3",
 
40
  "R--",
 
 
41
  "R--+PS3",
42
  "S--",
43
- "SYM",
44
  "T--",
45
  "VERB",
46
  "VPA",
47
  "VSA",
 
48
  "VSA+PS2",
49
  "VSA+PS3",
 
50
  "VSP",
 
 
51
  "W--",
 
 
52
  "X--",
53
  "Z--"
54
  ],
 
3
  "labels":[
4
  "APP",
5
  "ASP",
6
+ "ASP+PS2",
7
  "ASP+PS3",
8
+ "ASP+T--",
9
  "ASS",
10
+ "ASS+PS3",
11
  "B--",
12
  "B--+PS3",
13
+ "B--+T--",
14
  "CC-",
15
+ "CC-+PS3",
16
+ "CC-+T--",
17
  "CD-",
18
+ "CD-+PS3",
19
  "CO-",
20
+ "CO-+PS3",
21
  "D--",
22
+ "D--+PS2",
23
  "D--+PS3",
24
+ "D--+T--",
25
  "F--",
26
+ "F--+PS1",
27
  "F--+PS2",
28
+ "F--+PS3",
29
+ "F--+T--",
30
  "G--",
31
  "G--+PS3",
32
+ "G--+T--",
33
  "H--",
34
+ "H--+T--",
35
  "I--",
36
  "M--",
37
  "M--+PS3",
38
+ "M--+T--",
39
  "NOUN",
40
  "NPD",
41
+ "NPD+PS2",
42
+ "NPD+PS3",
43
  "NSD",
44
+ "NSD+PS1",
45
+ "NSD+PS2",
46
  "NSD+PS3",
47
+ "NSD+T--",
48
  "NSF",
49
  "NSM",
50
+ "NSM+PS3",
51
  "NUM",
52
  "O--",
53
  "PP1",
54
+ "PP1+T--",
55
  "PP2",
56
  "PP3",
57
+ "PP3+T--",
58
  "PROPN",
59
  "PS1",
60
  "PS1+VSA",
61
+ "PS1+VSA+T--",
62
  "PS2",
63
+ "PS2+VSA",
64
  "PS3",
65
+ "PUNCT",
66
  "R--",
67
+ "R--+PS1",
68
+ "R--+PS2",
69
  "R--+PS3",
70
  "S--",
71
+ "S--+PS3",
72
  "T--",
73
  "VERB",
74
  "VPA",
75
  "VSA",
76
+ "VSA+PS1",
77
  "VSA+PS2",
78
  "VSA+PS3",
79
+ "VSA+T--",
80
  "VSP",
81
+ "VSP+PS3",
82
+ "VSP+T--",
83
  "W--",
84
+ "W--+T--",
85
+ "X",
86
  "X--",
87
  "Z--"
88
  ],
tagger/model CHANGED
Binary files a/tagger/model and b/tagger/model differ
 
tok2vec/model CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:97122c73406442748f5a28b415d61067a62dcbda60fdad337f0a9a9917d12e93
3
  size 34126801
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d68c9f3d46615221b44fd6ba3425358171ae84091e425ee893e17bb35ce16f8c
3
  size 34126801
trainable_lemmatizer/cfg CHANGED
@@ -4,334 +4,223 @@
4
  2,
5
  4,
6
  6,
7
- 9,
8
- 11,
9
- 13,
10
  15,
11
- 17,
12
  19,
13
- 21,
14
  22,
15
  24,
16
  26,
17
- 28,
 
 
18
  31,
19
- 33,
20
  36,
21
- 38,
22
- 39,
23
  40,
24
  42,
25
  44,
26
  46,
27
- 47,
28
- 49,
29
  51,
30
  53,
31
  55,
32
  57,
33
- 59,
 
34
  61,
35
  63,
36
  65,
37
  67,
38
- 68,
39
  70,
40
- 71,
41
  73,
42
  75,
43
- 77,
44
- 64,
45
- 79,
46
- 80,
47
  83,
48
  84,
49
  85,
50
- 87,
51
- 89,
 
52
  91,
53
- 93,
54
- 95,
 
55
  97,
56
  98,
57
  100,
58
  101,
59
- 102,
60
- 105,
 
61
  107,
62
  108,
63
- 110,
64
- 112,
 
65
  114,
66
- 115,
 
67
  117,
68
  118,
 
69
  121,
 
70
  123,
71
  124,
72
  125,
73
- 127,
 
74
  128,
 
75
  129,
76
- 131,
77
- 18,
78
  133,
 
79
  135,
80
- 137,
81
  138,
82
  139,
83
  141,
84
  142,
 
85
  144,
86
- 145,
87
  147,
 
88
  149,
 
 
89
  151,
90
  152,
91
  153,
92
- 154,
93
  156,
94
  157,
 
95
  159,
96
  161,
97
  162,
 
98
  164,
99
  165,
100
  167,
101
- 168,
102
  170,
 
 
103
  172,
104
- 174,
 
105
  176,
 
 
106
  178,
107
  179,
 
 
 
 
108
  182,
109
  183,
 
 
 
110
  185,
 
111
  187,
112
  188,
113
- 190,
 
114
  191,
 
115
  193,
116
  194,
117
  195,
118
- 58,
119
- 197,
120
- 199,
121
  200,
122
  201,
123
  202,
 
 
124
  204,
 
125
  206,
 
126
  208,
127
- 210,
128
- 211,
129
  212,
130
  213,
131
  214,
132
- 37,
133
  216,
134
- 217,
 
135
  220,
136
  221,
137
- 76,
138
  223,
139
- 224,
140
  225,
141
  226,
142
  227,
143
  228,
144
  229,
145
  231,
 
 
146
  234,
147
- 235,
148
  237,
 
149
  239,
150
  240,
151
  241,
152
  243,
 
153
  245,
154
  246,
 
155
  248,
156
- 249,
157
- 251,
158
  253,
 
159
  255,
 
160
  257,
161
  259,
 
 
162
  262,
163
  263,
164
- 264,
165
  266,
166
  267,
167
  268,
 
 
168
  270,
169
  271,
170
- 56,
171
  273,
172
  274,
173
  275,
174
  276,
 
175
  278,
176
  279,
177
  280,
178
- 282,
179
- 283,
180
- 284,
181
- 286,
182
- 287,
183
- 288,
184
- 289,
185
- 291,
186
- 293,
187
- 295,
188
- 297,
189
- 298,
190
- 299,
191
- 16,
192
- 300,
193
- 301,
194
- 302,
195
- 304,
196
- 305,
197
- 307,
198
- 309,
199
- 109,
200
- 310,
201
- 311,
202
- 313,
203
- 315,
204
- 317,
205
- 318,
206
- 66,
207
- 319,
208
- 62,
209
- 321,
210
- 322,
211
- 323,
212
- 324,
213
- 326,
214
- 328,
215
- 330,
216
- 331,
217
- 333,
218
- 334,
219
- 60,
220
- 50,
221
- 336,
222
- 337,
223
- 338,
224
- 339,
225
- 340,
226
- 341,
227
- 342,
228
- 343,
229
- 345,
230
- 346,
231
- 209,
232
- 348,
233
- 349,
234
- 350,
235
- 351,
236
- 352,
237
- 354,
238
- 356,
239
- 358,
240
- 359,
241
- 360,
242
- 361,
243
- 0,
244
- 362,
245
- 363,
246
- 365,
247
- 367,
248
- 369,
249
- 371,
250
- 372,
251
- 373,
252
- 375,
253
- 377,
254
- 378,
255
- 381,
256
- 382,
257
- 69,
258
- 383,
259
- 386,
260
- 387,
261
- 389,
262
- 390,
263
- 391,
264
- 392,
265
- 393,
266
- 394,
267
- 396,
268
- 397,
269
- 399,
270
- 400,
271
- 401,
272
- 402,
273
- 403,
274
- 404,
275
- 405,
276
- 407,
277
- 408,
278
- 409,
279
- 411,
280
- 413,
281
- 414,
282
- 416,
283
- 418,
284
- 419,
285
- 420,
286
- 421,
287
- 422,
288
- 423,
289
- 424,
290
- 425,
291
- 426,
292
- 427,
293
- 429,
294
- 431,
295
- 432,
296
- 435,
297
- 436,
298
- 437,
299
- 438,
300
- 439,
301
- 440,
302
- 441,
303
- 443,
304
- 444,
305
- 446,
306
- 448,
307
- 449,
308
- 450,
309
- 452,
310
- 453,
311
- 455,
312
- 457,
313
- 459,
314
- 460,
315
- 461,
316
- 462,
317
- 463,
318
- 464,
319
- 466,
320
- 468,
321
- 92,
322
- 469,
323
- 470,
324
- 472,
325
- 474,
326
- 475,
327
- 476,
328
- 477,
329
- 478,
330
- 480,
331
- 482,
332
- 483,
333
- 484,
334
- 485,
335
- 486
336
  ]
337
  }
 
4
  2,
5
  4,
6
  6,
7
+ 8,
8
+ 10,
9
+ 12,
10
  15,
 
11
  19,
 
12
  22,
13
  24,
14
  26,
15
+ 27,
16
+ 29,
17
+ 30,
18
  31,
19
+ 34,
20
  36,
21
+ 37,
 
22
  40,
23
  42,
24
  44,
25
  46,
26
+ 48,
27
+ 50,
28
  51,
29
  53,
30
  55,
31
  57,
32
+ 47,
33
+ 58,
34
  61,
35
  63,
36
  65,
37
  67,
38
+ 69,
39
  70,
40
+ 72,
41
  73,
42
  75,
43
+ 76,
44
+ 78,
45
+ 81,
 
46
  83,
47
  84,
48
  85,
49
+ 88,
50
+ 11,
51
+ 90,
52
  91,
53
+ 92,
54
+ 94,
55
+ 96,
56
  97,
57
  98,
58
  100,
59
  101,
60
+ 103,
61
+ 104,
62
+ 106,
63
  107,
64
  108,
65
+ 109,
66
+ 111,
67
+ 113,
68
  114,
69
+ 43,
70
+ 116,
71
  117,
72
  118,
73
+ 119,
74
  121,
75
+ 122,
76
  123,
77
  124,
78
  125,
79
+ 25,
80
+ 126,
81
  128,
82
+ 56,
83
  129,
84
+ 130,
85
+ 132,
86
  133,
87
+ 134,
88
  135,
89
+ 136,
90
  138,
91
  139,
92
  141,
93
  142,
94
+ 143,
95
  144,
96
+ 146,
97
  147,
98
+ 148,
99
  149,
100
+ 41,
101
+ 150,
102
  151,
103
  152,
104
  153,
105
+ 155,
106
  156,
107
  157,
108
+ 158,
109
  159,
110
  161,
111
  162,
112
+ 163,
113
  164,
114
  165,
115
  167,
116
+ 169,
117
  170,
118
+ 171,
119
+ 9,
120
  172,
121
+ 173,
122
+ 175,
123
  176,
124
+ 177,
125
+ 77,
126
  178,
127
  179,
128
+ 49,
129
+ 180,
130
+ 23,
131
+ 181,
132
  182,
133
  183,
134
+ 184,
135
+ 45,
136
+ 35,
137
  185,
138
+ 186,
139
  187,
140
  188,
141
+ 189,
142
+ 120,
143
  191,
144
+ 192,
145
  193,
146
  194,
147
  195,
148
+ 196,
149
+ 198,
 
150
  200,
151
  201,
152
  202,
153
+ 0,
154
+ 203,
155
  204,
156
+ 205,
157
  206,
158
+ 207,
159
  208,
160
+ 209,
161
+ 52,
162
  212,
163
  213,
164
  214,
165
+ 215,
166
  216,
167
+ 218,
168
+ 219,
169
  220,
170
  221,
171
+ 222,
172
  223,
 
173
  225,
174
  226,
175
  227,
176
  228,
177
  229,
178
  231,
179
+ 232,
180
+ 233,
181
  234,
182
+ 236,
183
  237,
184
+ 238,
185
  239,
186
  240,
187
  241,
188
  243,
189
+ 244,
190
  245,
191
  246,
192
+ 247,
193
  248,
194
+ 250,
195
+ 252,
196
  253,
197
+ 254,
198
  255,
199
+ 256,
200
  257,
201
  259,
202
+ 260,
203
+ 261,
204
  262,
205
  263,
206
+ 265,
207
  266,
208
  267,
209
  268,
210
+ 269,
211
+ 68,
212
  270,
213
  271,
214
+ 272,
215
  273,
216
  274,
217
  275,
218
  276,
219
+ 277,
220
  278,
221
  279,
222
  280,
223
+ 281,
224
+ 282
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
225
  ]
226
  }
trainable_lemmatizer/model CHANGED
Binary files a/trainable_lemmatizer/model and b/trainable_lemmatizer/model differ
 
trainable_lemmatizer/trees CHANGED
Binary files a/trainable_lemmatizer/trees and b/trainable_lemmatizer/trees differ
 
vocab/strings.json CHANGED
The diff for this file is too large to render. See raw diff