Adriane Boyd committed on
Commit
c2cc21c
1 Parent(s): cc45a23

Update spaCy pipeline

Browse files
README.md CHANGED
@@ -14,62 +14,62 @@ model-index:
14
  metrics:
15
  - name: NER Precision
16
  type: precision
17
- value: 0.8106995885
18
  - name: NER Recall
19
  type: recall
20
- value: 0.8208333333
21
  - name: NER F Score
22
  type: f_score
23
- value: 0.8157349896
24
  - task:
25
  name: TAG
26
  type: token-classification
27
  metrics:
28
  - name: TAG (XPOS) Accuracy
29
  type: accuracy
30
- value: 0.9763184658
31
  - task:
32
  name: POS
33
  type: token-classification
34
  metrics:
35
  - name: POS (UPOS) Accuracy
36
  type: accuracy
37
- value: 0.9763184658
38
  - task:
39
  name: MORPH
40
  type: token-classification
41
  metrics:
42
  - name: Morph (UFeats) Accuracy
43
  type: accuracy
44
- value: 0.97360647
45
  - task:
46
  name: LEMMA
47
  type: token-classification
48
  metrics:
49
  - name: Lemma Accuracy
50
  type: accuracy
51
- value: 0.9458595642
52
  - task:
53
  name: UNLABELED_DEPENDENCIES
54
  type: token-classification
55
  metrics:
56
  - name: Unlabeled Attachment Score (UAS)
57
  type: f_score
58
- value: 0.8620092701
59
  - task:
60
  name: LABELED_DEPENDENCIES
61
  type: token-classification
62
  metrics:
63
  - name: Labeled Attachment Score (LAS)
64
  type: f_score
65
- value: 0.8339289703
66
  - task:
67
  name: SENTS
68
  type: token-classification
69
  metrics:
70
  - name: Sentences F-Score
71
  type: f_score
72
- value: 0.8692579505
73
  ---
74
  ### Details: https://spacy.io/models/da#da_core_news_trf
75
 
@@ -78,8 +78,8 @@ Danish transformer pipeline (Maltehb/danish-bert-botxo). Components: transformer
78
  | Feature | Description |
79
  | --- | --- |
80
  | **Name** | `da_core_news_trf` |
81
- | **Version** | `3.3.0` |
82
- | **spaCy** | `>=3.3.0.dev0,<3.4.0` |
83
  | **Default Pipeline** | `transformer`, `morphologizer`, `parser`, `lemmatizer`, `attribute_ruler`, `ner` |
84
  | **Components** | `transformer`, `morphologizer`, `parser`, `lemmatizer`, `attribute_ruler`, `ner` |
85
  | **Vectors** | 0 keys, 0 unique vectors (0 dimensions) |
@@ -109,18 +109,18 @@ Danish transformer pipeline (Maltehb/danish-bert-botxo). Components: transformer
109
  | `TOKEN_P` | 99.78 |
110
  | `TOKEN_R` | 99.75 |
111
  | `TOKEN_F` | 99.76 |
112
- | `POS_ACC` | 97.63 |
113
- | `MORPH_ACC` | 97.36 |
114
- | `MORPH_MICRO_P` | 98.75 |
115
- | `MORPH_MICRO_R` | 98.03 |
116
- | `MORPH_MICRO_F` | 98.39 |
117
- | `SENTS_P` | 86.62 |
118
- | `SENTS_R` | 87.23 |
119
- | `SENTS_F` | 86.93 |
120
- | `DEP_UAS` | 86.20 |
121
- | `DEP_LAS` | 83.39 |
122
- | `LEMMA_ACC` | 94.59 |
123
- | `TAG_ACC` | 97.63 |
124
- | `ENTS_P` | 81.07 |
125
- | `ENTS_R` | 82.08 |
126
- | `ENTS_F` | 81.57 |
 
14
  metrics:
15
  - name: NER Precision
16
  type: precision
17
+ value: 0.8118609407
18
  - name: NER Recall
19
  type: recall
20
+ value: 0.8270833333
21
  - name: NER F Score
22
  type: f_score
23
+ value: 0.8194014448
24
  - task:
25
  name: TAG
26
  type: token-classification
27
  metrics:
28
  - name: TAG (XPOS) Accuracy
29
  type: accuracy
30
+ value: 0.9746222394
31
  - task:
32
  name: POS
33
  type: token-classification
34
  metrics:
35
  - name: POS (UPOS) Accuracy
36
  type: accuracy
37
+ value: 0.9746222394
38
  - task:
39
  name: MORPH
40
  type: token-classification
41
  metrics:
42
  - name: Morph (UFeats) Accuracy
43
  type: accuracy
44
+ value: 0.971716389
45
  - task:
46
  name: LEMMA
47
  type: token-classification
48
  metrics:
49
  - name: Lemma Accuracy
50
  type: accuracy
51
+ value: 0.9459564165
52
  - task:
53
  name: UNLABELED_DEPENDENCIES
54
  type: token-classification
55
  metrics:
56
  - name: Unlabeled Attachment Score (UAS)
57
  type: f_score
58
+ value: 0.8596491228
59
  - task:
60
  name: LABELED_DEPENDENCIES
61
  type: token-classification
62
  metrics:
63
  - name: Labeled Attachment Score (LAS)
64
  type: f_score
65
+ value: 0.8301675978
66
  - task:
67
  name: SENTS
68
  type: token-classification
69
  metrics:
70
  - name: Sentences F-Score
71
  type: f_score
72
+ value: 0.832319722
73
  ---
74
  ### Details: https://spacy.io/models/da#da_core_news_trf
75
 
 
78
  | Feature | Description |
79
  | --- | --- |
80
  | **Name** | `da_core_news_trf` |
81
+ | **Version** | `3.4.0` |
82
+ | **spaCy** | `>=3.4.0,<3.5.0` |
83
  | **Default Pipeline** | `transformer`, `morphologizer`, `parser`, `lemmatizer`, `attribute_ruler`, `ner` |
84
  | **Components** | `transformer`, `morphologizer`, `parser`, `lemmatizer`, `attribute_ruler`, `ner` |
85
  | **Vectors** | 0 keys, 0 unique vectors (0 dimensions) |
 
109
  | `TOKEN_P` | 99.78 |
110
  | `TOKEN_R` | 99.75 |
111
  | `TOKEN_F` | 99.76 |
112
+ | `POS_ACC` | 97.46 |
113
+ | `MORPH_ACC` | 97.17 |
114
+ | `MORPH_MICRO_P` | 98.72 |
115
+ | `MORPH_MICRO_R` | 97.61 |
116
+ | `MORPH_MICRO_F` | 98.16 |
117
+ | `SENTS_P` | 81.60 |
118
+ | `SENTS_R` | 84.93 |
119
+ | `SENTS_F` | 83.23 |
120
+ | `DEP_UAS` | 85.96 |
121
+ | `DEP_LAS` | 83.02 |
122
+ | `LEMMA_ACC` | 94.60 |
123
+ | `TAG_ACC` | 97.46 |
124
+ | `ENTS_P` | 81.19 |
125
+ | `ENTS_R` | 82.71 |
126
+ | `ENTS_F` | 81.94 |
accuracy.json CHANGED
@@ -3,51 +3,51 @@
3
  "token_p": 0.9977732598,
4
  "token_r": 0.9974835463,
5
  "token_f": 0.997628382,
6
- "pos_acc": 0.9763184658,
7
- "morph_acc": 0.97360647,
8
- "morph_micro_p": 0.9874911014,
9
- "morph_micro_r": 0.98026349,
10
- "morph_micro_f": 0.9838640221,
11
  "morph_per_feat": {
12
  "Mood": {
13
- "p": 0.9942638623,
14
- "r": 0.9914204004,
15
- "f": 0.9928400955
16
  },
17
  "Tense": {
18
- "p": 0.9826415094,
19
- "r": 0.9804216867,
20
- "f": 0.981530343
21
  },
22
  "VerbForm": {
23
- "p": 0.9840196681,
24
- "r": 0.9798041616,
25
- "f": 0.9819073904
26
  },
27
  "Voice": {
28
- "p": 0.9940074906,
29
- "r": 0.9917787743,
30
- "f": 0.9928918818
31
  },
32
  "Definite": {
33
- "p": 0.9900039984,
34
- "r": 0.9782694587,
35
- "f": 0.9841017488
36
  },
37
  "Gender": {
38
- "p": 0.979516454,
39
- "r": 0.9694250582,
40
- "f": 0.97444463
41
  },
42
  "Number": {
43
- "p": 0.9889473684,
44
- "r": 0.9801773605,
45
- "f": 0.9845428347
46
  },
47
  "AdpType": {
48
- "p": 0.996460177,
49
- "r": 0.9955791335,
50
- "f": 0.9960194604
51
  },
52
  "PartType": {
53
  "p": 1.0,
@@ -55,19 +55,19 @@
55
  "f": 0.9983739837
56
  },
57
  "Case": {
58
- "p": 0.992,
59
- "r": 0.9794628752,
60
- "f": 0.9856915739
61
  },
62
  "Person": {
63
- "p": 0.9857397504,
64
- "r": 0.9822380107,
65
- "f": 0.9839857651
66
  },
67
  "PronType": {
68
- "p": 0.9925619835,
69
- "r": 0.9876644737,
70
- "f": 0.9901071723
71
  },
72
  "NumType": {
73
  "p": 0.9865771812,
@@ -75,9 +75,9 @@
75
  "f": 0.98
76
  },
77
  "Degree": {
78
- "p": 0.9732685298,
79
- "r": 0.965060241,
80
- "f": 0.9691470054
81
  },
82
  "Reflex": {
83
  "p": 1.0,
@@ -100,14 +100,14 @@
100
  "f": 0.9942857143
101
  },
102
  "Foreign": {
103
- "p": 1.0,
104
- "r": 0.6,
105
- "f": 0.75
106
  },
107
  "Abbr": {
108
- "p": 0.75,
109
- "r": 0.6,
110
- "f": 0.6666666667
111
  },
112
  "Style": {
113
  "p": 1.0,
@@ -115,66 +115,66 @@
115
  "f": 1.0
116
  }
117
  },
118
- "sents_p": 0.8661971831,
119
- "sents_r": 0.8723404255,
120
- "sents_f": 0.8692579505,
121
- "dep_uas": 0.8620092701,
122
- "dep_las": 0.8339289703,
123
  "dep_las_per_type": {
124
  "advmod": {
125
- "p": 0.7837078652,
126
- "r": 0.7881355932,
127
- "f": 0.785915493
128
  },
129
  "root": {
130
- "p": 0.8533568905,
131
- "r": 0.8563829787,
132
- "f": 0.8548672566
133
  },
134
  "nsubj": {
135
- "p": 0.8970588235,
136
- "r": 0.9008438819,
137
- "f": 0.8989473684
138
  },
139
  "case": {
140
- "p": 0.9159248269,
141
- "r": 0.9132149901,
142
- "f": 0.9145679012
143
  },
144
  "obl": {
145
- "p": 0.7840375587,
146
- "r": 0.7779503106,
147
- "f": 0.7809820733
148
  },
149
  "cc": {
150
- "p": 0.8529411765,
151
- "r": 0.8430232558,
152
- "f": 0.8479532164
153
  },
154
  "conj": {
155
- "p": 0.7260273973,
156
- "r": 0.7066666667,
157
- "f": 0.7162162162
158
  },
159
  "obj": {
160
- "p": 0.8733944954,
161
- "r": 0.9242718447,
162
- "f": 0.8981132075
163
  },
164
  "aux": {
165
- "p": 0.8837209302,
166
- "r": 0.8862973761,
167
- "f": 0.885007278
168
  },
169
  "acl:relcl": {
170
- "p": 0.7428571429,
171
- "r": 0.7027027027,
172
- "f": 0.7222222222
173
  },
174
  "advmod:lmod": {
175
- "p": 0.7878787879,
176
  "r": 0.776119403,
177
- "f": 0.7819548872
178
  },
179
  "det": {
180
  "p": 0.9169381107,
@@ -187,74 +187,69 @@
187
  "f": 0.8620102215
188
  },
189
  "nmod:poss": {
190
- "p": 0.7741935484,
191
- "r": 0.7128712871,
192
- "f": 0.7422680412
193
  },
194
  "ccomp": {
195
- "p": 0.6721311475,
196
- "r": 0.6612903226,
197
- "f": 0.6666666667
198
  },
199
  "nummod": {
200
- "p": 0.8130081301,
201
- "r": 0.8333333333,
202
- "f": 0.8230452675
203
  },
204
  "flat": {
205
- "p": 0.825,
206
- "r": 0.8741721854,
207
- "f": 0.8488745981
208
  },
209
  "compound:prt": {
210
- "p": 0.65625,
211
- "r": 0.512195122,
212
- "f": 0.5753424658
213
  },
214
  "advcl": {
215
- "p": 0.6890756303,
216
- "r": 0.7068965517,
217
- "f": 0.6978723404
218
  },
219
  "mark": {
220
- "p": 0.9089026915,
221
- "r": 0.9014373717,
222
- "f": 0.9051546392
223
  },
224
  "cop": {
225
- "p": 0.8532608696,
226
- "r": 0.8971428571,
227
- "f": 0.8746518106
228
  },
229
  "dep": {
230
- "p": 0.2197802198,
231
- "r": 0.3773584906,
232
- "f": 0.2777777778
233
  },
234
  "nmod": {
235
- "p": 0.7321063395,
236
- "r": 0.69921875,
237
- "f": 0.7152847153
238
  },
239
  "iobj": {
240
  "p": 0.9375,
241
  "r": 0.6818181818,
242
  "f": 0.7894736842
243
  },
244
- "obl:lmod": {
245
- "p": 0.0,
246
- "r": 0.0,
247
- "f": 0.0
248
- },
249
  "xcomp": {
250
- "p": 0.5102040816,
251
- "r": 0.4237288136,
252
- "f": 0.462962963
253
  },
254
  "list": {
255
  "p": 0.5,
256
- "r": 0.2222222222,
257
- "f": 0.3076923077
258
  },
259
  "vocative": {
260
  "p": 0.0,
@@ -262,57 +257,62 @@
262
  "f": 0.0
263
  },
264
  "fixed": {
265
- "p": 0.9166666667,
266
- "r": 0.8048780488,
267
- "f": 0.8571428571
 
 
 
 
 
268
  },
269
  "expl": {
270
- "p": 0.9117647059,
271
  "r": 0.9117647059,
272
- "f": 0.9117647059
273
- },
274
- "appos": {
275
- "p": 0.6,
276
- "r": 0.6363636364,
277
- "f": 0.6176470588
278
  },
279
  "obl:tmod": {
280
- "p": 0.8,
281
- "r": 0.4444444444,
282
- "f": 0.5714285714
283
  },
284
  "discourse": {
285
  "p": 0.0,
286
  "r": 0.0,
287
  "f": 0.0
 
 
 
 
 
288
  }
289
  },
290
- "lemma_acc": 0.9458595642,
291
- "tag_acc": 0.9763184658,
292
- "ents_p": 0.8106995885,
293
- "ents_r": 0.8208333333,
294
- "ents_f": 0.8157349896,
295
  "ents_per_type": {
296
  "PER": {
297
- "p": 0.8841463415,
298
- "r": 0.8734939759,
299
- "f": 0.8787878788
300
  },
301
  "ORG": {
302
- "p": 0.7093023256,
303
  "r": 0.6777777778,
304
- "f": 0.6931818182
305
  },
306
  "MISC": {
307
- "p": 0.7272727273,
308
  "r": 0.7787610619,
309
- "f": 0.7521367521
310
  },
311
  "LOC": {
312
- "p": 0.8695652174,
313
- "r": 0.9009009009,
314
- "f": 0.8849557522
315
  }
316
  },
317
- "speed": 451.6438624119
318
  }
 
3
  "token_p": 0.9977732598,
4
  "token_r": 0.9974835463,
5
  "token_f": 0.997628382,
6
+ "pos_acc": 0.9746222394,
7
+ "morph_acc": 0.971716389,
8
+ "morph_micro_p": 0.9871860323,
9
+ "morph_micro_r": 0.9760738983,
10
+ "morph_micro_f": 0.9815985177,
11
  "morph_per_feat": {
12
  "Mood": {
13
+ "p": 0.9923150817,
14
+ "r": 0.9847473785,
15
+ "f": 0.9885167464
16
  },
17
  "Tense": {
18
+ "p": 0.9870525514,
19
+ "r": 0.9759036145,
20
+ "f": 0.9814464218
21
  },
22
  "VerbForm": {
23
+ "p": 0.9863861386,
24
+ "r": 0.9755201958,
25
+ "f": 0.9809230769
26
  },
27
  "Voice": {
28
+ "p": 0.9917293233,
29
+ "r": 0.985799701,
30
+ "f": 0.9887556222
31
  },
32
  "Definite": {
33
+ "p": 0.98915227,
34
+ "r": 0.9727380482,
35
+ "f": 0.980876494
36
  },
37
  "Gender": {
38
+ "p": 0.9797843666,
39
+ "r": 0.9664340312,
40
+ "f": 0.9730634097
41
  },
42
  "Number": {
43
+ "p": 0.9873217116,
44
+ "r": 0.9749608764,
45
+ "f": 0.9811023622
46
  },
47
  "AdpType": {
48
+ "p": 0.9973357016,
49
+ "r": 0.9929266136,
50
+ "f": 0.9951262738
51
  },
52
  "PartType": {
53
  "p": 1.0,
 
55
  "f": 0.9983739837
56
  },
57
  "Case": {
58
+ "p": 0.9919614148,
59
+ "r": 0.9747235387,
60
+ "f": 0.9832669323
61
  },
62
  "Person": {
63
+ "p": 0.9856630824,
64
+ "r": 0.9769094139,
65
+ "f": 0.9812667261
66
  },
67
  "PronType": {
68
+ "p": 0.9925373134,
69
+ "r": 0.984375,
70
+ "f": 0.9884393064
71
  },
72
  "NumType": {
73
  "p": 0.9865771812,
 
75
  "f": 0.98
76
  },
77
  "Degree": {
78
+ "p": 0.9697702539,
79
+ "r": 0.9662650602,
80
+ "f": 0.968014484
81
  },
82
  "Reflex": {
83
  "p": 1.0,
 
100
  "f": 0.9942857143
101
  },
102
  "Foreign": {
103
+ "p": 0.7777777778,
104
+ "r": 0.7,
105
+ "f": 0.7368421053
106
  },
107
  "Abbr": {
108
+ "p": 1.0,
109
+ "r": 0.4,
110
+ "f": 0.5714285714
111
  },
112
  "Style": {
113
  "p": 1.0,
 
115
  "f": 1.0
116
  }
117
  },
118
+ "sents_p": 0.8160136286,
119
+ "sents_r": 0.8492907801,
120
+ "sents_f": 0.832319722,
121
+ "dep_uas": 0.8596491228,
122
+ "dep_las": 0.8301675978,
123
  "dep_las_per_type": {
124
  "advmod": {
125
+ "p": 0.7773109244,
126
+ "r": 0.7838983051,
127
+ "f": 0.7805907173
128
  },
129
  "root": {
130
+ "p": 0.8293515358,
131
+ "r": 0.8617021277,
132
+ "f": 0.8452173913
133
  },
134
  "nsubj": {
135
+ "p": 0.8976545842,
136
+ "r": 0.888185654,
137
+ "f": 0.8928950159
138
  },
139
  "case": {
140
+ "p": 0.9175769613,
141
+ "r": 0.9112426036,
142
+ "f": 0.9143988125
143
  },
144
  "obl": {
145
+ "p": 0.7834394904,
146
+ "r": 0.7639751553,
147
+ "f": 0.7735849057
148
  },
149
  "cc": {
150
+ "p": 0.8425655977,
151
+ "r": 0.8401162791,
152
+ "f": 0.8413391557
153
  },
154
  "conj": {
155
+ "p": 0.7154696133,
156
+ "r": 0.6906666667,
157
+ "f": 0.7028493894
158
  },
159
  "obj": {
160
+ "p": 0.8701298701,
161
+ "r": 0.9106796117,
162
+ "f": 0.889943074
163
  },
164
  "aux": {
165
+ "p": 0.8699421965,
166
+ "r": 0.8775510204,
167
+ "f": 0.8737300435
168
  },
169
  "acl:relcl": {
170
+ "p": 0.7630057803,
171
+ "r": 0.7135135135,
172
+ "f": 0.7374301676
173
  },
174
  "advmod:lmod": {
175
+ "p": 0.8,
176
  "r": 0.776119403,
177
+ "f": 0.7878787879
178
  },
179
  "det": {
180
  "p": 0.9169381107,
 
187
  "f": 0.8620102215
188
  },
189
  "nmod:poss": {
190
+ "p": 0.7765957447,
191
+ "r": 0.7227722772,
192
+ "f": 0.7487179487
193
  },
194
  "ccomp": {
195
+ "p": 0.7586206897,
196
+ "r": 0.7096774194,
197
+ "f": 0.7333333333
198
  },
199
  "nummod": {
200
+ "p": 0.8032786885,
201
+ "r": 0.8166666667,
202
+ "f": 0.8099173554
203
  },
204
  "flat": {
205
+ "p": 0.8364779874,
206
+ "r": 0.880794702,
207
+ "f": 0.8580645161
208
  },
209
  "compound:prt": {
210
+ "p": 0.6666666667,
211
+ "r": 0.5365853659,
212
+ "f": 0.5945945946
213
  },
214
  "advcl": {
215
+ "p": 0.6746031746,
216
+ "r": 0.7327586207,
217
+ "f": 0.7024793388
218
  },
219
  "mark": {
220
+ "p": 0.9010309278,
221
+ "r": 0.8973305955,
222
+ "f": 0.8991769547
223
  },
224
  "cop": {
225
+ "p": 0.8742857143,
226
+ "r": 0.8742857143,
227
+ "f": 0.8742857143
228
  },
229
  "dep": {
230
+ "p": 0.2358490566,
231
+ "r": 0.4716981132,
232
+ "f": 0.3144654088
233
  },
234
  "nmod": {
235
+ "p": 0.7105263158,
236
+ "r": 0.685546875,
237
+ "f": 0.6978131213
238
  },
239
  "iobj": {
240
  "p": 0.9375,
241
  "r": 0.6818181818,
242
  "f": 0.7894736842
243
  },
 
 
 
 
 
244
  "xcomp": {
245
+ "p": 0.6,
246
+ "r": 0.406779661,
247
+ "f": 0.4848484848
248
  },
249
  "list": {
250
  "p": 0.5,
251
+ "r": 0.2777777778,
252
+ "f": 0.3571428571
253
  },
254
  "vocative": {
255
  "p": 0.0,
 
257
  "f": 0.0
258
  },
259
  "fixed": {
260
+ "p": 0.9444444444,
261
+ "r": 0.8292682927,
262
+ "f": 0.8831168831
263
+ },
264
+ "appos": {
265
+ "p": 0.7142857143,
266
+ "r": 0.6060606061,
267
+ "f": 0.6557377049
268
  },
269
  "expl": {
270
+ "p": 0.9393939394,
271
  "r": 0.9117647059,
272
+ "f": 0.9253731343
 
 
 
 
 
273
  },
274
  "obl:tmod": {
275
+ "p": 0.8333333333,
276
+ "r": 0.5555555556,
277
+ "f": 0.6666666667
278
  },
279
  "discourse": {
280
  "p": 0.0,
281
  "r": 0.0,
282
  "f": 0.0
283
+ },
284
+ "obl:lmod": {
285
+ "p": 0.0,
286
+ "r": 0.0,
287
+ "f": 0.0
288
  }
289
  },
290
+ "lemma_acc": 0.9459564165,
291
+ "tag_acc": 0.9746222394,
292
+ "ents_p": 0.8118609407,
293
+ "ents_r": 0.8270833333,
294
+ "ents_f": 0.8194014448,
295
  "ents_per_type": {
296
  "PER": {
297
+ "p": 0.9018404908,
298
+ "r": 0.8855421687,
299
+ "f": 0.8936170213
300
  },
301
  "ORG": {
302
+ "p": 0.7721518987,
303
  "r": 0.6777777778,
304
+ "f": 0.7218934911
305
  },
306
  "MISC": {
307
+ "p": 0.6717557252,
308
  "r": 0.7787610619,
309
+ "f": 0.7213114754
310
  },
311
  "LOC": {
312
+ "p": 0.8706896552,
313
+ "r": 0.9099099099,
314
+ "f": 0.8898678414
315
  }
316
  },
317
+ "speed": 4656.9787909711
318
  }
da_core_news_trf-any-py3-none-any.whl CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:28f147c7a0787272245429a6eedec0f834a98ebb48ab421b3ef75c4081bd52c5
3
- size 413499670
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bd6c07a3173c0df1bd4fe360bf39067d6bc4f694a45d7db9f4eef0e7bcbdf8ac
3
+ size 413509117
lemmatizer/cfg CHANGED
@@ -1,6 +1,6 @@
1
  {
2
  "labels":[
3
- 0,
4
  2,
5
  4,
6
  6,
@@ -10,15 +10,16 @@
10
  14,
11
  16,
12
  18,
13
- 22,
14
- 26,
15
  28,
16
  30,
17
  32,
18
- 35,
19
- 37,
20
  39,
21
  41,
 
22
  43,
23
  45,
24
  47,
@@ -26,10 +27,10 @@
26
  51,
27
  53,
28
  55,
29
- 59,
30
- 63,
 
31
  67,
32
- 69,
33
  71,
34
  73,
35
  75,
@@ -43,183 +44,186 @@
43
  91,
44
  93,
45
  95,
46
- 97,
47
  101,
48
- 103,
49
  104,
50
- 106,
51
- 108,
52
  111,
53
- 115,
54
- 117,
55
- 119,
56
- 122,
57
  124,
58
  127,
59
- 130,
 
60
  133,
61
  134,
62
- 137,
63
- 139,
64
  140,
65
  142,
66
  144,
67
- 146,
 
68
  148,
69
- 150,
70
- 151,
71
  153,
72
- 154,
73
- 156,
74
- 160,
75
- 162,
76
- 163,
77
  166,
78
- 169,
 
79
  172,
80
  174,
81
- 176,
82
- 178,
83
- 180,
84
  182,
85
  184,
86
- 185,
87
- 187,
88
- 189,
89
  192,
90
  194,
91
  196,
92
- 198,
93
- 200,
94
- 202,
95
  204,
96
- 206,
 
97
  209,
98
  211,
 
99
  213,
100
- 214,
101
  217,
102
- 218,
103
- 220,
104
  222,
105
- 223,
106
  224,
107
  226,
108
- 228,
109
- 230,
110
  232,
111
  233,
112
  235,
113
- 237,
114
- 240,
115
- 242,
116
  243,
117
- 244,
118
- 246,
119
- 247,
120
  249,
121
- 250,
122
- 254,
123
- 260,
 
 
 
124
  264,
125
- 266,
126
  268,
127
  270,
128
- 272,
129
- 274,
130
  275,
131
- 276,
132
  279,
133
  281,
134
- 282,
135
- 284,
136
- 286,
137
- 288,
138
- 290,
139
- 292,
140
  296,
141
- 297,
142
- 299,
143
- 301,
144
- 303,
145
- 305,
146
- 307,
147
- 309,
148
  310,
149
- 311,
150
- 313,
151
- 315,
152
  318,
153
- 321,
 
154
  322,
155
  324,
156
  327,
157
- 328,
158
  330,
159
  331,
160
  333,
161
- 334,
162
- 335,
163
  337,
164
- 338,
165
  340,
166
- 341,
167
- 345,
 
 
168
  347,
169
- 348,
170
- 352,
171
  354,
172
  356,
 
173
  358,
174
- 360,
175
  364,
176
- 367,
177
- 369,
178
- 371,
179
- 372,
180
- 375,
181
  377,
182
  378,
183
- 379,
184
  382,
 
185
  385,
186
  386,
187
  389,
 
188
  393,
189
- 394,
190
- 395,
191
  397,
192
- 398,
193
  400,
194
- 402,
195
- 403,
196
- 405,
197
  406,
 
 
198
  409,
199
- 411,
 
200
  413,
201
  415,
202
- 417,
203
  419,
 
204
  422,
 
205
  424,
206
- 425,
207
  426,
208
- 428,
209
- 429,
210
- 432,
211
  433,
212
- 435,
213
  436,
214
  437,
215
- 438,
216
- 440,
217
- 442,
218
- 444,
219
  446,
220
- 447,
221
  449,
222
- 450,
223
  452,
224
  454,
225
  456,
@@ -228,22 +232,21 @@
228
  462,
229
  464,
230
  465,
231
- 466,
232
- 468,
233
- 471,
234
  472,
235
  475,
236
- 476,
237
  479,
238
- 480,
239
- 482,
240
  484,
241
- 485,
242
  488,
243
- 489,
244
- 492,
245
- 494,
246
- 497,
247
  499,
248
  500,
249
  501,
@@ -251,14 +254,12 @@
251
  504,
252
  505,
253
  506,
254
- 507,
255
  509,
256
- 510,
257
  511,
258
- 513,
259
- 515,
260
  516,
261
- 517,
262
  518,
263
  519,
264
  521,
@@ -272,13 +273,13 @@
272
  531,
273
  532,
274
  533,
275
- 534,
276
  536,
277
  537,
278
- 539,
279
  540,
280
- 542,
281
- 545,
282
  546,
283
  547,
284
  549,
@@ -290,124 +291,125 @@
290
  560,
291
  561,
292
  563,
293
- 565,
294
  566,
295
- 567,
296
  569,
297
  571,
298
- 572,
299
  573,
300
  575,
 
301
  577,
302
- 578,
303
- 582,
304
  584,
305
- 585,
306
  586,
307
- 589,
308
- 592,
309
- 594,
310
- 596,
311
- 600,
312
  601,
313
- 603,
314
  604,
315
- 605,
 
 
316
  609,
317
- 611,
318
  613,
 
319
  617,
320
- 619,
321
- 620,
322
  621,
323
- 622,
324
  623,
325
  624,
326
  625,
 
327
  627,
 
328
  629,
329
- 630,
330
  632,
331
  633,
332
  635,
333
  636,
 
334
  639,
335
- 641,
 
336
  645,
337
- 646,
338
- 647,
339
  649,
 
340
  651,
341
- 654,
342
  656,
343
- 657,
344
  659,
345
- 660,
346
- 662,
347
  663,
348
  664,
349
- 666,
350
- 668,
 
351
  670,
352
  672,
353
- 673,
354
  675,
355
  677,
356
- 678,
357
  680,
358
  681,
359
  683,
360
  685,
361
- 686,
362
  687,
 
363
  689,
364
- 690,
365
  691,
366
  692,
367
- 695,
368
- 696,
369
  697,
370
  698,
 
371
  700,
372
- 701,
373
- 703,
374
- 705,
375
  706,
376
  707,
377
  708,
378
- 712,
379
- 715,
380
- 717,
381
  718,
382
  719,
383
  723,
384
  725,
385
  728,
386
- 730,
387
  731,
388
  732,
389
- 734,
390
- 736,
 
391
  738,
392
  739,
393
  740,
394
  741,
395
  742,
396
- 743,
397
- 744,
398
- 747,
399
  748,
400
- 750,
401
- 754,
402
- 757,
403
  758,
404
  760,
 
405
  762,
406
- 763,
407
  764,
408
- 766,
409
  767,
410
  769,
 
411
  771,
412
  772,
413
  773,
@@ -420,34 +422,35 @@
420
  786,
421
  789,
422
  790,
423
- 792,
424
- 794,
425
  795,
426
  796,
427
- 798,
428
  799,
429
  800,
430
  801,
431
  802,
 
432
  804,
433
- 805,
434
  806,
435
  807,
436
  808,
 
437
  810,
438
- 811,
439
- 813,
440
- 815,
441
  816,
442
- 818,
443
- 820,
444
  821,
445
- 822,
446
  824,
447
  826,
448
  828,
449
  830,
450
  832,
451
- 834
 
452
  ]
453
  }
 
1
  {
2
  "labels":[
3
+ 1,
4
  2,
5
  4,
6
  6,
 
10
  14,
11
  16,
12
  18,
13
+ 20,
14
+ 24,
15
  28,
16
  30,
17
  32,
18
+ 34,
19
+ 36,
20
  39,
21
  41,
22
+ 42,
23
  43,
24
  45,
25
  47,
 
27
  51,
28
  53,
29
  55,
30
+ 57,
31
+ 61,
32
+ 65,
33
  67,
 
34
  71,
35
  73,
36
  75,
 
44
  91,
45
  93,
46
  95,
47
+ 99,
48
  101,
49
+ 102,
50
  104,
51
+ 107,
 
52
  111,
53
+ 113,
54
+ 116,
55
+ 118,
56
+ 121,
57
  124,
58
  127,
59
+ 128,
60
+ 131,
61
  133,
62
  134,
63
+ 136,
64
+ 138,
65
  140,
66
  142,
67
  144,
68
+ 145,
69
+ 147,
70
  148,
71
+ 149,
 
72
  153,
73
+ 155,
74
+ 158,
75
+ 161,
76
+ 164,
 
77
  166,
78
+ 168,
79
+ 170,
80
  172,
81
  174,
82
+ 175,
83
+ 177,
84
+ 179,
85
  182,
86
  184,
87
+ 186,
88
+ 188,
89
+ 190,
90
  192,
91
  194,
92
  196,
93
+ 199,
94
+ 201,
95
+ 203,
96
  204,
97
+ 207,
98
+ 208,
99
  209,
100
  211,
101
+ 212,
102
  213,
103
+ 215,
104
  217,
105
+ 219,
106
+ 221,
107
  222,
 
108
  224,
109
  226,
110
+ 229,
111
+ 231,
112
  232,
113
  233,
114
  235,
115
+ 236,
116
+ 238,
117
+ 239,
118
  243,
 
 
 
119
  249,
120
+ 253,
121
+ 255,
122
+ 257,
123
+ 259,
124
+ 261,
125
+ 263,
126
  264,
127
+ 265,
128
  268,
129
  270,
130
+ 271,
131
+ 273,
132
  275,
133
+ 277,
134
  279,
135
  281,
136
+ 283,
137
+ 285,
138
+ 287,
139
+ 289,
140
+ 293,
141
+ 294,
142
  296,
143
+ 298,
144
+ 300,
145
+ 302,
146
+ 304,
147
+ 306,
148
+ 308,
 
149
  310,
150
+ 312,
151
+ 314,
152
+ 316,
153
  318,
154
+ 319,
155
+ 320,
156
  322,
157
  324,
158
  327,
 
159
  330,
160
  331,
161
  333,
162
+ 336,
 
163
  337,
164
+ 339,
165
  340,
166
+ 342,
167
+ 343,
168
+ 344,
169
+ 346,
170
  347,
171
+ 349,
172
+ 350,
173
  354,
174
  356,
175
+ 357,
176
  358,
177
+ 362,
178
  364,
179
+ 366,
180
+ 368,
181
+ 370,
182
+ 374,
 
183
  377,
184
  378,
185
+ 381,
186
  382,
187
+ 384,
188
  385,
189
  386,
190
  389,
191
+ 390,
192
  393,
193
+ 396,
 
194
  397,
 
195
  400,
196
+ 404,
 
 
197
  406,
198
+ 407,
199
+ 408,
200
  409,
201
+ 410,
202
+ 412,
203
  413,
204
  415,
205
+ 416,
206
  419,
207
+ 421,
208
  422,
209
+ 423,
210
  424,
 
211
  426,
212
+ 427,
213
+ 430,
214
+ 431,
215
  433,
216
+ 434,
217
  436,
218
  437,
219
+ 439,
220
+ 441,
221
+ 443,
222
+ 445,
223
  446,
224
+ 448,
225
  449,
226
+ 451,
227
  452,
228
  454,
229
  456,
 
232
  462,
233
  464,
234
  465,
235
+ 467,
236
+ 470,
 
237
  472,
238
  475,
239
+ 478,
240
  479,
241
+ 481,
242
+ 483,
243
  484,
244
+ 487,
245
  488,
246
+ 491,
247
+ 493,
248
+ 496,
249
+ 498,
250
  499,
251
  500,
252
  501,
 
254
  504,
255
  505,
256
  506,
257
+ 508,
258
  509,
 
259
  511,
260
+ 512,
261
+ 514,
262
  516,
 
263
  518,
264
  519,
265
  521,
 
273
  531,
274
  532,
275
  533,
276
+ 535,
277
  536,
278
  537,
279
+ 538,
280
  540,
281
+ 541,
282
+ 543,
283
  546,
284
  547,
285
  549,
 
291
  560,
292
  561,
293
  563,
294
+ 564,
295
  566,
296
+ 568,
297
  569,
298
  571,
 
299
  573,
300
  575,
301
+ 576,
302
  577,
303
+ 579,
304
+ 580,
305
  584,
 
306
  586,
307
+ 587,
308
+ 590,
309
+ 593,
310
+ 595,
311
+ 597,
312
  601,
313
+ 602,
314
  604,
315
+ 606,
316
+ 607,
317
+ 608,
318
  609,
 
319
  613,
320
+ 615,
321
  617,
 
 
322
  621,
 
323
  623,
324
  624,
325
  625,
326
+ 626,
327
  627,
328
+ 628,
329
  629,
330
+ 631,
331
  632,
332
  633,
333
  635,
334
  636,
335
+ 638,
336
  639,
337
+ 640,
338
+ 643,
339
  645,
 
 
340
  649,
341
+ 650,
342
  651,
343
+ 653,
344
  656,
345
+ 658,
346
  659,
347
+ 661,
 
348
  663,
349
  664,
350
+ 665,
351
+ 667,
352
+ 669,
353
  670,
354
  672,
355
+ 674,
356
  675,
357
  677,
358
+ 679,
359
  680,
360
  681,
361
  683,
362
  685,
 
363
  687,
364
+ 688,
365
  689,
 
366
  691,
367
  692,
368
+ 693,
369
+ 694,
370
  697,
371
  698,
372
+ 699,
373
  700,
374
+ 702,
375
+ 704,
 
376
  706,
377
  707,
378
  708,
379
+ 709,
380
+ 713,
381
+ 716,
382
  718,
383
  719,
384
  723,
385
  725,
386
  728,
387
+ 729,
388
  731,
389
  732,
390
+ 733,
391
+ 735,
392
+ 737,
393
  738,
394
  739,
395
  740,
396
  741,
397
  742,
398
+ 745,
399
+ 746,
 
400
  748,
401
+ 752,
402
+ 755,
403
+ 756,
404
  758,
405
  760,
406
+ 761,
407
  762,
 
408
  764,
409
+ 765,
410
  767,
411
  769,
412
+ 770,
413
  771,
414
  772,
415
  773,
 
422
  786,
423
  789,
424
  790,
425
+ 791,
426
+ 793,
427
  795,
428
  796,
429
+ 797,
430
  799,
431
  800,
432
  801,
433
  802,
434
+ 803,
435
  804,
 
436
  806,
437
  807,
438
  808,
439
+ 809,
440
  810,
441
+ 812,
442
+ 814,
 
443
  816,
444
+ 817,
445
+ 819,
446
  821,
447
+ 823,
448
  824,
449
  826,
450
  828,
451
  830,
452
  832,
453
+ 834,
454
+ 835
455
  ]
456
  }
lemmatizer/model CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5be40955a039d928c8fdd395fe8e3055482197af1af9d0a3fec1cda0f77c65e5
3
- size 1381777
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:72880591a0a6b98e895eacb328491d7923cf6c86bd6b3c56a63582e53daa0796
3
+ size 1391005
lemmatizer/trees CHANGED
Binary files a/lemmatizer/trees and b/lemmatizer/trees differ
 
meta.json CHANGED
@@ -1,14 +1,14 @@
1
  {
2
  "lang":"da",
3
  "name":"core_news_trf",
4
- "version":"3.3.0",
5
  "description":"Danish transformer pipeline (Maltehb/danish-bert-botxo). Components: transformer, morphologizer, parser, lemmatizer (trainable_lemmatizer), ner, attribute_ruler.",
6
  "author":"Explosion",
7
  "email":"contact@explosion.ai",
8
  "url":"https://explosion.ai",
9
  "license":"CC BY-SA 4.0",
10
- "spacy_version":">=3.3.0.dev0,<3.4.0",
11
- "spacy_git_version":"849bef2de",
12
  "vectors":{
13
  "width":0,
14
  "vectors":0,
@@ -246,51 +246,51 @@
246
  "token_p":0.9977732598,
247
  "token_r":0.9974835463,
248
  "token_f":0.997628382,
249
- "pos_acc":0.9763184658,
250
- "morph_acc":0.97360647,
251
- "morph_micro_p":0.9874911014,
252
- "morph_micro_r":0.98026349,
253
- "morph_micro_f":0.9838640221,
254
  "morph_per_feat":{
255
  "Mood":{
256
- "p":0.9942638623,
257
- "r":0.9914204004,
258
- "f":0.9928400955
259
  },
260
  "Tense":{
261
- "p":0.9826415094,
262
- "r":0.9804216867,
263
- "f":0.981530343
264
  },
265
  "VerbForm":{
266
- "p":0.9840196681,
267
- "r":0.9798041616,
268
- "f":0.9819073904
269
  },
270
  "Voice":{
271
- "p":0.9940074906,
272
- "r":0.9917787743,
273
- "f":0.9928918818
274
  },
275
  "Definite":{
276
- "p":0.9900039984,
277
- "r":0.9782694587,
278
- "f":0.9841017488
279
  },
280
  "Gender":{
281
- "p":0.979516454,
282
- "r":0.9694250582,
283
- "f":0.97444463
284
  },
285
  "Number":{
286
- "p":0.9889473684,
287
- "r":0.9801773605,
288
- "f":0.9845428347
289
  },
290
  "AdpType":{
291
- "p":0.996460177,
292
- "r":0.9955791335,
293
- "f":0.9960194604
294
  },
295
  "PartType":{
296
  "p":1.0,
@@ -298,19 +298,19 @@
298
  "f":0.9983739837
299
  },
300
  "Case":{
301
- "p":0.992,
302
- "r":0.9794628752,
303
- "f":0.9856915739
304
  },
305
  "Person":{
306
- "p":0.9857397504,
307
- "r":0.9822380107,
308
- "f":0.9839857651
309
  },
310
  "PronType":{
311
- "p":0.9925619835,
312
- "r":0.9876644737,
313
- "f":0.9901071723
314
  },
315
  "NumType":{
316
  "p":0.9865771812,
@@ -318,9 +318,9 @@
318
  "f":0.98
319
  },
320
  "Degree":{
321
- "p":0.9732685298,
322
- "r":0.965060241,
323
- "f":0.9691470054
324
  },
325
  "Reflex":{
326
  "p":1.0,
@@ -343,14 +343,14 @@
343
  "f":0.9942857143
344
  },
345
  "Foreign":{
346
- "p":1.0,
347
- "r":0.6,
348
- "f":0.75
349
  },
350
  "Abbr":{
351
- "p":0.75,
352
- "r":0.6,
353
- "f":0.6666666667
354
  },
355
  "Style":{
356
  "p":1.0,
@@ -358,66 +358,66 @@
358
  "f":1.0
359
  }
360
  },
361
- "sents_p":0.8661971831,
362
- "sents_r":0.8723404255,
363
- "sents_f":0.8692579505,
364
- "dep_uas":0.8620092701,
365
- "dep_las":0.8339289703,
366
  "dep_las_per_type":{
367
  "advmod":{
368
- "p":0.7837078652,
369
- "r":0.7881355932,
370
- "f":0.785915493
371
  },
372
  "root":{
373
- "p":0.8533568905,
374
- "r":0.8563829787,
375
- "f":0.8548672566
376
  },
377
  "nsubj":{
378
- "p":0.8970588235,
379
- "r":0.9008438819,
380
- "f":0.8989473684
381
  },
382
  "case":{
383
- "p":0.9159248269,
384
- "r":0.9132149901,
385
- "f":0.9145679012
386
  },
387
  "obl":{
388
- "p":0.7840375587,
389
- "r":0.7779503106,
390
- "f":0.7809820733
391
  },
392
  "cc":{
393
- "p":0.8529411765,
394
- "r":0.8430232558,
395
- "f":0.8479532164
396
  },
397
  "conj":{
398
- "p":0.7260273973,
399
- "r":0.7066666667,
400
- "f":0.7162162162
401
  },
402
  "obj":{
403
- "p":0.8733944954,
404
- "r":0.9242718447,
405
- "f":0.8981132075
406
  },
407
  "aux":{
408
- "p":0.8837209302,
409
- "r":0.8862973761,
410
- "f":0.885007278
411
  },
412
  "acl:relcl":{
413
- "p":0.7428571429,
414
- "r":0.7027027027,
415
- "f":0.7222222222
416
  },
417
  "advmod:lmod":{
418
- "p":0.7878787879,
419
  "r":0.776119403,
420
- "f":0.7819548872
421
  },
422
  "det":{
423
  "p":0.9169381107,
@@ -430,74 +430,69 @@
430
  "f":0.8620102215
431
  },
432
  "nmod:poss":{
433
- "p":0.7741935484,
434
- "r":0.7128712871,
435
- "f":0.7422680412
436
  },
437
  "ccomp":{
438
- "p":0.6721311475,
439
- "r":0.6612903226,
440
- "f":0.6666666667
441
  },
442
  "nummod":{
443
- "p":0.8130081301,
444
- "r":0.8333333333,
445
- "f":0.8230452675
446
  },
447
  "flat":{
448
- "p":0.825,
449
- "r":0.8741721854,
450
- "f":0.8488745981
451
  },
452
  "compound:prt":{
453
- "p":0.65625,
454
- "r":0.512195122,
455
- "f":0.5753424658
456
  },
457
  "advcl":{
458
- "p":0.6890756303,
459
- "r":0.7068965517,
460
- "f":0.6978723404
461
  },
462
  "mark":{
463
- "p":0.9089026915,
464
- "r":0.9014373717,
465
- "f":0.9051546392
466
  },
467
  "cop":{
468
- "p":0.8532608696,
469
- "r":0.8971428571,
470
- "f":0.8746518106
471
  },
472
  "dep":{
473
- "p":0.2197802198,
474
- "r":0.3773584906,
475
- "f":0.2777777778
476
  },
477
  "nmod":{
478
- "p":0.7321063395,
479
- "r":0.69921875,
480
- "f":0.7152847153
481
  },
482
  "iobj":{
483
  "p":0.9375,
484
  "r":0.6818181818,
485
  "f":0.7894736842
486
  },
487
- "obl:lmod":{
488
- "p":0.0,
489
- "r":0.0,
490
- "f":0.0
491
- },
492
  "xcomp":{
493
- "p":0.5102040816,
494
- "r":0.4237288136,
495
- "f":0.462962963
496
  },
497
  "list":{
498
  "p":0.5,
499
- "r":0.2222222222,
500
- "f":0.3076923077
501
  },
502
  "vocative":{
503
  "p":0.0,
@@ -505,59 +500,64 @@
505
  "f":0.0
506
  },
507
  "fixed":{
508
- "p":0.9166666667,
509
- "r":0.8048780488,
510
- "f":0.8571428571
 
 
 
 
 
511
  },
512
  "expl":{
513
- "p":0.9117647059,
514
  "r":0.9117647059,
515
- "f":0.9117647059
516
- },
517
- "appos":{
518
- "p":0.6,
519
- "r":0.6363636364,
520
- "f":0.6176470588
521
  },
522
  "obl:tmod":{
523
- "p":0.8,
524
- "r":0.4444444444,
525
- "f":0.5714285714
526
  },
527
  "discourse":{
528
  "p":0.0,
529
  "r":0.0,
530
  "f":0.0
 
 
 
 
 
531
  }
532
  },
533
- "lemma_acc":0.9458595642,
534
- "tag_acc":0.9763184658,
535
- "ents_p":0.8106995885,
536
- "ents_r":0.8208333333,
537
- "ents_f":0.8157349896,
538
  "ents_per_type":{
539
  "PER":{
540
- "p":0.8841463415,
541
- "r":0.8734939759,
542
- "f":0.8787878788
543
  },
544
  "ORG":{
545
- "p":0.7093023256,
546
  "r":0.6777777778,
547
- "f":0.6931818182
548
  },
549
  "MISC":{
550
- "p":0.7272727273,
551
  "r":0.7787610619,
552
- "f":0.7521367521
553
  },
554
  "LOC":{
555
- "p":0.8695652174,
556
- "r":0.9009009009,
557
- "f":0.8849557522
558
  }
559
  },
560
- "speed":451.6438624119
561
  },
562
  "sources":[
563
  {
 
1
  {
2
  "lang":"da",
3
  "name":"core_news_trf",
4
+ "version":"3.4.0",
5
  "description":"Danish transformer pipeline (Maltehb/danish-bert-botxo). Components: transformer, morphologizer, parser, lemmatizer (trainable_lemmatizer), ner, attribute_ruler.",
6
  "author":"Explosion",
7
  "email":"contact@explosion.ai",
8
  "url":"https://explosion.ai",
9
  "license":"CC BY-SA 4.0",
10
+ "spacy_version":">=3.4.0,<3.5.0",
11
+ "spacy_git_version":"dd038b536",
12
  "vectors":{
13
  "width":0,
14
  "vectors":0,
 
246
  "token_p":0.9977732598,
247
  "token_r":0.9974835463,
248
  "token_f":0.997628382,
249
+ "pos_acc":0.9746222394,
250
+ "morph_acc":0.971716389,
251
+ "morph_micro_p":0.9871860323,
252
+ "morph_micro_r":0.9760738983,
253
+ "morph_micro_f":0.9815985177,
254
  "morph_per_feat":{
255
  "Mood":{
256
+ "p":0.9923150817,
257
+ "r":0.9847473785,
258
+ "f":0.9885167464
259
  },
260
  "Tense":{
261
+ "p":0.9870525514,
262
+ "r":0.9759036145,
263
+ "f":0.9814464218
264
  },
265
  "VerbForm":{
266
+ "p":0.9863861386,
267
+ "r":0.9755201958,
268
+ "f":0.9809230769
269
  },
270
  "Voice":{
271
+ "p":0.9917293233,
272
+ "r":0.985799701,
273
+ "f":0.9887556222
274
  },
275
  "Definite":{
276
+ "p":0.98915227,
277
+ "r":0.9727380482,
278
+ "f":0.980876494
279
  },
280
  "Gender":{
281
+ "p":0.9797843666,
282
+ "r":0.9664340312,
283
+ "f":0.9730634097
284
  },
285
  "Number":{
286
+ "p":0.9873217116,
287
+ "r":0.9749608764,
288
+ "f":0.9811023622
289
  },
290
  "AdpType":{
291
+ "p":0.9973357016,
292
+ "r":0.9929266136,
293
+ "f":0.9951262738
294
  },
295
  "PartType":{
296
  "p":1.0,
 
298
  "f":0.9983739837
299
  },
300
  "Case":{
301
+ "p":0.9919614148,
302
+ "r":0.9747235387,
303
+ "f":0.9832669323
304
  },
305
  "Person":{
306
+ "p":0.9856630824,
307
+ "r":0.9769094139,
308
+ "f":0.9812667261
309
  },
310
  "PronType":{
311
+ "p":0.9925373134,
312
+ "r":0.984375,
313
+ "f":0.9884393064
314
  },
315
  "NumType":{
316
  "p":0.9865771812,
 
318
  "f":0.98
319
  },
320
  "Degree":{
321
+ "p":0.9697702539,
322
+ "r":0.9662650602,
323
+ "f":0.968014484
324
  },
325
  "Reflex":{
326
  "p":1.0,
 
343
  "f":0.9942857143
344
  },
345
  "Foreign":{
346
+ "p":0.7777777778,
347
+ "r":0.7,
348
+ "f":0.7368421053
349
  },
350
  "Abbr":{
351
+ "p":1.0,
352
+ "r":0.4,
353
+ "f":0.5714285714
354
  },
355
  "Style":{
356
  "p":1.0,
 
358
  "f":1.0
359
  }
360
  },
361
+ "sents_p":0.8160136286,
362
+ "sents_r":0.8492907801,
363
+ "sents_f":0.832319722,
364
+ "dep_uas":0.8596491228,
365
+ "dep_las":0.8301675978,
366
  "dep_las_per_type":{
367
  "advmod":{
368
+ "p":0.7773109244,
369
+ "r":0.7838983051,
370
+ "f":0.7805907173
371
  },
372
  "root":{
373
+ "p":0.8293515358,
374
+ "r":0.8617021277,
375
+ "f":0.8452173913
376
  },
377
  "nsubj":{
378
+ "p":0.8976545842,
379
+ "r":0.888185654,
380
+ "f":0.8928950159
381
  },
382
  "case":{
383
+ "p":0.9175769613,
384
+ "r":0.9112426036,
385
+ "f":0.9143988125
386
  },
387
  "obl":{
388
+ "p":0.7834394904,
389
+ "r":0.7639751553,
390
+ "f":0.7735849057
391
  },
392
  "cc":{
393
+ "p":0.8425655977,
394
+ "r":0.8401162791,
395
+ "f":0.8413391557
396
  },
397
  "conj":{
398
+ "p":0.7154696133,
399
+ "r":0.6906666667,
400
+ "f":0.7028493894
401
  },
402
  "obj":{
403
+ "p":0.8701298701,
404
+ "r":0.9106796117,
405
+ "f":0.889943074
406
  },
407
  "aux":{
408
+ "p":0.8699421965,
409
+ "r":0.8775510204,
410
+ "f":0.8737300435
411
  },
412
  "acl:relcl":{
413
+ "p":0.7630057803,
414
+ "r":0.7135135135,
415
+ "f":0.7374301676
416
  },
417
  "advmod:lmod":{
418
+ "p":0.8,
419
  "r":0.776119403,
420
+ "f":0.7878787879
421
  },
422
  "det":{
423
  "p":0.9169381107,
 
430
  "f":0.8620102215
431
  },
432
  "nmod:poss":{
433
+ "p":0.7765957447,
434
+ "r":0.7227722772,
435
+ "f":0.7487179487
436
  },
437
  "ccomp":{
438
+ "p":0.7586206897,
439
+ "r":0.7096774194,
440
+ "f":0.7333333333
441
  },
442
  "nummod":{
443
+ "p":0.8032786885,
444
+ "r":0.8166666667,
445
+ "f":0.8099173554
446
  },
447
  "flat":{
448
+ "p":0.8364779874,
449
+ "r":0.880794702,
450
+ "f":0.8580645161
451
  },
452
  "compound:prt":{
453
+ "p":0.6666666667,
454
+ "r":0.5365853659,
455
+ "f":0.5945945946
456
  },
457
  "advcl":{
458
+ "p":0.6746031746,
459
+ "r":0.7327586207,
460
+ "f":0.7024793388
461
  },
462
  "mark":{
463
+ "p":0.9010309278,
464
+ "r":0.8973305955,
465
+ "f":0.8991769547
466
  },
467
  "cop":{
468
+ "p":0.8742857143,
469
+ "r":0.8742857143,
470
+ "f":0.8742857143
471
  },
472
  "dep":{
473
+ "p":0.2358490566,
474
+ "r":0.4716981132,
475
+ "f":0.3144654088
476
  },
477
  "nmod":{
478
+ "p":0.7105263158,
479
+ "r":0.685546875,
480
+ "f":0.6978131213
481
  },
482
  "iobj":{
483
  "p":0.9375,
484
  "r":0.6818181818,
485
  "f":0.7894736842
486
  },
 
 
 
 
 
487
  "xcomp":{
488
+ "p":0.6,
489
+ "r":0.406779661,
490
+ "f":0.4848484848
491
  },
492
  "list":{
493
  "p":0.5,
494
+ "r":0.2777777778,
495
+ "f":0.3571428571
496
  },
497
  "vocative":{
498
  "p":0.0,
 
500
  "f":0.0
501
  },
502
  "fixed":{
503
+ "p":0.9444444444,
504
+ "r":0.8292682927,
505
+ "f":0.8831168831
506
+ },
507
+ "appos":{
508
+ "p":0.7142857143,
509
+ "r":0.6060606061,
510
+ "f":0.6557377049
511
  },
512
  "expl":{
513
+ "p":0.9393939394,
514
  "r":0.9117647059,
515
+ "f":0.9253731343
 
 
 
 
 
516
  },
517
  "obl:tmod":{
518
+ "p":0.8333333333,
519
+ "r":0.5555555556,
520
+ "f":0.6666666667
521
  },
522
  "discourse":{
523
  "p":0.0,
524
  "r":0.0,
525
  "f":0.0
526
+ },
527
+ "obl:lmod":{
528
+ "p":0.0,
529
+ "r":0.0,
530
+ "f":0.0
531
  }
532
  },
533
+ "lemma_acc":0.9459564165,
534
+ "tag_acc":0.9746222394,
535
+ "ents_p":0.8118609407,
536
+ "ents_r":0.8270833333,
537
+ "ents_f":0.8194014448,
538
  "ents_per_type":{
539
  "PER":{
540
+ "p":0.9018404908,
541
+ "r":0.8855421687,
542
+ "f":0.8936170213
543
  },
544
  "ORG":{
545
+ "p":0.7721518987,
546
  "r":0.6777777778,
547
+ "f":0.7218934911
548
  },
549
  "MISC":{
550
+ "p":0.6717557252,
551
  "r":0.7787610619,
552
+ "f":0.7213114754
553
  },
554
  "LOC":{
555
+ "p":0.8706896552,
556
+ "r":0.9099099099,
557
+ "f":0.8898678414
558
  }
559
  },
560
+ "speed":4656.9787909711
561
  },
562
  "sources":[
563
  {
morphologizer/model CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:dfcee92927fea22e281ff4353f6d9f83987080281d660f2ffa660def49afc778
3
  size 483580
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c8a3ae82c904aa28889940d9016755ac854a0a9c9afb2df2b70cdcfef1aa05b3
3
  size 483580
ner/model CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ccf3070c7c563d900cc0aca1bbedfc77218f2913a6c64a7ab6b6eba27b3616f2
3
  size 225962
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:197720aa3b307d6f5848667f84118234ab76bbebbb3c13e69c76a35c3011a940
3
  size 225962
parser/model CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f59d85e1386120fbc4b9e08a54154b02d6bb9c127f2bd134919f44a440c21d2d
3
  size 460325
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:26bac3bcbe1f667cd32dbeb56fa105c836c07793fd807ce05535c65b805f6d31
3
  size 460325
transformer/model CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0bb5cfb40995a176fa623ed9b8ca09994bc9f1958744828841ca99fb6b587375
3
- size 443557620
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:baaad1b1983daf896766f03d629faafd62a9e8de1d70f61d0f03553695c46a8a
3
+ size 443557655
vocab/strings.json CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0d945b8e51d0aca0dbcd80c35be1423ec2654e6dda61911528209bbe5ddbd18d
3
- size 469391
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:847c6829b856ad53cba8dd709f129df89311d57390c82a164d70c6ed000daa01
3
+ size 469274