adrianeboyd commited on
Commit
5daa22f
1 Parent(s): a56a017

Update spaCy pipeline

Browse files
README.md CHANGED
@@ -14,62 +14,62 @@ model-index:
14
  metrics:
15
  - name: NER Precision
16
  type: precision
17
- value: 0.7845934379
18
  - name: NER Recall
19
  type: recall
20
- value: 0.7607192254
21
  - name: NER F Score
22
  type: f_score
23
- value: 0.7724719101
24
  - task:
25
  name: TAG
26
  type: token-classification
27
  metrics:
28
  - name: TAG (XPOS) Accuracy
29
  type: accuracy
30
- value: 0.9538495093
31
  - task:
32
  name: POS
33
  type: token-classification
34
  metrics:
35
  - name: POS (UPOS) Accuracy
36
  type: accuracy
37
- value: 0.9666739368
38
  - task:
39
  name: MORPH
40
  type: token-classification
41
  metrics:
42
  - name: Morph (UFeats) Accuracy
43
  type: accuracy
44
- value: 0.9639000982
45
  - task:
46
  name: LEMMA
47
  type: token-classification
48
  metrics:
49
  - name: Lemma Accuracy
50
  type: accuracy
51
- value: 0.9568877162
52
  - task:
53
  name: UNLABELED_DEPENDENCIES
54
  type: token-classification
55
  metrics:
56
  - name: Unlabeled Attachment Score (UAS)
57
  type: f_score
58
- value: 0.8682669641
59
  - task:
60
  name: LABELED_DEPENDENCIES
61
  type: token-classification
62
  metrics:
63
  - name: Labeled Attachment Score (LAS)
64
  type: f_score
65
- value: 0.8246685762
66
  - task:
67
  name: SENTS
68
  type: token-classification
69
  metrics:
70
  - name: Sentences F-Score
71
  type: f_score
72
- value: 0.8765867419
73
  ---
74
  ### Details: https://spacy.io/models/nl#nl_core_news_lg
75
 
@@ -78,8 +78,8 @@ Dutch pipeline optimized for CPU. Components: tok2vec, morphologizer, tagger, pa
78
  | Feature | Description |
79
  | --- | --- |
80
  | **Name** | `nl_core_news_lg` |
81
- | **Version** | `3.4.0` |
82
- | **spaCy** | `>=3.4.0,<3.5.0` |
83
  | **Default Pipeline** | `tok2vec`, `morphologizer`, `tagger`, `parser`, `lemmatizer`, `attribute_ruler`, `ner` |
84
  | **Components** | `tok2vec`, `morphologizer`, `tagger`, `parser`, `lemmatizer`, `senter`, `attribute_ruler`, `ner` |
85
  | **Vectors** | 500000 keys, 500000 unique vectors (300 dimensions) |
@@ -106,22 +106,22 @@ Dutch pipeline optimized for CPU. Components: tok2vec, morphologizer, tagger, pa
106
 
107
  | Type | Score |
108
  | --- | --- |
109
- | `TAG_ACC` | 95.38 |
110
- | `SENTS_P` | 86.20 |
111
- | `SENTS_R` | 89.17 |
112
- | `SENTS_F` | 87.66 |
113
- | `DEP_UAS` | 86.83 |
114
- | `DEP_LAS` | 82.47 |
115
- | `ENTS_P` | 78.46 |
116
- | `ENTS_R` | 76.07 |
117
- | `ENTS_F` | 77.25 |
118
- | `TOKEN_ACC` | 99.97 |
119
  | `TOKEN_P` | 99.74 |
120
  | `TOKEN_R` | 99.76 |
121
  | `TOKEN_F` | 99.75 |
122
- | `POS_ACC` | 96.67 |
123
- | `MORPH_ACC` | 96.39 |
124
- | `MORPH_MICRO_P` | 97.41 |
125
- | `MORPH_MICRO_R` | 95.71 |
126
- | `MORPH_MICRO_F` | 96.56 |
127
- | `LEMMA_ACC` | 95.69 |
14
  metrics:
15
  - name: NER Precision
16
  type: precision
17
+ value: 0.7850940666
18
  - name: NER Recall
19
  type: recall
20
+ value: 0.7503457815
21
  - name: NER F Score
22
  type: f_score
23
+ value: 0.7673267327
24
  - task:
25
  name: TAG
26
  type: token-classification
27
  metrics:
28
  - name: TAG (XPOS) Accuracy
29
  type: accuracy
30
+ value: 0.9514067612
31
  - task:
32
  name: POS
33
  type: token-classification
34
  metrics:
35
  - name: POS (UPOS) Accuracy
36
  type: accuracy
37
+ value: 0.9638822246
38
  - task:
39
  name: MORPH
40
  type: token-classification
41
  metrics:
42
  - name: Morph (UFeats) Accuracy
43
  type: accuracy
44
+ value: 0.9628967172
45
  - task:
46
  name: LEMMA
47
  type: token-classification
48
  metrics:
49
  - name: Lemma Accuracy
50
  type: accuracy
51
+ value: 0.9556229147
52
  - task:
53
  name: UNLABELED_DEPENDENCIES
54
  type: token-classification
55
  metrics:
56
  - name: Unlabeled Attachment Score (UAS)
57
  type: f_score
58
+ value: 0.8702417761
59
  - task:
60
  name: LABELED_DEPENDENCIES
61
  type: token-classification
62
  metrics:
63
  - name: Labeled Attachment Score (LAS)
64
  type: f_score
65
+ value: 0.8253421186
66
  - task:
67
  name: SENTS
68
  type: token-classification
69
  metrics:
70
  - name: Sentences F-Score
71
  type: f_score
72
+ value: 0.8731501057
73
  ---
74
  ### Details: https://spacy.io/models/nl#nl_core_news_lg
75
 
78
  | Feature | Description |
79
  | --- | --- |
80
  | **Name** | `nl_core_news_lg` |
81
+ | **Version** | `3.5.0` |
82
+ | **spaCy** | `>=3.5.0,<3.6.0` |
83
  | **Default Pipeline** | `tok2vec`, `morphologizer`, `tagger`, `parser`, `lemmatizer`, `attribute_ruler`, `ner` |
84
  | **Components** | `tok2vec`, `morphologizer`, `tagger`, `parser`, `lemmatizer`, `senter`, `attribute_ruler`, `ner` |
85
  | **Vectors** | 500000 keys, 500000 unique vectors (300 dimensions) |
106
 
107
  | Type | Score |
108
  | --- | --- |
109
+ | `TAG_ACC` | 95.14 |
110
+ | `SENTS_P` | 85.80 |
111
+ | `SENTS_R` | 88.88 |
112
+ | `SENTS_F` | 87.32 |
113
+ | `DEP_UAS` | 87.02 |
114
+ | `DEP_LAS` | 82.53 |
115
+ | `ENTS_P` | 78.51 |
116
+ | `ENTS_R` | 75.03 |
117
+ | `ENTS_F` | 76.73 |
118
+ | `TOKEN_ACC` | 99.94 |
119
  | `TOKEN_P` | 99.74 |
120
  | `TOKEN_R` | 99.76 |
121
  | `TOKEN_F` | 99.75 |
122
+ | `POS_ACC` | 96.39 |
123
+ | `MORPH_ACC` | 96.29 |
124
+ | `MORPH_MICRO_P` | 97.12 |
125
+ | `MORPH_MICRO_R` | 95.47 |
126
+ | `MORPH_MICRO_F` | 96.29 |
127
+ | `LEMMA_ACC` | 95.56 |
accuracy.json CHANGED
@@ -1,191 +1,196 @@
1
  {
2
- "tag_acc": 0.9538495093,
3
- "sents_p": 0.8619972261,
4
- "sents_r": 0.8916786227,
5
- "sents_f": 0.8765867419,
6
- "dep_uas": 0.8682669641,
7
- "dep_las": 0.8246685762,
8
  "dep_las_per_type": {
9
  "nmod:poss": {
10
- "p": 0.9522058824,
11
- "r": 0.9452554745,
12
- "f": 0.9487179487
13
  },
14
  "nsubj": {
15
- "p": 0.8483072917,
16
- "r": 0.8566732413,
17
- "f": 0.8524697416
18
  },
19
  "aux": {
20
- "p": 0.9150326797,
21
- "r": 0.9210526316,
22
- "f": 0.9180327869
23
  },
24
  "advmod": {
25
- "p": 0.7968337731,
26
- "r": 0.8089285714,
27
- "f": 0.8028356225
28
  },
29
  "root": {
30
- "p": 0.8689320388,
31
- "r": 0.8988522238,
32
- "f": 0.8836389281
33
  },
34
  "det": {
35
- "p": 0.9430724152,
36
- "r": 0.9749026395,
37
- "f": 0.9587234043
38
  },
39
  "amod": {
40
- "p": 0.8828193833,
41
  "r": 0.8978494624,
42
- "f": 0.8902709907
43
  },
44
  "obl": {
45
- "p": 0.7610619469,
46
- "r": 0.7569397427,
47
- "f": 0.7589952478
48
  },
49
  "mark": {
50
- "p": 0.8918918919,
51
- "r": 0.9,
52
- "f": 0.8959276018
53
  },
54
  "ccomp": {
55
- "p": 0.6979166667,
56
- "r": 0.6261682243,
57
- "f": 0.6600985222
58
  },
59
  "case": {
60
- "p": 0.9368811881,
61
- "r": 0.9618805591,
62
- "f": 0.9492163009
63
  },
64
  "appos": {
65
- "p": 0.707165109,
66
- "r": 0.6878787879,
67
- "f": 0.6973886329
68
  },
69
  "obj": {
70
- "p": 0.7573529412,
71
- "r": 0.786259542,
72
- "f": 0.7715355805
73
  },
74
  "compound:prt": {
75
- "p": 0.7692307692,
76
- "r": 0.7042253521,
77
- "f": 0.7352941176
78
  },
79
  "xcomp": {
80
- "p": 0.6642599278,
81
- "r": 0.6690909091,
82
- "f": 0.6666666667
83
  },
84
  "flat": {
85
- "p": 0.8215527231,
86
- "r": 0.7518557794,
87
- "f": 0.7851605759
88
  },
89
  "expl:pv": {
90
- "p": 0.7619047619,
91
  "r": 0.7272727273,
92
- "f": 0.7441860465
93
  },
94
  "acl": {
95
- "p": 0.4404761905,
96
- "r": 0.3775510204,
97
- "f": 0.4065934066
98
  },
99
  "advcl": {
100
- "p": 0.5577889447,
101
- "r": 0.5,
102
- "f": 0.5273159145
103
  },
104
  "nummod": {
105
- "p": 0.8291139241,
106
- "r": 0.8733333333,
107
- "f": 0.8506493506
108
  },
109
  "nmod": {
110
- "p": 0.7201986755,
111
  "r": 0.7565217391,
112
- "f": 0.737913486
113
  },
114
  "cc": {
115
- "p": 0.8536585366,
116
- "r": 0.8617424242,
117
- "f": 0.8576814326
118
  },
119
  "conj": {
120
- "p": 0.6527777778,
121
- "r": 0.6385869565,
122
- "f": 0.6456043956
123
  },
124
  "nsubj:pass": {
125
- "p": 0.8128654971,
126
- "r": 0.8742138365,
127
- "f": 0.8424242424
128
  },
129
  "aux:pass": {
130
- "p": 0.9095744681,
131
- "r": 0.95,
132
- "f": 0.9293478261
133
  },
134
- "cop": {
135
- "p": 0.7900355872,
136
- "r": 0.8131868132,
137
- "f": 0.8014440433
138
  },
139
- "parataxis": {
140
- "p": 0.3349282297,
141
- "r": 0.2536231884,
142
- "f": 0.2886597938
143
  },
144
  "acl:relcl": {
145
- "p": 0.701863354,
146
- "r": 0.7106918239,
147
- "f": 0.70625
148
  },
149
- "expl": {
150
- "p": 0.4166666667,
151
- "r": 0.4761904762,
152
- "f": 0.4444444444
153
  },
154
- "iobj": {
155
- "p": 0.6470588235,
156
- "r": 0.3333333333,
157
- "f": 0.44
158
  },
159
  "fixed": {
160
- "p": 0.7255434783,
161
- "r": 0.4828209765,
162
- "f": 0.5798045603
163
  },
164
  "obl:agent": {
165
- "p": 0.8387096774,
166
  "r": 0.8965517241,
167
- "f": 0.8666666667
168
  },
169
  "csubj": {
170
- "p": 0.45,
171
  "r": 0.45,
172
- "f": 0.45
173
  },
174
- "dep": {
175
  "p": 0.0,
176
  "r": 0.0,
177
  "f": 0.0
178
  },
179
- "orphan": {
180
  "p": 0.0,
181
  "r": 0.0,
182
  "f": 0.0
183
  }
184
  },
185
- "ents_p": 0.7845934379,
186
- "ents_r": 0.7607192254,
187
- "ents_f": 0.7724719101,
188
  "ents_per_type": {
 
 
 
 
 
189
  "PERSON": {
190
  "p": 0.0,
191
  "r": 0.0,
@@ -211,132 +216,127 @@
211
  "r": 0.0,
212
  "f": 0.0
213
  },
214
- "WORK_OF_ART": {
215
- "p": 0.0,
216
- "r": 0.0,
217
- "f": 0.0
218
- },
219
- "PRODUCT": {
220
  "p": 0.0,
221
  "r": 0.0,
222
  "f": 0.0
223
  },
224
- "EVENT": {
225
  "p": 0.0,
226
  "r": 0.0,
227
  "f": 0.0
228
  },
229
- "NORP": {
230
  "p": 0.0,
231
  "r": 0.0,
232
  "f": 0.0
233
  },
234
- "DATE": {
235
  "p": 0.0,
236
  "r": 0.0,
237
  "f": 0.0
238
  },
239
- "ORDINAL": {
240
  "p": 0.0,
241
  "r": 0.0,
242
  "f": 0.0
243
  },
244
- "LANGUAGE": {
245
  "p": 0.0,
246
  "r": 0.0,
247
  "f": 0.0
248
  },
249
- "TIME": {
250
  "p": 0.0,
251
  "r": 0.0,
252
  "f": 0.0
253
  },
254
- "PERCENT": {
255
  "p": 0.0,
256
  "r": 0.0,
257
  "f": 0.0
258
  },
259
- "LOC": {
260
  "p": 0.0,
261
  "r": 0.0,
262
  "f": 0.0
263
  },
264
- "FAC": {
265
  "p": 0.0,
266
  "r": 0.0,
267
  "f": 0.0
268
  },
269
- "MONEY": {
270
  "p": 0.0,
271
  "r": 0.0,
272
  "f": 0.0
273
  },
274
- "LAW": {
275
  "p": 0.0,
276
  "r": 0.0,
277
  "f": 0.0
278
  }
279
  },
280
- "speed": 10089.2857654723,
281
- "token_acc": 0.9997165842,
282
  "token_p": 0.9974281853,
283
  "token_r": 0.9975586363,
284
  "token_f": 0.9974934066,
285
- "pos_acc": 0.9666739368,
286
- "morph_acc": 0.9639000982,
287
- "morph_micro_p": 0.9741415265,
288
- "morph_micro_r": 0.9571096845,
289
- "morph_micro_f": 0.965550503,
290
  "morph_per_feat": {
291
  "Person": {
292
- "p": 0.994157741,
293
- "r": 0.9760994264,
294
- "f": 0.9850458273
295
  },
296
  "Poss": {
297
- "p": 0.9886363636,
298
- "r": 1.0,
299
- "f": 0.9942857143
300
  },
301
  "PronType": {
302
- "p": 0.9914965986,
303
- "r": 0.9692435578,
304
- "f": 0.9802437999
305
  },
306
  "Gender": {
307
- "p": 0.9321944809,
308
- "r": 0.9023149326,
309
- "f": 0.9170113754
310
  },
311
  "Number": {
312
- "p": 0.9844227245,
313
- "r": 0.9648256249,
314
- "f": 0.9745256633
315
  },
316
  "Tense": {
317
- "p": 0.9838530067,
318
- "r": 0.9714128642,
319
- "f": 0.977593361
320
  },
321
  "VerbForm": {
322
- "p": 0.9687726943,
323
- "r": 0.9600575747,
324
- "f": 0.9643954455
325
  },
326
  "Degree": {
327
- "p": 0.9598246896,
328
- "r": 0.9439655172,
329
- "f": 0.9518290474
330
  },
331
  "Definite": {
332
- "p": 0.9964757709,
333
- "r": 0.9955985915,
334
- "f": 0.9960369881
335
  },
336
  "Case": {
337
- "p": 0.998003992,
338
- "r": 0.9960159363,
339
- "f": 0.9970089731
340
  },
341
  "Reflex": {
342
  "p": 1.0,
@@ -349,5 +349,5 @@
349
  "f": 0.7142857143
350
  }
351
  },
352
- "lemma_acc": 0.9568877162
353
  }
1
  {
2
+ "tag_acc": 0.9514067612,
3
+ "sents_p": 0.858033241,
4
+ "sents_r": 0.8888091822,
5
+ "sents_f": 0.8731501057,
6
+ "dep_uas": 0.8702417761,
7
+ "dep_las": 0.8253421186,
8
  "dep_las_per_type": {
9
  "nmod:poss": {
10
+ "p": 0.9448529412,
11
+ "r": 0.9379562044,
12
+ "f": 0.9413919414
13
  },
14
  "nsubj": {
15
+ "p": 0.8506493506,
16
+ "r": 0.8612754767,
17
+ "f": 0.8559294348
18
  },
19
  "aux": {
20
+ "p": 0.8942307692,
21
+ "r": 0.9177631579,
22
+ "f": 0.9058441558
23
  },
24
  "advmod": {
25
+ "p": 0.7902097902,
26
+ "r": 0.8071428571,
27
+ "f": 0.7985865724
28
  },
29
  "root": {
30
+ "p": 0.875952876,
31
+ "r": 0.9067431851,
32
+ "f": 0.891082129
33
  },
34
  "det": {
35
+ "p": 0.9426057813,
36
+ "r": 0.9736045002,
37
+ "f": 0.9578544061
38
  },
39
  "amod": {
40
+ "p": 0.8789473684,
41
  "r": 0.8978494624,
42
+ "f": 0.8882978723
43
  },
44
  "obl": {
45
+ "p": 0.7619367855,
46
+ "r": 0.7670954638,
47
+ "f": 0.7645074224
48
  },
49
  "mark": {
50
+ "p": 0.9007220217,
51
+ "r": 0.9072727273,
52
+ "f": 0.9039855072
53
  },
54
  "ccomp": {
55
+ "p": 0.7,
56
+ "r": 0.6542056075,
57
+ "f": 0.6763285024
58
  },
59
  "case": {
60
+ "p": 0.9373703857,
61
+ "r": 0.9572215163,
62
+ "f": 0.9471919531
63
  },
64
  "appos": {
65
+ "p": 0.7391304348,
66
+ "r": 0.7212121212,
67
+ "f": 0.7300613497
68
  },
69
  "obj": {
70
+ "p": 0.7731343284,
71
+ "r": 0.7908396947,
72
+ "f": 0.7818867925
73
  },
74
  "compound:prt": {
75
+ "p": 0.7736842105,
76
+ "r": 0.6901408451,
77
+ "f": 0.729528536
78
  },
79
  "xcomp": {
80
+ "p": 0.6559139785,
81
+ "r": 0.6654545455,
82
+ "f": 0.6606498195
83
  },
84
  "flat": {
85
+ "p": 0.7821782178,
86
+ "r": 0.7539766702,
87
+ "f": 0.7678185745
88
  },
89
  "expl:pv": {
90
+ "p": 0.8,
91
  "r": 0.7272727273,
92
+ "f": 0.7619047619
93
  },
94
  "acl": {
95
+ "p": 0.5373134328,
96
+ "r": 0.3673469388,
97
+ "f": 0.4363636364
98
  },
99
  "advcl": {
100
+ "p": 0.4953271028,
101
+ "r": 0.4774774775,
102
+ "f": 0.4862385321
103
  },
104
  "nummod": {
105
+ "p": 0.798136646,
106
+ "r": 0.8566666667,
107
+ "f": 0.8263665595
108
  },
109
  "nmod": {
110
+ "p": 0.7304785894,
111
  "r": 0.7565217391,
112
+ "f": 0.7432721059
113
  },
114
  "cc": {
115
+ "p": 0.8598484848,
116
+ "r": 0.8598484848,
117
+ "f": 0.8598484848
118
  },
119
  "conj": {
120
+ "p": 0.6921985816,
121
+ "r": 0.6630434783,
122
+ "f": 0.6773074254
123
  },
124
  "nsubj:pass": {
125
+ "p": 0.8333333333,
126
+ "r": 0.8490566038,
127
+ "f": 0.8411214953
128
  },
129
  "aux:pass": {
130
+ "p": 0.8918918919,
131
+ "r": 0.9166666667,
132
+ "f": 0.904109589
133
  },
134
+ "iobj": {
135
+ "p": 0.5416666667,
136
+ "r": 0.3939393939,
137
+ "f": 0.4561403509
138
  },
139
+ "cop": {
140
+ "p": 0.7738515901,
141
+ "r": 0.8021978022,
142
+ "f": 0.7877697842
143
  },
144
  "acl:relcl": {
145
+ "p": 0.7142857143,
146
+ "r": 0.7232704403,
147
+ "f": 0.71875
148
  },
149
+ "parataxis": {
150
+ "p": 0.3971291866,
151
+ "r": 0.3007246377,
152
+ "f": 0.3422680412
153
  },
154
+ "expl": {
155
+ "p": 0.44,
156
+ "r": 0.5238095238,
157
+ "f": 0.4782608696
158
  },
159
  "fixed": {
160
+ "p": 0.676056338,
161
+ "r": 0.4339963834,
162
+ "f": 0.5286343612
163
  },
164
  "obl:agent": {
165
+ "p": 0.962962963,
166
  "r": 0.8965517241,
167
+ "f": 0.9285714286
168
  },
169
  "csubj": {
170
+ "p": 0.5625,
171
  "r": 0.45,
172
+ "f": 0.5
173
  },
174
+ "orphan": {
175
  "p": 0.0,
176
  "r": 0.0,
177
  "f": 0.0
178
  },
179
+ "dep": {
180
  "p": 0.0,
181
  "r": 0.0,
182
  "f": 0.0
183
  }
184
  },
185
+ "ents_p": 0.7850940666,
186
+ "ents_r": 0.7503457815,
187
+ "ents_f": 0.7673267327,
188
  "ents_per_type": {
189
+ "DATE": {
190
+ "p": 0.0,
191
+ "r": 0.0,
192
+ "f": 0.0
193
+ },
194
  "PERSON": {
195
  "p": 0.0,
196
  "r": 0.0,
216
  "r": 0.0,
217
  "f": 0.0
218
  },
219
+ "EVENT": {
 
 
 
 
 
220
  "p": 0.0,
221
  "r": 0.0,
222
  "f": 0.0
223
  },
224
+ "NORP": {
225
  "p": 0.0,
226
  "r": 0.0,
227
  "f": 0.0
228
  },
229
+ "ORDINAL": {
230
  "p": 0.0,
231
  "r": 0.0,
232
  "f": 0.0
233
  },
234
+ "LANGUAGE": {
235
  "p": 0.0,
236
  "r": 0.0,
237
  "f": 0.0
238
  },
239
+ "FAC": {
240
  "p": 0.0,
241
  "r": 0.0,
242
  "f": 0.0
243
  },
244
+ "WORK_OF_ART": {
245
  "p": 0.0,
246
  "r": 0.0,
247
  "f": 0.0
248
  },
249
+ "LOC": {
250
  "p": 0.0,
251
  "r": 0.0,
252
  "f": 0.0
253
  },
254
+ "PRODUCT": {
255
  "p": 0.0,
256
  "r": 0.0,
257
  "f": 0.0
258
  },
259
+ "MONEY": {
260
  "p": 0.0,
261
  "r": 0.0,
262
  "f": 0.0
263
  },
264
+ "TIME": {
265
  "p": 0.0,
266
  "r": 0.0,
267
  "f": 0.0
268
  },
269
+ "LAW": {
270
  "p": 0.0,
271
  "r": 0.0,
272
  "f": 0.0
273
  },
274
+ "PERCENT": {
275
  "p": 0.0,
276
  "r": 0.0,
277
  "f": 0.0
278
  }
279
  },
280
+ "speed": 10878.7516353688,
281
+ "token_acc": 0.999433329,
282
  "token_p": 0.9974281853,
283
  "token_r": 0.9975586363,
284
  "token_f": 0.9974934066,
285
+ "pos_acc": 0.9638822246,
286
+ "morph_acc": 0.9628967172,
287
+ "morph_micro_p": 0.9711903659,
288
+ "morph_micro_r": 0.9546965351,
289
+ "morph_micro_f": 0.9628728216,
290
  "morph_per_feat": {
291
  "Person": {
292
+ "p": 0.9912280702,
293
+ "r": 0.9722753346,
294
+ "f": 0.9816602317
295
  },
296
  "Poss": {
297
+ "p": 0.992248062,
298
+ "r": 0.9808429119,
299
+ "f": 0.9865125241
300
  },
301
  "PronType": {
302
+ "p": 0.989787234,
303
+ "r": 0.9667497922,
304
+ "f": 0.9781328848
305
  },
306
  "Gender": {
307
+ "p": 0.9335968379,
308
+ "r": 0.9012973798,
309
+ "f": 0.9171628268
310
  },
311
  "Number": {
312
+ "p": 0.980195003,
313
+ "r": 0.9630294866,
314
+ "f": 0.9715364288
315
  },
316
  "Tense": {
317
+ "p": 0.9724517906,
318
+ "r": 0.970313359,
319
+ "f": 0.9713813979
320
  },
321
  "VerbForm": {
322
+ "p": 0.9609261939,
323
+ "r": 0.9557394746,
324
+ "f": 0.9583258163
325
  },
326
  "Degree": {
327
+ "p": 0.9626099707,
328
+ "r": 0.9432471264,
329
+ "f": 0.9528301887
330
  },
331
  "Definite": {
332
+ "p": 0.9973439575,
333
+ "r": 0.9916373239,
334
+ "f": 0.9944824542
335
  },
336
  "Case": {
337
+ "p": 0.996007984,
338
+ "r": 0.9940239044,
339
+ "f": 0.9950149551
340
  },
341
  "Reflex": {
342
  "p": 1.0,
349
  "f": 0.7142857143
350
  }
351
  },
352
+ "lemma_acc": 0.9556229147
353
  }
config.cfg CHANGED
@@ -81,8 +81,8 @@ nO = null
81
  [components.ner.model.tok2vec.embed]
82
  @architectures = "spacy.MultiHashEmbed.v2"
83
  width = 96
84
- attrs = ["NORM","PREFIX","SUFFIX","SHAPE","SPACY"]
85
- rows = [5000,1000,2500,2500,50]
86
  include_static_vectors = true
87
 
88
  [components.ner.model.tok2vec.encode]
@@ -166,8 +166,8 @@ factory = "tok2vec"
166
  [components.tok2vec.model.embed]
167
  @architectures = "spacy.MultiHashEmbed.v2"
168
  width = ${components.tok2vec.model.encode:width}
169
- attrs = ["NORM","PREFIX","SUFFIX","SHAPE","SPACY"]
170
- rows = [5000,1000,2500,2500,50]
171
  include_static_vectors = true
172
 
173
  [components.tok2vec.model.encode]
@@ -209,6 +209,7 @@ eval_frequency = 1000
209
  frozen_components = []
210
  before_to_disk = null
211
  annotating_components = []
 
212
 
213
  [training.batcher]
214
  @batchers = "spacy.batch_by_words.v1"
81
  [components.ner.model.tok2vec.embed]
82
  @architectures = "spacy.MultiHashEmbed.v2"
83
  width = 96
84
+ attrs = ["NORM","PREFIX","SUFFIX","SHAPE"]
85
+ rows = [5000,1000,2500,2500]
86
  include_static_vectors = true
87
 
88
  [components.ner.model.tok2vec.encode]
166
  [components.tok2vec.model.embed]
167
  @architectures = "spacy.MultiHashEmbed.v2"
168
  width = ${components.tok2vec.model.encode:width}
169
+ attrs = ["NORM","PREFIX","SUFFIX","SHAPE","SPACY","IS_SPACE"]
170
+ rows = [5000,1000,2500,2500,50,50]
171
  include_static_vectors = true
172
 
173
  [components.tok2vec.model.encode]
209
  frozen_components = []
210
  before_to_disk = null
211
  annotating_components = []
212
+ before_update = null
213
 
214
  [training.batcher]
215
  @batchers = "spacy.batch_by_words.v1"
lemmatizer/model CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a1187f468c84c03816a17d6c97a314c5cbaaa30b602717f50a7b7184431b285b
3
  size 408618
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a825038de2a3a544f5ddacc8b12267d14a7abfca221f6952a16576e54b25ca6c
3
  size 408618
meta.json CHANGED
@@ -1,14 +1,14 @@
1
  {
2
  "lang":"nl",
3
  "name":"core_news_lg",
4
- "version":"3.4.0",
5
  "description":"Dutch pipeline optimized for CPU. Components: tok2vec, morphologizer, tagger, parser, lemmatizer (trainable_lemmatizer), senter, ner.",
6
  "author":"Explosion",
7
  "email":"contact@explosion.ai",
8
  "url":"https://explosion.ai",
9
  "license":"CC BY-SA 4.0",
10
- "spacy_version":">=3.4.0,<3.5.0",
11
- "spacy_git_version":"dd038b536",
12
  "vectors":{
13
  "width":300,
14
  "vectors":500000,
@@ -377,193 +377,198 @@
377
  "senter"
378
  ],
379
  "performance":{
380
- "tag_acc":0.9538495093,
381
- "sents_p":0.8619972261,
382
- "sents_r":0.8916786227,
383
- "sents_f":0.8765867419,
384
- "dep_uas":0.8682669641,
385
- "dep_las":0.8246685762,
386
  "dep_las_per_type":{
387
  "nmod:poss":{
388
- "p":0.9522058824,
389
- "r":0.9452554745,
390
- "f":0.9487179487
391
  },
392
  "nsubj":{
393
- "p":0.8483072917,
394
- "r":0.8566732413,
395
- "f":0.8524697416
396
  },
397
  "aux":{
398
- "p":0.9150326797,
399
- "r":0.9210526316,
400
- "f":0.9180327869
401
  },
402
  "advmod":{
403
- "p":0.7968337731,
404
- "r":0.8089285714,
405
- "f":0.8028356225
406
  },
407
  "root":{
408
- "p":0.8689320388,
409
- "r":0.8988522238,
410
- "f":0.8836389281
411
  },
412
  "det":{
413
- "p":0.9430724152,
414
- "r":0.9749026395,
415
- "f":0.9587234043
416
  },
417
  "amod":{
418
- "p":0.8828193833,
419
  "r":0.8978494624,
420
- "f":0.8902709907
421
  },
422
  "obl":{
423
- "p":0.7610619469,
424
- "r":0.7569397427,
425
- "f":0.7589952478
426
  },
427
  "mark":{
428
- "p":0.8918918919,
429
- "r":0.9,
430
- "f":0.8959276018
431
  },
432
  "ccomp":{
433
- "p":0.6979166667,
434
- "r":0.6261682243,
435
- "f":0.6600985222
436
  },
437
  "case":{
438
- "p":0.9368811881,
439
- "r":0.9618805591,
440
- "f":0.9492163009
441
  },
442
  "appos":{
443
- "p":0.707165109,
444
- "r":0.6878787879,
445
- "f":0.6973886329
446
  },
447
  "obj":{
448
- "p":0.7573529412,
449
- "r":0.786259542,
450
- "f":0.7715355805
451
  },
452
  "compound:prt":{
453
- "p":0.7692307692,
454
- "r":0.7042253521,
455
- "f":0.7352941176
456
  },
457
  "xcomp":{
458
- "p":0.6642599278,
459
- "r":0.6690909091,
460
- "f":0.6666666667
461
  },
462
  "flat":{
463
- "p":0.8215527231,
464
- "r":0.7518557794,
465
- "f":0.7851605759
466
  },
467
  "expl:pv":{
468
- "p":0.7619047619,
469
  "r":0.7272727273,
470
- "f":0.7441860465
471
  },
472
  "acl":{
473
- "p":0.4404761905,
474
- "r":0.3775510204,
475
- "f":0.4065934066
476
  },
477
  "advcl":{
478
- "p":0.5577889447,
479
- "r":0.5,
480
- "f":0.5273159145
481
  },
482
  "nummod":{
483
- "p":0.8291139241,
484
- "r":0.8733333333,
485
- "f":0.8506493506
486
  },
487
  "nmod":{
488
- "p":0.7201986755,
489
  "r":0.7565217391,
490
- "f":0.737913486
491
  },
492
  "cc":{
493
- "p":0.8536585366,
494
- "r":0.8617424242,
495
- "f":0.8576814326
496
  },
497
  "conj":{
498
- "p":0.6527777778,
499
- "r":0.6385869565,
500
- "f":0.6456043956
501
  },
502
  "nsubj:pass":{
503
- "p":0.8128654971,
504
- "r":0.8742138365,
505
- "f":0.8424242424
506
  },
507
  "aux:pass":{
508
- "p":0.9095744681,
509
- "r":0.95,
510
- "f":0.9293478261
511
  },
512
- "cop":{
513
- "p":0.7900355872,
514
- "r":0.8131868132,
515
- "f":0.8014440433
516
  },
517
- "parataxis":{
518
- "p":0.3349282297,
519
- "r":0.2536231884,
520
- "f":0.2886597938
521
  },
522
  "acl:relcl":{
523
- "p":0.701863354,
524
- "r":0.7106918239,
525
- "f":0.70625
526
  },
527
- "expl":{
528
- "p":0.4166666667,
529
- "r":0.4761904762,
530
- "f":0.4444444444
531
  },
532
- "iobj":{
533
- "p":0.6470588235,
534
- "r":0.3333333333,
535
- "f":0.44
536
  },
537
  "fixed":{
538
- "p":0.7255434783,
539
- "r":0.4828209765,
540
- "f":0.5798045603
541
  },
542
  "obl:agent":{
543
- "p":0.8387096774,
544
  "r":0.8965517241,
545
- "f":0.8666666667
546
  },
547
  "csubj":{
548
- "p":0.45,
549
  "r":0.45,
550
- "f":0.45
551
  },
552
- "dep":{
553
  "p":0.0,
554
  "r":0.0,
555
  "f":0.0
556
  },
557
- "orphan":{
558
  "p":0.0,
559
  "r":0.0,
560
  "f":0.0
561
  }
562
  },
563
- "ents_p":0.7845934379,
564
- "ents_r":0.7607192254,
565
- "ents_f":0.7724719101,
566
  "ents_per_type":{
 
 
 
 
 
567
  "PERSON":{
568
  "p":0.0,
569
  "r":0.0,
@@ -589,132 +594,127 @@
589
  "r":0.0,
590
  "f":0.0
591
  },
592
- "WORK_OF_ART":{
593
- "p":0.0,
594
- "r":0.0,
595
- "f":0.0
596
- },
597
- "PRODUCT":{
598
  "p":0.0,
599
  "r":0.0,
600
  "f":0.0
601
  },
602
- "EVENT":{
603
  "p":0.0,
604
  "r":0.0,
605
  "f":0.0
606
  },
607
- "NORP":{
608
  "p":0.0,
609
  "r":0.0,
610
  "f":0.0
611
  },
612
- "DATE":{
613
  "p":0.0,
614
  "r":0.0,
615
  "f":0.0
616
  },
617
- "ORDINAL":{
618
  "p":0.0,
619
  "r":0.0,
620
  "f":0.0
621
  },
622
- "LANGUAGE":{
623
  "p":0.0,
624
  "r":0.0,
625
  "f":0.0
626
  },
627
- "TIME":{
628
  "p":0.0,
629
  "r":0.0,
630
  "f":0.0
631
  },
632
- "PERCENT":{
633
  "p":0.0,
634
  "r":0.0,
635
  "f":0.0
636
  },
637
- "LOC":{
638
  "p":0.0,
639
  "r":0.0,
640
  "f":0.0
641
  },
642
- "FAC":{
643
  "p":0.0,
644
  "r":0.0,
645
  "f":0.0
646
  },
647
- "MONEY":{
648
  "p":0.0,
649
  "r":0.0,
650
  "f":0.0
651
  },
652
- "LAW":{
653
  "p":0.0,
654
  "r":0.0,
655
  "f":0.0
656
  }
657
  },
658
- "speed":10089.2857654723,
659
- "token_acc":0.9997165842,
660
  "token_p":0.9974281853,
661
  "token_r":0.9975586363,
662
  "token_f":0.9974934066,
663
- "pos_acc":0.9666739368,
664
- "morph_acc":0.9639000982,
665
- "morph_micro_p":0.9741415265,
666
- "morph_micro_r":0.9571096845,
667
- "morph_micro_f":0.965550503,
668
  "morph_per_feat":{
669
  "Person":{
670
- "p":0.994157741,
671
- "r":0.9760994264,
672
- "f":0.9850458273
673
  },
674
  "Poss":{
675
- "p":0.9886363636,
676
- "r":1.0,
677
- "f":0.9942857143
678
  },
679
  "PronType":{
680
- "p":0.9914965986,
681
- "r":0.9692435578,
682
- "f":0.9802437999
683
  },
684
  "Gender":{
685
- "p":0.9321944809,
686
- "r":0.9023149326,
687
- "f":0.9170113754
688
  },
689
  "Number":{
690
- "p":0.9844227245,
691
- "r":0.9648256249,
692
- "f":0.9745256633
693
  },
694
  "Tense":{
695
- "p":0.9838530067,
696
- "r":0.9714128642,
697
- "f":0.977593361
698
  },
699
  "VerbForm":{
700
- "p":0.9687726943,
701
- "r":0.9600575747,
702
- "f":0.9643954455
703
  },
704
  "Degree":{
705
- "p":0.9598246896,
706
- "r":0.9439655172,
707
- "f":0.9518290474
708
  },
709
  "Definite":{
710
- "p":0.9964757709,
711
- "r":0.9955985915,
712
- "f":0.9960369881
713
  },
714
  "Case":{
715
- "p":0.998003992,
716
- "r":0.9960159363,
717
- "f":0.9970089731
718
  },
719
  "Reflex":{
720
  "p":1.0,
@@ -727,7 +727,7 @@
727
  "f":0.7142857143
728
  }
729
  },
730
- "lemma_acc":0.9568877162
731
  },
732
  "sources":[
733
  {
1
  {
2
  "lang":"nl",
3
  "name":"core_news_lg",
4
+ "version":"3.5.0",
5
  "description":"Dutch pipeline optimized for CPU. Components: tok2vec, morphologizer, tagger, parser, lemmatizer (trainable_lemmatizer), senter, ner.",
6
  "author":"Explosion",
7
  "email":"contact@explosion.ai",
8
  "url":"https://explosion.ai",
9
  "license":"CC BY-SA 4.0",
10
+ "spacy_version":">=3.5.0,<3.6.0",
11
+ "spacy_git_version":"9e0322de1",
12
  "vectors":{
13
  "width":300,
14
  "vectors":500000,
377
  "senter"
378
  ],
379
  "performance":{
380
+ "tag_acc":0.9514067612,
381
+ "sents_p":0.858033241,
382
+ "sents_r":0.8888091822,
383
+ "sents_f":0.8731501057,
384
+ "dep_uas":0.8702417761,
385
+ "dep_las":0.8253421186,
386
  "dep_las_per_type":{
387
  "nmod:poss":{
388
+ "p":0.9448529412,
389
+ "r":0.9379562044,
390
+ "f":0.9413919414
391
  },
392
  "nsubj":{
393
+ "p":0.8506493506,
394
+ "r":0.8612754767,
395
+ "f":0.8559294348
396
  },
397
  "aux":{
398
+ "p":0.8942307692,
399
+ "r":0.9177631579,
400
+ "f":0.9058441558
401
  },
402
  "advmod":{
403
+ "p":0.7902097902,
404
+ "r":0.8071428571,
405
+ "f":0.7985865724
406
  },
407
  "root":{
408
+ "p":0.875952876,
409
+ "r":0.9067431851,
410
+ "f":0.891082129
411
  },
412
  "det":{
413
+ "p":0.9426057813,
414
+ "r":0.9736045002,
415
+ "f":0.9578544061
416
  },
417
  "amod":{
418
+ "p":0.8789473684,
419
  "r":0.8978494624,
420
+ "f":0.8882978723
421
  },
422
  "obl":{
423
+ "p":0.7619367855,
424
+ "r":0.7670954638,
425
+ "f":0.7645074224
426
  },
427
  "mark":{
428
+ "p":0.9007220217,
429
+ "r":0.9072727273,
430
+ "f":0.9039855072
431
  },
432
  "ccomp":{
433
+ "p":0.7,
434
+ "r":0.6542056075,
435
+ "f":0.6763285024
436
  },
437
  "case":{
438
+ "p":0.9373703857,
439
+ "r":0.9572215163,
440
+ "f":0.9471919531
441
  },
442
  "appos":{
443
+ "p":0.7391304348,
444
+ "r":0.7212121212,
445
+ "f":0.7300613497
446
  },
447
  "obj":{
448
+ "p":0.7731343284,
449
+ "r":0.7908396947,
450
+ "f":0.7818867925
451
  },
452
  "compound:prt":{
453
+ "p":0.7736842105,
454
+ "r":0.6901408451,
455
+ "f":0.729528536
456
  },
457
  "xcomp":{
458
+ "p":0.6559139785,
459
+ "r":0.6654545455,
460
+ "f":0.6606498195
461
  },
462
  "flat":{
463
+ "p":0.7821782178,
464
+ "r":0.7539766702,
465
+ "f":0.7678185745
466
  },
467
  "expl:pv":{
468
+ "p":0.8,
469
  "r":0.7272727273,
470
+ "f":0.7619047619
471
  },
472
  "acl":{
473
+ "p":0.5373134328,
474
+ "r":0.3673469388,
475
+ "f":0.4363636364
476
  },
477
  "advcl":{
478
+ "p":0.4953271028,
479
+ "r":0.4774774775,
480
+ "f":0.4862385321
481
  },
482
  "nummod":{
483
+ "p":0.798136646,
484
+ "r":0.8566666667,
485
+ "f":0.8263665595
486
  },
487
  "nmod":{
488
+ "p":0.7304785894,
489
  "r":0.7565217391,
490
+ "f":0.7432721059
491
  },
492
  "cc":{
493
+ "p":0.8598484848,
494
+ "r":0.8598484848,
495
+ "f":0.8598484848
496
  },
497
  "conj":{
498
+ "p":0.6921985816,
499
+ "r":0.6630434783,
500
+ "f":0.6773074254
501
  },
502
  "nsubj:pass":{
503
+ "p":0.8333333333,
504
+ "r":0.8490566038,
505
+ "f":0.8411214953
506
  },
507
  "aux:pass":{
508
+ "p":0.8918918919,
509
+ "r":0.9166666667,
510
+ "f":0.904109589
511
  },
512
+ "iobj":{
513
+ "p":0.5416666667,
514
+ "r":0.3939393939,
515
+ "f":0.4561403509
516
  },
517
+ "cop":{
518
+ "p":0.7738515901,
519
+ "r":0.8021978022,
520
+ "f":0.7877697842
521
  },
522
  "acl:relcl":{
523
+ "p":0.7142857143,
524
+ "r":0.7232704403,
525
+ "f":0.71875
526
  },
527
+ "parataxis":{
528
+ "p":0.3971291866,
529
+ "r":0.3007246377,
530
+ "f":0.3422680412
531
  },
532
+ "expl":{
533
+ "p":0.44,
534
+ "r":0.5238095238,
535
+ "f":0.4782608696
536
  },
537
  "fixed":{
538
+ "p":0.676056338,
539
+ "r":0.4339963834,
540
+ "f":0.5286343612
541
  },
542
  "obl:agent":{
543
+ "p":0.962962963,
544
  "r":0.8965517241,
545
+ "f":0.9285714286
546
  },
547
  "csubj":{
548
+ "p":0.5625,
549
  "r":0.45,
550
+ "f":0.5
551
  },
552
+ "orphan":{
553
  "p":0.0,
554
  "r":0.0,
555
  "f":0.0
556
  },
557
+ "dep":{
558
  "p":0.0,
559
  "r":0.0,
560
  "f":0.0
561
  }
562
  },
563
+ "ents_p":0.7850940666,
564
+ "ents_r":0.7503457815,
565
+ "ents_f":0.7673267327,
566
  "ents_per_type":{
567
+ "DATE":{
568
+ "p":0.0,
569
+ "r":0.0,
570
+ "f":0.0
571
+ },
572
  "PERSON":{
573
  "p":0.0,
574
  "r":0.0,
594
  "r":0.0,
595
  "f":0.0
596
  },
597
+ "EVENT":{
 
 
 
 
 
598
  "p":0.0,
599
  "r":0.0,
600
  "f":0.0
601
  },
602
+ "NORP":{
603
  "p":0.0,
604
  "r":0.0,
605
  "f":0.0
606
  },
607
+ "ORDINAL":{
608
  "p":0.0,
609
  "r":0.0,
610
  "f":0.0
611
  },
612
+ "LANGUAGE":{
613
  "p":0.0,
614
  "r":0.0,
615
  "f":0.0
616
  },
617
+ "FAC":{
618
  "p":0.0,
619
  "r":0.0,
620
  "f":0.0
621
  },
622
+ "WORK_OF_ART":{
623
  "p":0.0,
624
  "r":0.0,
625
  "f":0.0
626
  },
627
+ "LOC":{
628
  "p":0.0,
629
  "r":0.0,
630
  "f":0.0
631
  },
632
+ "PRODUCT":{
633
  "p":0.0,
634
  "r":0.0,
635
  "f":0.0
636
  },
637
+ "MONEY":{
638
  "p":0.0,
639
  "r":0.0,
640
  "f":0.0
641
  },
642
+ "TIME":{
643
  "p":0.0,
644
  "r":0.0,
645
  "f":0.0
646
  },
647
+ "LAW":{
648
  "p":0.0,
649
  "r":0.0,
650
  "f":0.0
651
  },
652
+ "PERCENT":{
653
  "p":0.0,
654
  "r":0.0,
655
  "f":0.0
656
  }
657
  },
658
+ "speed":10878.7516353688,
659
+ "token_acc":0.999433329,
660
  "token_p":0.9974281853,
661
  "token_r":0.9975586363,
662
  "token_f":0.9974934066,
663
+ "pos_acc":0.9638822246,
664
+ "morph_acc":0.9628967172,
665
+ "morph_micro_p":0.9711903659,
666
+ "morph_micro_r":0.9546965351,
667
+ "morph_micro_f":0.9628728216,
668
  "morph_per_feat":{
669
  "Person":{
670
+ "p":0.9912280702,
671
+ "r":0.9722753346,
672
+ "f":0.9816602317
673
  },
674
  "Poss":{
675
+ "p":0.992248062,
676
+ "r":0.9808429119,
677
+ "f":0.9865125241
678
  },
679
  "PronType":{
680
+ "p":0.989787234,
681
+ "r":0.9667497922,
682
+ "f":0.9781328848
683
  },
684
  "Gender":{
685
+ "p":0.9335968379,
686
+ "r":0.9012973798,
687
+ "f":0.9171628268
688
  },
689
  "Number":{
690
+ "p":0.980195003,
691
+ "r":0.9630294866,
692
+ "f":0.9715364288
693
  },
694
  "Tense":{
695
+ "p":0.9724517906,
696
+ "r":0.970313359,
697
+ "f":0.9713813979
698
  },
699
  "VerbForm":{
700
+ "p":0.9609261939,
701
+ "r":0.9557394746,
702
+ "f":0.9583258163
703
  },
704
  "Degree":{
705
+ "p":0.9626099707,
706
+ "r":0.9432471264,
707
+ "f":0.9528301887
708
  },
709
  "Definite":{
710
+ "p":0.9973439575,
711
+ "r":0.9916373239,
712
+ "f":0.9944824542
713
  },
714
  "Case":{
715
+ "p":0.996007984,
716
+ "r":0.9940239044,
717
+ "f":0.9950149551
718
  },
719
  "Reflex":{
720
  "p":1.0,
727
  "f":0.7142857143
728
  }
729
  },
730
+ "lemma_acc":0.9556229147
731
  },
732
  "sources":[
733
  {
morphologizer/model CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:85008130e8c322f8f5cec41d1470689ab18b81a65681341b3a5b12b5e838e89c
3
  size 26038
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bf620287e4ac94d40287bec36bbb949c9dcf6a59faaadfe69d7d6ea1fde5c33f
3
  size 26038
ner/model CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:13100cddcae2839fa86aa0979ef9eba092e9736a94459f92ef6309cb52071d35
3
- size 6511153
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a3929a795336976b0ec60763be940b14d561eaf7d4e57c144720df057430b5d4
3
+ size 6380943
nl_core_news_lg-any-py3-none-any.whl CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4f8ab23ba250ffeaf98a70822fcbf08ea1d6aa59774faacae113dfc8559fc4f4
3
- size 568072659
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6e2ad45119b8fd79a1feab15265cc38710ce774a0609b530583b0987fe19deed
3
+ size 568082281
parser/model CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:371ca1381fc2478487abd07478b549eebbc3a2e149f3127ff07dde2ced4ace73
3
  size 315229
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9836695a15d7a9cae3cc7f7fad7d0eaf2ff8c1537d5a7a34dd0220a994720d1c
3
  size 315229
senter/model CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:cb9fbbd1012c9276d1e34185cfe49de343ff355dc23b95a9e1800f2b828d942e
3
  size 219953
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b101fb1ac92e494e87dc115f99d1cfd275d588776c05cb430feb94fd6be67aba
3
  size 219953
tagger/model CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:506d4e1c7eee81e758cef57ed23e996af393cc74b1ab0d5001f84798f7297dcb
3
  size 79201
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:78f9ab171de16a637d14af93709bea7e6d6025fa638114a7e46d045f83051481
3
  size 79201
tok2vec/model CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c3136d0e6227a5efb09ef5e5ad159e3d22a41af10f57aee3344d782973405ee0
3
- size 6365604
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3e44c937ab721fa448a4751a2a26c5c3ac5e8259a0de1a6889e51409ab638572
3
+ size 6495793
tokenizer CHANGED
The diff for this file is too large to render. See raw diff
vocab/strings.json CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:be0c25c54764ddfd5c4c89c2c416d5fa7e558bc4acd526b5aa730db3c0af2bb3
3
- size 10075413
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ec7c061f59546f3b4f7ab6847541ee7d67760de7473bdfe265846ed770ea3b9d
3
+ size 10076113