EC2 Default User committed on
Commit
de00f6d
1 Parent(s): 796dea5

Update spaCy pipeline

Browse files
README.md CHANGED
@@ -14,47 +14,41 @@ model-index:
14
  metrics:
15
  - name: NER Precision
16
  type: precision
17
- value: 0.898708838
18
  - name: NER Recall
19
  type: recall
20
- value: 0.8993389423
21
  - name: NER F Score
22
  type: f_score
23
- value: 0.8990237797
24
  - task:
25
- name: POS
26
  type: token-classification
27
  metrics:
28
- - name: POS Accuracy
29
  type: accuracy
30
- value: 0.9780627094
31
  - task:
32
- name: SENTER
33
  type: token-classification
34
  metrics:
35
- - name: SENTER Precision
36
- type: precision
37
- value: 0.9568827385
38
- - name: SENTER Recall
39
- type: recall
40
- value: 0.8666798601
41
- - name: SENTER F Score
42
  type: f_score
43
- value: 0.9095503479
44
  - task:
45
- name: UNLABELED_DEPENDENCIES
46
  type: token-classification
47
  metrics:
48
- - name: Unlabeled Dependencies Accuracy
49
- type: accuracy
50
- value: 0.9527056513
51
  - task:
52
- name: LABELED_DEPENDENCIES
53
  type: token-classification
54
  metrics:
55
- - name: Labeled Dependencies Accuracy
56
- type: accuracy
57
- value: 0.9527056513
58
  ---
59
  ### Details: https://spacy.io/models/en#en_core_web_trf
60
 
@@ -63,8 +57,8 @@ English transformer pipeline (roberta-base). Components: transformer, tagger, pa
63
  | Feature | Description |
64
  | --- | --- |
65
  | **Name** | `en_core_web_trf` |
66
- | **Version** | `3.2.0` |
67
- | **spaCy** | `>=3.2.0,<3.3.0` |
68
  | **Default Pipeline** | `transformer`, `tagger`, `parser`, `attribute_ruler`, `lemmatizer`, `ner` |
69
  | **Components** | `transformer`, `tagger`, `parser`, `attribute_ruler`, `lemmatizer`, `ner` |
70
  | **Vectors** | 0 keys, 0 unique vectors (0 dimensions) |
@@ -95,11 +89,11 @@ English transformer pipeline (roberta-base). Components: transformer, tagger, pa
95
  | `TOKEN_R` | 99.58 |
96
  | `TOKEN_F` | 99.57 |
97
  | `TAG_ACC` | 97.81 |
98
- | `SENTS_P` | 95.69 |
99
- | `SENTS_R` | 86.67 |
100
- | `SENTS_F` | 90.96 |
101
- | `DEP_UAS` | 95.27 |
102
- | `DEP_LAS` | 93.93 |
103
- | `ENTS_P` | 89.87 |
104
- | `ENTS_R` | 89.93 |
105
- | `ENTS_F` | 89.90 |
 
14
  metrics:
15
  - name: NER Precision
16
  type: precision
17
+ value: 0.9010175297
18
  - name: NER Recall
19
  type: recall
20
+ value: 0.8957832532
21
  - name: NER F Score
22
  type: f_score
23
+ value: 0.8983927675
24
  - task:
25
+ name: TAG
26
  type: token-classification
27
  metrics:
28
+ - name: TAG (XPOS) Accuracy
29
  type: accuracy
30
+ value: 0.9781090037
31
  - task:
32
+ name: UNLABELED_DEPENDENCIES
33
  type: token-classification
34
  metrics:
35
+ - name: Unlabeled Attachment Score (UAS)
 
 
 
 
 
 
36
  type: f_score
37
+ value: 0.9523761283
38
  - task:
39
+ name: LABELED_DEPENDENCIES
40
  type: token-classification
41
  metrics:
42
+ - name: Labeled Attachment Score (LAS)
43
+ type: f_score
44
+ value: 0.9391113934
45
  - task:
46
+ name: SENTS
47
  type: token-classification
48
  metrics:
49
+ - name: Sentences F-Score
50
+ type: f_score
51
+ value: 0.8975616543
52
  ---
53
  ### Details: https://spacy.io/models/en#en_core_web_trf
54
 
 
57
  | Feature | Description |
58
  | --- | --- |
59
  | **Name** | `en_core_web_trf` |
60
+ | **Version** | `3.3.0` |
61
+ | **spaCy** | `>=3.3.0.dev0,<3.4.0` |
62
  | **Default Pipeline** | `transformer`, `tagger`, `parser`, `attribute_ruler`, `lemmatizer`, `ner` |
63
  | **Components** | `transformer`, `tagger`, `parser`, `attribute_ruler`, `lemmatizer`, `ner` |
64
  | **Vectors** | 0 keys, 0 unique vectors (0 dimensions) |
 
89
  | `TOKEN_R` | 99.58 |
90
  | `TOKEN_F` | 99.57 |
91
  | `TAG_ACC` | 97.81 |
92
+ | `SENTS_P` | 94.94 |
93
+ | `SENTS_R` | 85.11 |
94
+ | `SENTS_F` | 89.76 |
95
+ | `DEP_UAS` | 95.24 |
96
+ | `DEP_LAS` | 93.91 |
97
+ | `ENTS_P` | 90.10 |
98
+ | `ENTS_R` | 89.58 |
99
+ | `ENTS_F` | 89.84 |
accuracy.json CHANGED
@@ -1,330 +1,330 @@
1
  {
2
- "token_acc": 0.9993053983,
3
- "token_p": 0.9956742163,
4
- "token_r": 0.9957505887,
5
- "token_f": 0.9957124011,
6
- "tag_acc": 0.9780627094,
7
- "sents_p": 0.9568827385,
8
- "sents_r": 0.8666798601,
9
- "sents_f": 0.9095503479,
10
- "dep_uas": 0.9527056513,
11
- "dep_las": 0.9393298266,
12
  "dep_las_per_type": {
13
  "prep": {
14
- "p": 0.9229604964,
15
- "r": 0.9255169797,
16
- "f": 0.9242369702
17
  },
18
  "det": {
19
- "p": 0.9898046572,
20
- "r": 0.9896028704,
21
- "f": 0.9897037535
22
  },
23
  "pobj": {
24
- "p": 0.9832869081,
25
- "r": 0.9842136265,
26
- "f": 0.9837500491
27
  },
28
  "nsubj": {
29
- "p": 0.9803139249,
30
- "r": 0.9795837897,
31
- "f": 0.9799487213
32
  },
33
  "aux": {
34
- "p": 0.989571263,
35
- "r": 0.9883379329,
36
- "f": 0.9889542134
37
  },
38
  "advmod": {
39
- "p": 0.8962161255,
40
- "r": 0.8987043581,
41
- "f": 0.8974585171
42
  },
43
  "relcl": {
44
- "p": 0.8798724309,
45
- "r": 0.9009433962,
46
- "f": 0.8902832556
47
  },
48
  "root": {
49
- "p": 0.9664043142,
50
- "r": 0.8747938518,
51
- "f": 0.9183200028
52
  },
53
  "xcomp": {
54
- "p": 0.9438444924,
55
- "r": 0.9411342426,
56
- "f": 0.9424874191
57
  },
58
  "amod": {
59
- "p": 0.9413514387,
60
- "r": 0.943181082,
61
- "f": 0.9422653722
62
  },
63
  "compound": {
64
- "p": 0.951964576,
65
- "r": 0.9458676765,
66
- "f": 0.9489063329
67
  },
68
  "poss": {
69
- "p": 0.986728333,
70
- "r": 0.9877214171,
71
- "f": 0.9872246253
72
  },
73
  "ccomp": {
74
- "p": 0.8604651163,
75
- "r": 0.9118126273,
76
- "f": 0.8853950361
77
  },
78
  "attr": {
79
- "p": 0.9478225144,
80
  "r": 0.9701429773,
81
- "f": 0.9588528678
82
  },
83
  "case": {
84
- "p": 0.9890547264,
85
- "r": 0.994994995,
86
- "f": 0.9920159681
87
  },
88
  "mark": {
89
- "p": 0.9492105263,
90
- "r": 0.9557498675,
91
- "f": 0.9524689728
92
  },
93
  "intj": {
94
- "p": 0.6237388724,
95
- "r": 0.76996337,
96
- "f": 0.6891803279
97
  },
98
  "advcl": {
99
- "p": 0.8195836546,
100
- "r": 0.803072274,
101
- "f": 0.8112439583
102
  },
103
  "cc": {
104
- "p": 0.8986197049,
105
- "r": 0.9032412391,
106
- "f": 0.9009245452
107
  },
108
  "neg": {
109
- "p": 0.9574148297,
110
- "r": 0.958855996,
111
- "f": 0.9581348709
112
  },
113
  "conj": {
114
- "p": 0.8712776177,
115
- "r": 0.9133937563,
116
- "f": 0.8918387414
117
  },
118
  "nsubjpass": {
119
- "p": 0.9616182573,
120
- "r": 0.9507692308,
121
- "f": 0.9561629706
122
  },
123
  "auxpass": {
124
- "p": 0.9676979072,
125
- "r": 0.9690205011,
126
- "f": 0.9683587526
127
  },
128
  "dobj": {
129
- "p": 0.9742177522,
130
- "r": 0.9725874572,
131
- "f": 0.9734019221
132
  },
133
  "nummod": {
134
- "p": 0.9582800102,
135
- "r": 0.9454545455,
136
- "f": 0.9518240753
137
  },
138
  "npadvmod": {
139
- "p": 0.8582474227,
140
- "r": 0.8280639432,
141
- "f": 0.8428855541
142
  },
143
  "prt": {
144
- "p": 0.896,
145
- "r": 0.9032258065,
146
- "f": 0.8995983936
147
  },
148
  "pcomp": {
149
- "p": 0.9316901408,
150
- "r": 0.9264705882,
151
- "f": 0.9290730337
152
  },
153
  "expl": {
154
- "p": 0.9893617021,
155
  "r": 0.9957173448,
156
- "f": 0.992529349
157
  },
158
  "acl": {
159
- "p": 0.8476138829,
160
- "r": 0.852700491,
161
- "f": 0.8501495785
162
  },
163
  "agent": {
164
- "p": 0.9559859155,
165
- "r": 0.9731182796,
166
- "f": 0.9644760213
167
  },
168
  "dative": {
169
- "p": 0.8236607143,
170
- "r": 0.8463302752,
171
- "f": 0.834841629
172
  },
173
  "acomp": {
174
- "p": 0.9352355072,
175
- "r": 0.9365079365,
176
- "f": 0.9358712894
177
  },
178
  "dep": {
179
- "p": 0.3949044586,
180
- "r": 0.4025974026,
181
- "f": 0.3987138264
182
  },
183
  "csubj": {
184
- "p": 0.8928571429,
185
- "r": 0.8875739645,
186
- "f": 0.8902077151
187
  },
188
  "quantmod": {
189
- "p": 0.8867449664,
190
- "r": 0.8586515028,
191
- "f": 0.872472142
192
  },
193
  "nmod": {
194
- "p": 0.82904795,
195
- "r": 0.7269957343,
196
- "f": 0.7746753247
197
  },
198
  "appos": {
199
- "p": 0.8099701747,
200
- "r": 0.8247288503,
201
- "f": 0.8172828891
202
  },
203
  "predet": {
204
- "p": 0.8508064516,
205
- "r": 0.9055793991,
206
- "f": 0.8773388773
207
  },
208
  "preconj": {
209
- "p": 0.7083333333,
210
- "r": 0.7906976744,
211
- "f": 0.7472527473
212
  },
213
  "oprd": {
214
- "p": 0.9022082019,
215
- "r": 0.8537313433,
216
- "f": 0.8773006135
217
  },
218
  "parataxis": {
219
- "p": 0.5602189781,
220
- "r": 0.6659436009,
221
- "f": 0.6085232904
222
  },
223
  "meta": {
224
- "p": 0.1683168317,
225
- "r": 0.6538461538,
226
- "f": 0.2677165354
227
  },
228
  "csubjpass": {
229
- "p": 0.8333333333,
230
  "r": 0.8333333333,
231
- "f": 0.8333333333
232
  }
233
  },
234
- "ents_p": 0.898708838,
235
- "ents_r": 0.8993389423,
236
- "ents_f": 0.8990237797,
237
  "ents_per_type": {
238
  "DATE": {
239
- "p": 0.8928683632,
240
- "r": 0.9022222222,
241
- "f": 0.8975209222
242
  },
243
  "GPE": {
244
- "p": 0.9575551783,
245
- "r": 0.9439330544,
246
- "f": 0.9506953224
247
  },
248
  "ORDINAL": {
249
- "p": 0.8079268293,
250
- "r": 0.8229813665,
251
- "f": 0.8153846154
252
  },
253
  "ORG": {
254
- "p": 0.9032515991,
255
- "r": 0.8984623542,
256
- "f": 0.9008506114
257
  },
258
  "FAC": {
259
- "p": 0.5567010309,
260
- "r": 0.8307692308,
261
- "f": 0.6666666667
262
  },
263
  "QUANTITY": {
264
- "p": 0.8187134503,
265
- "r": 0.7692307692,
266
- "f": 0.7932011331
267
  },
268
  "LOC": {
269
- "p": 0.8610169492,
270
- "r": 0.8089171975,
271
- "f": 0.8341543514
272
  },
273
  "CARDINAL": {
274
- "p": 0.8530092593,
275
- "r": 0.8763376932,
276
- "f": 0.864516129
277
  },
278
  "PERSON": {
279
- "p": 0.9436258808,
280
- "r": 0.9614882507,
281
- "f": 0.9524733269
282
  },
283
  "NORP": {
284
- "p": 0.9211783439,
285
- "r": 0.9256,
286
- "f": 0.9233838787
287
- },
288
- "LAW": {
289
- "p": 0.5324675325,
290
- "r": 0.640625,
291
- "f": 0.5815602837
292
  },
293
  "PRODUCT": {
294
- "p": 0.649122807,
295
- "r": 0.5260663507,
296
- "f": 0.5811518325
297
- },
298
- "MONEY": {
299
- "p": 0.9157641396,
300
- "r": 0.8984651712,
301
- "f": 0.9070321812
302
  },
303
  "TIME": {
304
- "p": 0.7514124294,
305
- "r": 0.7777777778,
306
- "f": 0.7643678161
307
  },
308
  "EVENT": {
309
- "p": 0.776119403,
310
- "r": 0.5977011494,
311
- "f": 0.6753246753
312
  },
313
  "WORK_OF_ART": {
314
- "p": 0.5684210526,
315
- "r": 0.5567010309,
316
- "f": 0.5625
 
 
 
 
 
 
 
 
 
 
317
  },
318
  "PERCENT": {
319
- "p": 0.9154929577,
320
- "r": 0.8958652374,
321
- "f": 0.9055727554
322
  },
323
  "LANGUAGE": {
324
- "p": 1.0,
325
- "r": 0.71875,
326
- "f": 0.8363636364
327
  }
328
  },
329
- "speed": 6163.7320781314
330
  }
 
1
  {
2
+ "token_acc": 0.9993092439,
3
+ "token_p": 0.9956819193,
4
+ "token_r": 0.9957659295,
5
+ "token_f": 0.9957239226,
6
+ "tag_acc": 0.9781090037,
7
+ "sents_p": 0.9493745401,
8
+ "sents_r": 0.8511115509,
9
+ "sents_f": 0.8975616543,
10
+ "dep_uas": 0.9523761283,
11
+ "dep_las": 0.9391113934,
12
  "dep_las_per_type": {
13
  "prep": {
14
+ "p": 0.9247690444,
15
+ "r": 0.926769114,
16
+ "f": 0.9257679989
17
  },
18
  "det": {
19
+ "p": 0.9905360202,
20
+ "r": 0.9900513741,
21
+ "f": 0.9902936378
22
  },
23
  "pobj": {
24
+ "p": 0.9833712448,
25
+ "r": 0.984645592,
26
+ "f": 0.9840080058
27
  },
28
  "nsubj": {
29
+ "p": 0.9803363405,
30
+ "r": 0.9807228916,
31
+ "f": 0.980529578
32
  },
33
  "aux": {
34
+ "p": 0.9889610968,
35
+ "r": 0.9889610968,
36
+ "f": 0.9889610968
37
  },
38
  "advmod": {
39
+ "p": 0.8984309094,
40
+ "r": 0.8960121151,
41
+ "f": 0.8972198821
42
  },
43
  "relcl": {
44
+ "p": 0.8840270366,
45
+ "r": 0.9016690856,
46
+ "f": 0.8927609125
47
  },
48
  "root": {
49
+ "p": 0.9666642137,
50
+ "r": 0.8665479253,
51
+ "f": 0.9138722694
52
  },
53
  "xcomp": {
54
+ "p": 0.943443804,
55
+ "r": 0.94005743,
56
+ "f": 0.9417475728
57
  },
58
  "amod": {
59
+ "p": 0.9405806452,
60
+ "r": 0.9445416262,
61
+ "f": 0.9425569743
62
  },
63
  "compound": {
64
+ "p": 0.9541804705,
65
+ "r": 0.9463689018,
66
+ "f": 0.9502586327
67
  },
68
  "poss": {
69
+ "p": 0.9857429719,
70
+ "r": 0.9881239936,
71
+ "f": 0.9869320466
72
  },
73
  "ccomp": {
74
+ "p": 0.8517110266,
75
+ "r": 0.9124236253,
76
+ "f": 0.8810226155
77
  },
78
  "attr": {
79
+ "p": 0.9533057851,
80
  "r": 0.9701429773,
81
+ "f": 0.9616506878
82
  },
83
  "case": {
84
+ "p": 0.988065639,
85
+ "r": 0.9944944945,
86
+ "f": 0.9912696433
87
  },
88
  "mark": {
89
+ "p": 0.9488054608,
90
+ "r": 0.9576046635,
91
+ "f": 0.9531847554
92
  },
93
  "intj": {
94
+ "p": 0.6185935638,
95
+ "r": 0.7604395604,
96
+ "f": 0.6822214919
97
  },
98
  "advcl": {
99
+ "p": 0.8142160636,
100
+ "r": 0.7990430622,
101
+ "f": 0.8065582105
102
  },
103
  "cc": {
104
+ "p": 0.8911596958,
105
+ "r": 0.8970218873,
106
+ "f": 0.8940811826
107
  },
108
  "neg": {
109
+ "p": 0.9585207396,
110
+ "r": 0.962368289,
111
+ "f": 0.960440661
112
  },
113
  "conj": {
114
+ "p": 0.8622285511,
115
+ "r": 0.914652568,
116
+ "f": 0.8876672164
117
  },
118
  "nsubjpass": {
119
+ "p": 0.9548717949,
120
+ "r": 0.9548717949,
121
+ "f": 0.9548717949
122
  },
123
  "auxpass": {
124
+ "p": 0.9656264134,
125
+ "r": 0.9726651481,
126
+ "f": 0.9691330005
127
  },
128
  "dobj": {
129
+ "p": 0.9753194888,
130
+ "r": 0.9730655829,
131
+ "f": 0.9741912322
132
  },
133
  "nummod": {
134
+ "p": 0.9523326572,
135
+ "r": 0.9484848485,
136
+ "f": 0.9504048583
137
  },
138
  "npadvmod": {
139
+ "p": 0.8493250638,
140
+ "r": 0.8269982238,
141
+ "f": 0.838012959
142
  },
143
  "prt": {
144
+ "p": 0.887434555,
145
+ "r": 0.9112903226,
146
+ "f": 0.899204244
147
  },
148
  "pcomp": {
149
+ "p": 0.9300353357,
150
+ "r": 0.9215686275,
151
+ "f": 0.925782624
152
  },
153
  "expl": {
154
+ "p": 0.9914712154,
155
  "r": 0.9957173448,
156
+ "f": 0.9935897436
157
  },
158
  "acl": {
159
+ "p": 0.8481561822,
160
+ "r": 0.8532460447,
161
+ "f": 0.8506935001
162
  },
163
  "agent": {
164
+ "p": 0.9544658494,
165
+ "r": 0.976702509,
166
+ "f": 0.9654561559
167
  },
168
  "dative": {
169
+ "p": 0.8351893096,
170
+ "r": 0.8600917431,
171
+ "f": 0.8474576271
172
  },
173
  "acomp": {
174
+ "p": 0.9416058394,
175
+ "r": 0.9360544218,
176
+ "f": 0.938821924
177
  },
178
  "dep": {
179
+ "p": 0.4133986928,
180
+ "r": 0.4107142857,
181
+ "f": 0.4120521173
182
  },
183
  "csubj": {
184
+ "p": 0.875,
185
+ "r": 0.9112426036,
186
+ "f": 0.8927536232
187
  },
188
  "quantmod": {
189
+ "p": 0.8812131424,
190
+ "r": 0.8497156783,
191
+ "f": 0.8651778329
192
  },
193
  "nmod": {
194
+ "p": 0.826026444,
195
+ "r": 0.7233394272,
196
+ "f": 0.771280052
197
  },
198
  "appos": {
199
+ "p": 0.8161953728,
200
+ "r": 0.8264642082,
201
+ "f": 0.8212976935
202
  },
203
  "predet": {
204
+ "p": 0.8606557377,
205
+ "r": 0.9012875536,
206
+ "f": 0.8805031447
207
  },
208
  "preconj": {
209
+ "p": 0.6818181818,
210
+ "r": 0.6976744186,
211
+ "f": 0.6896551724
212
  },
213
  "oprd": {
214
+ "p": 0.900621118,
215
+ "r": 0.8656716418,
216
+ "f": 0.8828006088
217
  },
218
  "parataxis": {
219
+ "p": 0.5811808118,
220
+ "r": 0.68329718,
221
+ "f": 0.628115653
222
  },
223
  "meta": {
224
+ "p": 0.1923076923,
225
+ "r": 0.5769230769,
226
+ "f": 0.2884615385
227
  },
228
  "csubjpass": {
229
+ "p": 0.7142857143,
230
  "r": 0.8333333333,
231
+ "f": 0.7692307692
232
  }
233
  },
234
+ "ents_p": 0.9010175297,
235
+ "ents_r": 0.8957832532,
236
+ "ents_f": 0.8983927675,
237
  "ents_per_type": {
238
  "DATE": {
239
+ "p": 0.8963878327,
240
+ "r": 0.8980952381,
241
+ "f": 0.8972407231
242
  },
243
  "GPE": {
244
+ "p": 0.9559197513,
245
+ "r": 0.9436541144,
246
+ "f": 0.949747333
247
  },
248
  "ORDINAL": {
249
+ "p": 0.8193146417,
250
+ "r": 0.8167701863,
251
+ "f": 0.8180404355
252
  },
253
  "ORG": {
254
+ "p": 0.9023156774,
255
+ "r": 0.8987274655,
256
+ "f": 0.9005179971
257
  },
258
  "FAC": {
259
+ "p": 0.5773809524,
260
+ "r": 0.7461538462,
261
+ "f": 0.6510067114
262
  },
263
  "QUANTITY": {
264
+ "p": 0.7333333333,
265
+ "r": 0.7252747253,
266
+ "f": 0.729281768
267
  },
268
  "LOC": {
269
+ "p": 0.84,
270
+ "r": 0.8025477707,
271
+ "f": 0.8208469055
272
  },
273
  "CARDINAL": {
274
+ "p": 0.8578227246,
275
+ "r": 0.8573127229,
276
+ "f": 0.8575676479
277
  },
278
  "PERSON": {
279
+ "p": 0.9433055734,
280
+ "r": 0.9611618799,
281
+ "f": 0.9521500162
282
  },
283
  "NORP": {
284
+ "p": 0.9350649351,
285
+ "r": 0.9216,
286
+ "f": 0.9282836422
 
 
 
 
 
287
  },
288
  "PRODUCT": {
289
+ "p": 0.7055214724,
290
+ "r": 0.5450236967,
291
+ "f": 0.614973262
 
 
 
 
 
292
  },
293
  "TIME": {
294
+ "p": 0.75,
295
+ "r": 0.7807017544,
296
+ "f": 0.7650429799
297
  },
298
  "EVENT": {
299
+ "p": 0.7744360902,
300
+ "r": 0.591954023,
301
+ "f": 0.671009772
302
  },
303
  "WORK_OF_ART": {
304
+ "p": 0.6022099448,
305
+ "r": 0.5618556701,
306
+ "f": 0.5813333333
307
+ },
308
+ "MONEY": {
309
+ "p": 0.9122596154,
310
+ "r": 0.8961038961,
311
+ "f": 0.904109589
312
+ },
313
+ "LAW": {
314
+ "p": 0.602739726,
315
+ "r": 0.6875,
316
+ "f": 0.6423357664
317
  },
318
  "PERCENT": {
319
+ "p": 0.9178515008,
320
+ "r": 0.8897396631,
321
+ "f": 0.9035769829
322
  },
323
  "LANGUAGE": {
324
+ "p": 0.96,
325
+ "r": 0.75,
326
+ "f": 0.8421052632
327
  }
328
  },
329
+ "speed": 4560.3818843877
330
  }
attribute_ruler/patterns CHANGED
Binary files a/attribute_ruler/patterns and b/attribute_ruler/patterns differ
 
config.cfg CHANGED
@@ -79,12 +79,14 @@ pooling = {"@layers":"reduce_mean.v1"}
79
 
80
  [components.tagger]
81
  factory = "tagger"
 
82
  overwrite = false
83
  scorer = {"@scorers":"spacy.tagger_scorer.v1"}
84
 
85
  [components.tagger.model]
86
- @architectures = "spacy.Tagger.v1"
87
  nO = null
 
88
 
89
  [components.tagger.model.tok2vec]
90
  @architectures = "spacy-transformers.TransformerListener.v1"
 
79
 
80
  [components.tagger]
81
  factory = "tagger"
82
+ neg_prefix = "!"
83
  overwrite = false
84
  scorer = {"@scorers":"spacy.tagger_scorer.v1"}
85
 
86
  [components.tagger.model]
87
+ @architectures = "spacy.Tagger.v2"
88
  nO = null
89
+ normalize = false
90
 
91
  [components.tagger.model.tok2vec]
92
  @architectures = "spacy-transformers.TransformerListener.v1"
en_core_web_trf-any-py3-none-any.whl CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c6be2ccfc1c30edb5690f5e2baecf2a0cabd23529c0abb84c67aedcf0dac86a2
3
- size 460235340
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1b9e9c25ad280745ec44927ae28542de703b9dde747edb7926d45aa46439ef5a
3
+ size 460264217
meta.json CHANGED
@@ -1,14 +1,14 @@
1
  {
2
  "lang":"en",
3
  "name":"core_web_trf",
4
- "version":"3.2.0",
5
  "description":"English transformer pipeline (roberta-base). Components: transformer, tagger, parser, ner, attribute_ruler, lemmatizer.",
6
  "author":"Explosion",
7
  "email":"contact@explosion.ai",
8
  "url":"https://explosion.ai",
9
  "license":"MIT",
10
- "spacy_version":">=3.2.0,<3.3.0",
11
- "spacy_git_version":"bb26550e2",
12
  "vectors":{
13
  "width":0,
14
  "vectors":0,
@@ -164,334 +164,334 @@
164
 
165
  ],
166
  "performance":{
167
- "token_acc":0.9993053983,
168
- "token_p":0.9956742163,
169
- "token_r":0.9957505887,
170
- "token_f":0.9957124011,
171
- "tag_acc":0.9780627094,
172
- "sents_p":0.9568827385,
173
- "sents_r":0.8666798601,
174
- "sents_f":0.9095503479,
175
- "dep_uas":0.9527056513,
176
- "dep_las":0.9393298266,
177
  "dep_las_per_type":{
178
  "prep":{
179
- "p":0.9229604964,
180
- "r":0.9255169797,
181
- "f":0.9242369702
182
  },
183
  "det":{
184
- "p":0.9898046572,
185
- "r":0.9896028704,
186
- "f":0.9897037535
187
  },
188
  "pobj":{
189
- "p":0.9832869081,
190
- "r":0.9842136265,
191
- "f":0.9837500491
192
  },
193
  "nsubj":{
194
- "p":0.9803139249,
195
- "r":0.9795837897,
196
- "f":0.9799487213
197
  },
198
  "aux":{
199
- "p":0.989571263,
200
- "r":0.9883379329,
201
- "f":0.9889542134
202
  },
203
  "advmod":{
204
- "p":0.8962161255,
205
- "r":0.8987043581,
206
- "f":0.8974585171
207
  },
208
  "relcl":{
209
- "p":0.8798724309,
210
- "r":0.9009433962,
211
- "f":0.8902832556
212
  },
213
  "root":{
214
- "p":0.9664043142,
215
- "r":0.8747938518,
216
- "f":0.9183200028
217
  },
218
  "xcomp":{
219
- "p":0.9438444924,
220
- "r":0.9411342426,
221
- "f":0.9424874191
222
  },
223
  "amod":{
224
- "p":0.9413514387,
225
- "r":0.943181082,
226
- "f":0.9422653722
227
  },
228
  "compound":{
229
- "p":0.951964576,
230
- "r":0.9458676765,
231
- "f":0.9489063329
232
  },
233
  "poss":{
234
- "p":0.986728333,
235
- "r":0.9877214171,
236
- "f":0.9872246253
237
  },
238
  "ccomp":{
239
- "p":0.8604651163,
240
- "r":0.9118126273,
241
- "f":0.8853950361
242
  },
243
  "attr":{
244
- "p":0.9478225144,
245
  "r":0.9701429773,
246
- "f":0.9588528678
247
  },
248
  "case":{
249
- "p":0.9890547264,
250
- "r":0.994994995,
251
- "f":0.9920159681
252
  },
253
  "mark":{
254
- "p":0.9492105263,
255
- "r":0.9557498675,
256
- "f":0.9524689728
257
  },
258
  "intj":{
259
- "p":0.6237388724,
260
- "r":0.76996337,
261
- "f":0.6891803279
262
  },
263
  "advcl":{
264
- "p":0.8195836546,
265
- "r":0.803072274,
266
- "f":0.8112439583
267
  },
268
  "cc":{
269
- "p":0.8986197049,
270
- "r":0.9032412391,
271
- "f":0.9009245452
272
  },
273
  "neg":{
274
- "p":0.9574148297,
275
- "r":0.958855996,
276
- "f":0.9581348709
277
  },
278
  "conj":{
279
- "p":0.8712776177,
280
- "r":0.9133937563,
281
- "f":0.8918387414
282
  },
283
  "nsubjpass":{
284
- "p":0.9616182573,
285
- "r":0.9507692308,
286
- "f":0.9561629706
287
  },
288
  "auxpass":{
289
- "p":0.9676979072,
290
- "r":0.9690205011,
291
- "f":0.9683587526
292
  },
293
  "dobj":{
294
- "p":0.9742177522,
295
- "r":0.9725874572,
296
- "f":0.9734019221
297
  },
298
  "nummod":{
299
- "p":0.9582800102,
300
- "r":0.9454545455,
301
- "f":0.9518240753
302
  },
303
  "npadvmod":{
304
- "p":0.8582474227,
305
- "r":0.8280639432,
306
- "f":0.8428855541
307
  },
308
  "prt":{
309
- "p":0.896,
310
- "r":0.9032258065,
311
- "f":0.8995983936
312
  },
313
  "pcomp":{
314
- "p":0.9316901408,
315
- "r":0.9264705882,
316
- "f":0.9290730337
317
  },
318
  "expl":{
319
- "p":0.9893617021,
320
  "r":0.9957173448,
321
- "f":0.992529349
322
  },
323
  "acl":{
324
- "p":0.8476138829,
325
- "r":0.852700491,
326
- "f":0.8501495785
327
  },
328
  "agent":{
329
- "p":0.9559859155,
330
- "r":0.9731182796,
331
- "f":0.9644760213
332
  },
333
  "dative":{
334
- "p":0.8236607143,
335
- "r":0.8463302752,
336
- "f":0.834841629
337
  },
338
  "acomp":{
339
- "p":0.9352355072,
340
- "r":0.9365079365,
341
- "f":0.9358712894
342
  },
343
  "dep":{
344
- "p":0.3949044586,
345
- "r":0.4025974026,
346
- "f":0.3987138264
347
  },
348
  "csubj":{
349
- "p":0.8928571429,
350
- "r":0.8875739645,
351
- "f":0.8902077151
352
  },
353
  "quantmod":{
354
- "p":0.8867449664,
355
- "r":0.8586515028,
356
- "f":0.872472142
357
  },
358
  "nmod":{
359
- "p":0.82904795,
360
- "r":0.7269957343,
361
- "f":0.7746753247
362
  },
363
  "appos":{
364
- "p":0.8099701747,
365
- "r":0.8247288503,
366
- "f":0.8172828891
367
  },
368
  "predet":{
369
- "p":0.8508064516,
370
- "r":0.9055793991,
371
- "f":0.8773388773
372
  },
373
  "preconj":{
374
- "p":0.7083333333,
375
- "r":0.7906976744,
376
- "f":0.7472527473
377
  },
378
  "oprd":{
379
- "p":0.9022082019,
380
- "r":0.8537313433,
381
- "f":0.8773006135
382
  },
383
  "parataxis":{
384
- "p":0.5602189781,
385
- "r":0.6659436009,
386
- "f":0.6085232904
387
  },
388
  "meta":{
389
- "p":0.1683168317,
390
- "r":0.6538461538,
391
- "f":0.2677165354
392
  },
393
  "csubjpass":{
394
- "p":0.8333333333,
395
  "r":0.8333333333,
396
- "f":0.8333333333
397
  }
398
  },
399
- "ents_p":0.898708838,
400
- "ents_r":0.8993389423,
401
- "ents_f":0.8990237797,
402
  "ents_per_type":{
403
  "DATE":{
404
- "p":0.8928683632,
405
- "r":0.9022222222,
406
- "f":0.8975209222
407
  },
408
  "GPE":{
409
- "p":0.9575551783,
410
- "r":0.9439330544,
411
- "f":0.9506953224
412
  },
413
  "ORDINAL":{
414
- "p":0.8079268293,
415
- "r":0.8229813665,
416
- "f":0.8153846154
417
  },
418
  "ORG":{
419
- "p":0.9032515991,
420
- "r":0.8984623542,
421
- "f":0.9008506114
422
  },
423
  "FAC":{
424
- "p":0.5567010309,
425
- "r":0.8307692308,
426
- "f":0.6666666667
427
  },
428
  "QUANTITY":{
429
- "p":0.8187134503,
430
- "r":0.7692307692,
431
- "f":0.7932011331
432
  },
433
  "LOC":{
434
- "p":0.8610169492,
435
- "r":0.8089171975,
436
- "f":0.8341543514
437
  },
438
  "CARDINAL":{
439
- "p":0.8530092593,
440
- "r":0.8763376932,
441
- "f":0.864516129
442
  },
443
  "PERSON":{
444
- "p":0.9436258808,
445
- "r":0.9614882507,
446
- "f":0.9524733269
447
  },
448
  "NORP":{
449
- "p":0.9211783439,
450
- "r":0.9256,
451
- "f":0.9233838787
452
- },
453
- "LAW":{
454
- "p":0.5324675325,
455
- "r":0.640625,
456
- "f":0.5815602837
457
  },
458
  "PRODUCT":{
459
- "p":0.649122807,
460
- "r":0.5260663507,
461
- "f":0.5811518325
462
- },
463
- "MONEY":{
464
- "p":0.9157641396,
465
- "r":0.8984651712,
466
- "f":0.9070321812
467
  },
468
  "TIME":{
469
- "p":0.7514124294,
470
- "r":0.7777777778,
471
- "f":0.7643678161
472
  },
473
  "EVENT":{
474
- "p":0.776119403,
475
- "r":0.5977011494,
476
- "f":0.6753246753
477
  },
478
  "WORK_OF_ART":{
479
- "p":0.5684210526,
480
- "r":0.5567010309,
481
- "f":0.5625
 
 
 
 
 
 
 
 
 
 
482
  },
483
  "PERCENT":{
484
- "p":0.9154929577,
485
- "r":0.8958652374,
486
- "f":0.9055727554
487
  },
488
  "LANGUAGE":{
489
- "p":1.0,
490
- "r":0.71875,
491
- "f":0.8363636364
492
  }
493
  },
494
- "speed":6163.7320781314
495
  },
496
  "sources":[
497
  {
 
1
  {
2
  "lang":"en",
3
  "name":"core_web_trf",
4
+ "version":"3.3.0",
5
  "description":"English transformer pipeline (roberta-base). Components: transformer, tagger, parser, ner, attribute_ruler, lemmatizer.",
6
  "author":"Explosion",
7
  "email":"contact@explosion.ai",
8
  "url":"https://explosion.ai",
9
  "license":"MIT",
10
+ "spacy_version":">=3.3.0.dev0,<3.4.0",
11
+ "spacy_git_version":"849bef2de",
12
  "vectors":{
13
  "width":0,
14
  "vectors":0,
 
164
 
165
  ],
166
  "performance":{
167
+ "token_acc":0.9993092439,
168
+ "token_p":0.9956819193,
169
+ "token_r":0.9957659295,
170
+ "token_f":0.9957239226,
171
+ "tag_acc":0.9781090037,
172
+ "sents_p":0.9493745401,
173
+ "sents_r":0.8511115509,
174
+ "sents_f":0.8975616543,
175
+ "dep_uas":0.9523761283,
176
+ "dep_las":0.9391113934,
177
  "dep_las_per_type":{
178
  "prep":{
179
+ "p":0.9247690444,
180
+ "r":0.926769114,
181
+ "f":0.9257679989
182
  },
183
  "det":{
184
+ "p":0.9905360202,
185
+ "r":0.9900513741,
186
+ "f":0.9902936378
187
  },
188
  "pobj":{
189
+ "p":0.9833712448,
190
+ "r":0.984645592,
191
+ "f":0.9840080058
192
  },
193
  "nsubj":{
194
+ "p":0.9803363405,
195
+ "r":0.9807228916,
196
+ "f":0.980529578
197
  },
198
  "aux":{
199
+ "p":0.9889610968,
200
+ "r":0.9889610968,
201
+ "f":0.9889610968
202
  },
203
  "advmod":{
204
+ "p":0.8984309094,
205
+ "r":0.8960121151,
206
+ "f":0.8972198821
207
  },
208
  "relcl":{
209
+ "p":0.8840270366,
210
+ "r":0.9016690856,
211
+ "f":0.8927609125
212
  },
213
  "root":{
214
+ "p":0.9666642137,
215
+ "r":0.8665479253,
216
+ "f":0.9138722694
217
  },
218
  "xcomp":{
219
+ "p":0.943443804,
220
+ "r":0.94005743,
221
+ "f":0.9417475728
222
  },
223
  "amod":{
224
+ "p":0.9405806452,
225
+ "r":0.9445416262,
226
+ "f":0.9425569743
227
  },
228
  "compound":{
229
+ "p":0.9541804705,
230
+ "r":0.9463689018,
231
+ "f":0.9502586327
232
  },
233
  "poss":{
234
+ "p":0.9857429719,
235
+ "r":0.9881239936,
236
+ "f":0.9869320466
237
  },
238
  "ccomp":{
239
+ "p":0.8517110266,
240
+ "r":0.9124236253,
241
+ "f":0.8810226155
242
  },
243
  "attr":{
244
+ "p":0.9533057851,
245
  "r":0.9701429773,
246
+ "f":0.9616506878
247
  },
248
  "case":{
249
+ "p":0.988065639,
250
+ "r":0.9944944945,
251
+ "f":0.9912696433
252
  },
253
  "mark":{
254
+ "p":0.9488054608,
255
+ "r":0.9576046635,
256
+ "f":0.9531847554
257
  },
258
  "intj":{
259
+ "p":0.6185935638,
260
+ "r":0.7604395604,
261
+ "f":0.6822214919
262
  },
263
  "advcl":{
264
+ "p":0.8142160636,
265
+ "r":0.7990430622,
266
+ "f":0.8065582105
267
  },
268
  "cc":{
269
+ "p":0.8911596958,
270
+ "r":0.8970218873,
271
+ "f":0.8940811826
272
  },
273
  "neg":{
274
+ "p":0.9585207396,
275
+ "r":0.962368289,
276
+ "f":0.960440661
277
  },
278
  "conj":{
279
+ "p":0.8622285511,
280
+ "r":0.914652568,
281
+ "f":0.8876672164
282
  },
283
  "nsubjpass":{
284
+ "p":0.9548717949,
285
+ "r":0.9548717949,
286
+ "f":0.9548717949
287
  },
288
  "auxpass":{
289
+ "p":0.9656264134,
290
+ "r":0.9726651481,
291
+ "f":0.9691330005
292
  },
293
  "dobj":{
294
+ "p":0.9753194888,
295
+ "r":0.9730655829,
296
+ "f":0.9741912322
297
  },
298
  "nummod":{
299
+ "p":0.9523326572,
300
+ "r":0.9484848485,
301
+ "f":0.9504048583
302
  },
303
  "npadvmod":{
304
+ "p":0.8493250638,
305
+ "r":0.8269982238,
306
+ "f":0.838012959
307
  },
308
  "prt":{
309
+ "p":0.887434555,
310
+ "r":0.9112903226,
311
+ "f":0.899204244
312
  },
313
  "pcomp":{
314
+ "p":0.9300353357,
315
+ "r":0.9215686275,
316
+ "f":0.925782624
317
  },
318
  "expl":{
319
+ "p":0.9914712154,
320
  "r":0.9957173448,
321
+ "f":0.9935897436
322
  },
323
  "acl":{
324
+ "p":0.8481561822,
325
+ "r":0.8532460447,
326
+ "f":0.8506935001
327
  },
328
  "agent":{
329
+ "p":0.9544658494,
330
+ "r":0.976702509,
331
+ "f":0.9654561559
332
  },
333
  "dative":{
334
+ "p":0.8351893096,
335
+ "r":0.8600917431,
336
+ "f":0.8474576271
337
  },
338
  "acomp":{
339
+ "p":0.9416058394,
340
+ "r":0.9360544218,
341
+ "f":0.938821924
342
  },
343
  "dep":{
344
+ "p":0.4133986928,
345
+ "r":0.4107142857,
346
+ "f":0.4120521173
347
  },
348
  "csubj":{
349
+ "p":0.875,
350
+ "r":0.9112426036,
351
+ "f":0.8927536232
352
  },
353
  "quantmod":{
354
+ "p":0.8812131424,
355
+ "r":0.8497156783,
356
+ "f":0.8651778329
357
  },
358
  "nmod":{
359
+ "p":0.826026444,
360
+ "r":0.7233394272,
361
+ "f":0.771280052
362
  },
363
  "appos":{
364
+ "p":0.8161953728,
365
+ "r":0.8264642082,
366
+ "f":0.8212976935
367
  },
368
  "predet":{
369
+ "p":0.8606557377,
370
+ "r":0.9012875536,
371
+ "f":0.8805031447
372
  },
373
  "preconj":{
374
+ "p":0.6818181818,
375
+ "r":0.6976744186,
376
+ "f":0.6896551724
377
  },
378
  "oprd":{
379
+ "p":0.900621118,
380
+ "r":0.8656716418,
381
+ "f":0.8828006088
382
  },
383
  "parataxis":{
384
+ "p":0.5811808118,
385
+ "r":0.68329718,
386
+ "f":0.628115653
387
  },
388
  "meta":{
389
+ "p":0.1923076923,
390
+ "r":0.5769230769,
391
+ "f":0.2884615385
392
  },
393
  "csubjpass":{
394
+ "p":0.7142857143,
395
  "r":0.8333333333,
396
+ "f":0.7692307692
397
  }
398
  },
399
+ "ents_p":0.9010175297,
400
+ "ents_r":0.8957832532,
401
+ "ents_f":0.8983927675,
402
  "ents_per_type":{
403
  "DATE":{
404
+ "p":0.8963878327,
405
+ "r":0.8980952381,
406
+ "f":0.8972407231
407
  },
408
  "GPE":{
409
+ "p":0.9559197513,
410
+ "r":0.9436541144,
411
+ "f":0.949747333
412
  },
413
  "ORDINAL":{
414
+ "p":0.8193146417,
415
+ "r":0.8167701863,
416
+ "f":0.8180404355
417
  },
418
  "ORG":{
419
+ "p":0.9023156774,
420
+ "r":0.8987274655,
421
+ "f":0.9005179971
422
  },
423
  "FAC":{
424
+ "p":0.5773809524,
425
+ "r":0.7461538462,
426
+ "f":0.6510067114
427
  },
428
  "QUANTITY":{
429
+ "p":0.7333333333,
430
+ "r":0.7252747253,
431
+ "f":0.729281768
432
  },
433
  "LOC":{
434
+ "p":0.84,
435
+ "r":0.8025477707,
436
+ "f":0.8208469055
437
  },
438
  "CARDINAL":{
439
+ "p":0.8578227246,
440
+ "r":0.8573127229,
441
+ "f":0.8575676479
442
  },
443
  "PERSON":{
444
+ "p":0.9433055734,
445
+ "r":0.9611618799,
446
+ "f":0.9521500162
447
  },
448
  "NORP":{
449
+ "p":0.9350649351,
450
+ "r":0.9216,
451
+ "f":0.9282836422
 
 
 
 
 
452
  },
453
  "PRODUCT":{
454
+ "p":0.7055214724,
455
+ "r":0.5450236967,
456
+ "f":0.614973262
 
 
 
 
 
457
  },
458
  "TIME":{
459
+ "p":0.75,
460
+ "r":0.7807017544,
461
+ "f":0.7650429799
462
  },
463
  "EVENT":{
464
+ "p":0.7744360902,
465
+ "r":0.591954023,
466
+ "f":0.671009772
467
  },
468
  "WORK_OF_ART":{
469
+ "p":0.6022099448,
470
+ "r":0.5618556701,
471
+ "f":0.5813333333
472
+ },
473
+ "MONEY":{
474
+ "p":0.9122596154,
475
+ "r":0.8961038961,
476
+ "f":0.904109589
477
+ },
478
+ "LAW":{
479
+ "p":0.602739726,
480
+ "r":0.6875,
481
+ "f":0.6423357664
482
  },
483
  "PERCENT":{
484
+ "p":0.9178515008,
485
+ "r":0.8897396631,
486
+ "f":0.9035769829
487
  },
488
  "LANGUAGE":{
489
+ "p":0.96,
490
+ "r":0.75,
491
+ "f":0.8421052632
492
  }
493
  },
494
+ "speed":4560.3818843877
495
  },
496
  "sources":[
497
  {
ner/model CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0528da41f0a5f7c271952e4e0971577d4087657bca5020c9fdd3156b59018159
3
  size 313773
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:54f1dee6cc18cf947f58399dd71dd1614fcb292dd8eedaa56e15ef5edd2c1f90
3
  size 313773
parser/model CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:70f5df71128c7ee60cef6a634570533edf331b2691f416a6f83af44a809c70c6
3
  size 639549
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:66bbb798aed08a965b1cfcc8227d44d23cecb6b981c72a6ab75a75cc9d0067ed
3
  size 639549
parser/moves CHANGED
@@ -1,2 +1,2 @@
1
  ��moves�
2
- {"0":{"":998775},"1":{"":991589},"2":{"det":172362,"nsubj":165533,"compound":116785,"amod":106476,"aux":87529,"punct":65947,"advmod":62668,"poss":36414,"mark":27883,"nummod":22585,"auxpass":15606,"prep":13980,"nsubjpass":13870,"neg":12358,"cc":10624,"nmod":9673,"advcl":9067,"npadvmod":8136,"intj":7304,"quantmod":7085,"ccomp":5903,"dep":4276,"dobj":3429,"expl":3360,"predet":1943,"parataxis":1820,"csubj":1431,"preconj":618,"pobj||prep":616,"attr":578,"meta":488,"advmod||conj":366,"dobj||xcomp":352,"acomp":286,"nsubj||ccomp":224,"dative":206,"advmod||xcomp":149,"dobj||ccomp":69,"csubjpass":64,"dobj||conj":62,"prep||conj":51,"acl":48,"prep||nsubj":41,"prep||dobj":36,"xcomp":34,"advmod||ccomp":32,"oprd":31},"3":{"punct":184785,"pobj":182420,"prep":173757,"dobj":89733,"conj":59725,"cc":51786,"ccomp":30428,"advmod":22774,"xcomp":21051,"relcl":20972,"advcl":19826,"attr":17749,"acomp":16726,"appos":14981,"case":13368,"acl":12100,"pcomp":10370,"npadvmod":9727,"prt":8176,"dative":3867,"agent":3850,"nsubj":3471,"intj":3278,"amod":2850,"neg":2843,"nummod":2503,"oprd":2307,"dep":1634,"parataxis":1258,"nmod":339,"quantmod":317,"acl||dobj":202,"prep||dobj":190,"prep||nsubj":162,"acl||nsubj":159,"appos||nsubj":145,"relcl||dobj":134,"relcl||nsubj":111,"aux":103,"expl":96,"meta":92,"appos||dobj":86,"preconj":71,"csubj":65,"prep||nsubjpass":55,"prep||advmod":54,"prep||acomp":53,"det":51,"nsubjpass":45,"acl||nsubjpass":42,"relcl||pobj":41,"mark":40,"auxpass":39,"prep||pobj":36,"relcl||nsubjpass":32,"appos||nsubjpass":32},"4":{"ROOT":110284}}�cfg��neg_key�
 
1
  ��moves�
2
+ {"0":{"":994267},"1":{"":990803},"2":{"det":172595,"nsubj":165748,"compound":116623,"amod":105184,"aux":86667,"punct":65478,"advmod":62763,"poss":36443,"mark":27941,"nummod":22598,"auxpass":15594,"prep":14001,"nsubjpass":13856,"neg":12357,"cc":10739,"nmod":9562,"advcl":9062,"npadvmod":8168,"quantmod":7101,"intj":6464,"ccomp":5896,"dobj":3427,"expl":3360,"dep":2806,"predet":1944,"parataxis":1837,"csubj":1428,"preconj":621,"pobj||prep":616,"attr":578,"meta":376,"advmod||conj":368,"dobj||xcomp":352,"acomp":284,"nsubj||ccomp":224,"dative":206,"advmod||xcomp":149,"dobj||ccomp":70,"csubjpass":64,"dobj||conj":62,"prep||conj":51,"acl":48,"prep||nsubj":41,"prep||dobj":36,"xcomp":34,"advmod||ccomp":32,"oprd":31},"3":{"punct":183790,"pobj":182191,"prep":174008,"dobj":89615,"conj":59687,"cc":51930,"ccomp":30385,"advmod":22861,"xcomp":21021,"relcl":20969,"advcl":19828,"attr":17741,"acomp":16922,"appos":15265,"case":13388,"acl":12085,"pcomp":10324,"npadvmod":9796,"prt":8179,"agent":3903,"dative":3866,"nsubj":3470,"neg":2906,"amod":2839,"intj":2819,"nummod":2732,"oprd":2301,"dep":1487,"parataxis":1261,"quantmod":319,"nmod":294,"acl||dobj":200,"prep||dobj":190,"prep||nsubj":162,"acl||nsubj":159,"appos||nsubj":145,"relcl||dobj":134,"relcl||nsubj":111,"aux":103,"expl":96,"meta":92,"appos||dobj":86,"preconj":71,"csubj":65,"prep||nsubjpass":55,"prep||advmod":54,"prep||acomp":53,"det":51,"nsubjpass":45,"relcl||pobj":42,"acl||nsubjpass":42,"mark":40,"auxpass":39,"prep||pobj":36,"relcl||nsubjpass":32,"appos||nsubjpass":31},"4":{"ROOT":111664}}�cfg��neg_key�
tagger/cfg CHANGED
@@ -50,5 +50,6 @@
50
  "XX",
51
  "``"
52
  ],
 
53
  "overwrite":false
54
  }
 
50
  "XX",
51
  "``"
52
  ],
53
+ "neg_prefix":"!",
54
  "overwrite":false
55
  }
tagger/model CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:649ca7fcf30736f2fc257e85e22748fa8be5f4bd16752271a9106df40ef11073
3
- size 151314
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bc134a18c25f9721bfa61b8e3ed78dcfaa6c3353d7fa94b8eac0f942d623e05d
3
+ size 151366
tokenizer CHANGED
The diff for this file is too large to render. See raw diff
 
transformer/model CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:523fefd9ecd5f2a76cb7f686222af0615942bc51d131339f5883a6190e7fdc72
3
- size 501274094
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9c4e258b9080d8e3962a0a294397935bf53f857211d5c8a1b9b68ac94cca22f8
3
+ size 502027765
vocab/strings.json CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f6fda43452971a53ac720650d08c74297656aec52627651521ce4fbceaabce87
3
- size 1091378
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:88ec87b408458d1bc7243553a79c4d969b3cdc825d129f388cb78fc2747aa581
3
+ size 1091428