adrianeboyd committed on
Commit
c70655e
•
1 Parent(s): e4a727e

Update spaCy pipeline

Browse files
README.md CHANGED
@@ -14,51 +14,51 @@ model-index:
14
  metrics:
15
  - name: NER Precision
16
  type: precision
17
- value: 0.7588215895
18
  - name: NER Recall
19
  type: recall
20
- value: 0.7585714286
21
  - name: NER F Score
22
  type: f_score
23
- value: 0.7586964884
24
  - task:
25
  name: TAG
26
  type: token-classification
27
  metrics:
28
  - name: TAG (XPOS) Accuracy
29
  type: accuracy
30
- value: 0.9248343224
31
  - task:
32
  name: UNLABELED_DEPENDENCIES
33
  type: token-classification
34
  metrics:
35
  - name: Unlabeled Attachment Score (UAS)
36
  type: f_score
37
- value: 0.7702832979
38
  - task:
39
  name: LABELED_DEPENDENCIES
40
  type: token-classification
41
  metrics:
42
  - name: Labeled Attachment Score (LAS)
43
  type: f_score
44
- value: 0.7326537539
45
  - task:
46
  name: SENTS
47
  type: token-classification
48
  metrics:
49
  - name: Sentences F-Score
50
  type: f_score
51
- value: 0.6942608696
52
  ---
53
  ### Details: https://spacy.io/models/zh#zh_core_web_trf
54
 
55
- Chinese transformer pipeline (bert-base-chinese). Components: transformer, tagger, parser, ner, attribute_ruler.
56
 
57
  | Feature | Description |
58
  | --- | --- |
59
  | **Name** | `zh_core_web_trf` |
60
- | **Version** | `3.6.1` |
61
- | **spaCy** | `>=3.6.0,<3.7.0` |
62
  | **Default Pipeline** | `transformer`, `tagger`, `parser`, `attribute_ruler`, `ner` |
63
  | **Components** | `transformer`, `tagger`, `parser`, `attribute_ruler`, `ner` |
64
  | **Vectors** | 0 keys, 0 unique vectors (0 dimensions) |
@@ -88,12 +88,12 @@ Chinese transformer pipeline (bert-base-chinese). Components: transformer, tagge
88
  | `TOKEN_P` | 94.58 |
89
  | `TOKEN_R` | 91.36 |
90
  | `TOKEN_F` | 92.94 |
91
- | `TAG_ACC` | 92.48 |
92
- | `SENTS_P` | 72.67 |
93
- | `SENTS_R` | 66.46 |
94
- | `SENTS_F` | 69.43 |
95
- | `DEP_UAS` | 77.03 |
96
- | `DEP_LAS` | 73.27 |
97
- | `ENTS_P` | 75.88 |
98
- | `ENTS_R` | 75.86 |
99
- | `ENTS_F` | 75.87 |
14
  metrics:
15
  - name: NER Precision
16
  type: precision
17
+ value: 0.7608897127
18
  - name: NER Recall
19
  type: recall
20
+ value: 0.7217582418
21
  - name: NER F Score
22
  type: f_score
23
+ value: 0.7408075795
24
  - task:
25
  name: TAG
26
  type: token-classification
27
  metrics:
28
  - name: TAG (XPOS) Accuracy
29
  type: accuracy
30
+ value: 0.9175332527
31
  - task:
32
  name: UNLABELED_DEPENDENCIES
33
  type: token-classification
34
  metrics:
35
  - name: Unlabeled Attachment Score (UAS)
36
  type: f_score
37
+ value: 0.7572203056
38
  - task:
39
  name: LABELED_DEPENDENCIES
40
  type: token-classification
41
  metrics:
42
  - name: Labeled Attachment Score (LAS)
43
  type: f_score
44
+ value: 0.7145288854
45
  - task:
46
  name: SENTS
47
  type: token-classification
48
  metrics:
49
  - name: Sentences F-Score
50
  type: f_score
51
+ value: 0.6920716113
52
  ---
53
  ### Details: https://spacy.io/models/zh#zh_core_web_trf
54
 
55
+ Chinese transformer pipeline (Transformer(name='bert-base-chinese', piece_encoder='bert-wordpiece', stride=152, type='bert', width=768, window=208, vocab_size=21128)). Components: transformer, tagger, parser, ner, attribute_ruler.
56
 
57
  | Feature | Description |
58
  | --- | --- |
59
  | **Name** | `zh_core_web_trf` |
60
+ | **Version** | `3.7.2` |
61
+ | **spaCy** | `>=3.7.0,<3.8.0` |
62
  | **Default Pipeline** | `transformer`, `tagger`, `parser`, `attribute_ruler`, `ner` |
63
  | **Components** | `transformer`, `tagger`, `parser`, `attribute_ruler`, `ner` |
64
  | **Vectors** | 0 keys, 0 unique vectors (0 dimensions) |
88
  | `TOKEN_P` | 94.58 |
89
  | `TOKEN_R` | 91.36 |
90
  | `TOKEN_F` | 92.94 |
91
+ | `TAG_ACC` | 91.75 |
92
+ | `SENTS_P` | 70.92 |
93
+ | `SENTS_R` | 67.57 |
94
+ | `SENTS_F` | 69.21 |
95
+ | `DEP_UAS` | 75.72 |
96
+ | `DEP_LAS` | 71.45 |
97
+ | `ENTS_P` | 76.09 |
98
+ | `ENTS_R` | 72.18 |
99
+ | `ENTS_F` | 74.08 |
accuracy.json CHANGED
@@ -3,212 +3,207 @@
3
  "token_p": 0.9458325855,
4
  "token_r": 0.9136060443,
5
  "token_f": 0.9294400505,
6
- "tag_acc": 0.9248343224,
7
- "sents_p": 0.7267431276,
8
- "sents_r": 0.6645580156,
9
- "sents_f": 0.6942608696,
10
- "dep_uas": 0.7702832979,
11
- "dep_las": 0.7326537539,
12
  "dep_las_per_type": {
13
  "dep": {
14
- "p": 0.5677689191,
15
- "r": 0.4389208851,
16
- "f": 0.4950991566
17
  },
18
  "case": {
19
- "p": 0.9181494662,
20
- "r": 0.8445683802,
21
- "f": 0.8798231765
22
  },
23
  "nmod:tmod": {
24
- "p": 0.8106995885,
25
- "r": 0.8040816327,
26
- "f": 0.8073770492
27
  },
28
  "nummod": {
29
- "p": 0.9027635619,
30
- "r": 0.5876082612,
31
- "f": 0.7118644068
32
  },
33
  "mark:clf": {
34
- "p": 0.9524691358,
35
- "r": 0.5755315181,
36
- "f": 0.7175075564
37
  },
38
  "auxpass": {
39
- "p": 0.9243243243,
40
  "r": 0.9243243243,
41
- "f": 0.9243243243
42
  },
43
  "nsubj": {
44
- "p": 0.8731413262,
45
- "r": 0.8006387422,
46
- "f": 0.8353197488
47
  },
48
  "acl": {
49
- "p": 0.815270936,
50
- "r": 0.7343316694,
51
- "f": 0.7726874818
52
  },
53
  "advmod": {
54
- "p": 0.8811971373,
55
- "r": 0.7676263886,
56
- "f": 0.8205003938
57
  },
58
  "mark": {
59
- "p": 0.8466637207,
60
- "r": 0.8396143734,
61
- "f": 0.8431243124
62
  },
63
  "xcomp": {
64
- "p": 0.8116760829,
65
- "r": 0.7019543974,
66
- "f": 0.7528384279
67
  },
68
  "nmod:assmod": {
69
- "p": 0.8690516369,
70
- "r": 0.8014316838,
71
- "f": 0.833873057
72
  },
73
  "det": {
74
- "p": 0.8931726908,
75
- "r": 0.6514352665,
76
- "f": 0.7533875339
77
  },
78
  "amod": {
79
- "p": 0.8383475528,
80
- "r": 0.7333071485,
81
- "f": 0.7823172009
82
  },
83
  "nmod:prep": {
84
- "p": 0.839443313,
85
- "r": 0.7480338778,
86
- "f": 0.7911068458
87
  },
88
  "root": {
89
- "p": 0.7950441798,
90
- "r": 0.6890294656,
91
- "f": 0.7382502453
92
  },
93
  "aux:prtmod": {
94
- "p": 0.9437751004,
95
- "r": 0.8392857143,
96
- "f": 0.8884688091
97
  },
98
  "compound:nn": {
99
- "p": 0.8118741059,
100
- "r": 0.7681895093,
101
- "f": 0.7894279256
102
  },
103
  "dobj": {
104
- "p": 0.9199408187,
105
- "r": 0.8289142349,
106
- "f": 0.8720585944
107
  },
108
  "ccomp": {
109
- "p": 0.7878282618,
110
- "r": 0.734836703,
111
- "f": 0.7604103802
112
  },
113
  "advmod:rcomp": {
114
- "p": 0.8501529052,
115
- "r": 0.7700831025,
116
- "f": 0.8081395349
117
  },
118
  "nmod:topic": {
119
- "p": 0.5123674912,
120
- "r": 0.4707792208,
121
- "f": 0.4906937394
122
  },
123
  "cop": {
124
- "p": 0.8493150685,
125
- "r": 0.6383526384,
126
- "f": 0.7288758266
127
  },
128
  "discourse": {
129
- "p": 0.6115044248,
130
- "r": 0.5701320132,
131
- "f": 0.5900939368
132
  },
133
  "neg": {
134
- "p": 0.8767334361,
135
- "r": 0.6765755054,
136
- "f": 0.7637583893
137
  },
138
  "aux:modal": {
139
- "p": 0.9025191676,
140
- "r": 0.8521199586,
141
- "f": 0.8765957447
142
  },
143
  "nmod": {
144
- "p": 0.8147612156,
145
- "r": 0.7639077341,
146
- "f": 0.7885154062
147
  },
148
  "aux:ba": {
149
- "p": 0.9222222222,
150
- "r": 0.8829787234,
151
- "f": 0.902173913
152
  },
153
  "advmod:loc": {
154
- "p": 0.8146718147,
155
- "r": 0.6261127596,
156
- "f": 0.7080536913
157
  },
158
  "aux:asp": {
159
- "p": 0.930153322,
160
- "r": 0.8708133971,
161
- "f": 0.8995057661
162
  },
163
  "conj": {
164
- "p": 0.6438065883,
165
- "r": 0.631758034,
166
- "f": 0.6377254079
167
  },
168
  "nsubjpass": {
169
- "p": 0.8913043478,
170
- "r": 0.82,
171
- "f": 0.8541666667
172
  },
173
  "compound:vc": {
174
- "p": 0.5483870968,
175
- "r": 0.6165803109,
176
- "f": 0.5804878049
177
  },
178
  "advcl:loc": {
179
- "p": 0.7307692308,
180
- "r": 0.6785714286,
181
- "f": 0.7037037037
182
  },
183
  "cc": {
184
- "p": 0.8328530259,
185
- "r": 0.769299024,
186
- "f": 0.7998154982
187
  },
188
  "advmod:dvp": {
189
- "p": 0.893129771,
190
  "r": 0.7267080745,
191
- "f": 0.801369863
192
- },
193
- "amod:ordmod": {
194
- "p": 0.6885245902,
195
- "r": 0.65625,
196
- "f": 0.672
197
  },
198
  "appos": {
199
- "p": 0.9581280788,
200
- "r": 0.8942528736,
201
- "f": 0.9250891795
202
  },
203
  "nmod:poss": {
204
- "p": 0.7807017544,
205
- "r": 0.6592592593,
206
- "f": 0.7148594378
207
  },
208
  "name": {
209
- "p": 0.6517857143,
210
- "r": 0.5407407407,
211
- "f": 0.5910931174
212
  },
213
  "nsubj:xsubj": {
214
  "p": 0.0,
@@ -216,14 +211,19 @@
216
  "f": 0.0
217
  },
218
  "nmod:range": {
219
- "p": 0.8301158301,
220
- "r": 0.7214765101,
221
- "f": 0.7719928187
222
  },
223
  "parataxis:prnmod": {
224
- "p": 0.3647058824,
225
- "r": 0.2330827068,
226
- "f": 0.2844036697
 
 
 
 
 
227
  },
228
  "erased": {
229
  "p": 0.0,
@@ -231,105 +231,105 @@
231
  "f": 0.0
232
  },
233
  "etc": {
234
- "p": 0.8965517241,
235
- "r": 0.9285714286,
236
- "f": 0.9122807018
237
  }
238
  },
239
- "ents_p": 0.7588215895,
240
- "ents_r": 0.7585714286,
241
- "ents_f": 0.7586964884,
242
  "ents_per_type": {
243
  "DATE": {
244
- "p": 0.7731568998,
245
- "r": 0.810703667,
246
- "f": 0.7914852443
247
  },
248
  "GPE": {
249
- "p": 0.7989154993,
250
- "r": 0.8641251222,
251
- "f": 0.8302418408
252
- },
253
- "CARDINAL": {
254
- "p": 0.649321267,
255
- "r": 0.5786290323,
256
- "f": 0.6119402985
257
  },
258
  "ORDINAL": {
259
- "p": 0.8622754491,
260
- "r": 0.7578947368,
261
- "f": 0.8067226891
262
  },
263
  "FAC": {
264
- "p": 0.4974358974,
265
- "r": 0.5215053763,
266
- "f": 0.5091863517
267
- },
268
- "ORG": {
269
- "p": 0.749235474,
270
- "r": 0.7458143075,
271
- "f": 0.7475209764
272
- },
273
- "NORP": {
274
- "p": 0.6605080831,
275
- "r": 0.6008403361,
276
- "f": 0.6292629263
277
  },
278
  "LOC": {
279
- "p": 0.6323987539,
280
- "r": 0.5456989247,
281
- "f": 0.5858585859
282
  },
283
  "QUANTITY": {
284
- "p": 0.7244094488,
285
- "r": 0.6814814815,
286
- "f": 0.7022900763
287
  },
288
- "TIME": {
289
- "p": 0.7627906977,
290
- "r": 0.7961165049,
291
- "f": 0.7790973872
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
292
  },
293
  "WORK_OF_ART": {
294
- "p": 0.4444444444,
295
- "r": 0.32,
296
- "f": 0.3720930233
 
 
 
 
 
297
  },
298
  "MONEY": {
299
- "p": 0.896,
300
  "r": 0.8296296296,
301
- "f": 0.8615384615
302
  },
303
  "EVENT": {
304
- "p": 0.6026490066,
305
- "r": 0.6691176471,
306
- "f": 0.6341463415
307
- },
308
- "PRODUCT": {
309
- "p": 0.4722222222,
310
- "r": 0.3469387755,
311
- "f": 0.4
312
- },
313
- "PERSON": {
314
- "p": 0.8785803238,
315
- "r": 0.9091494845,
316
- "f": 0.8936035465
317
  },
318
  "PERCENT": {
319
- "p": 0.7888888889,
320
- "r": 0.8554216867,
321
- "f": 0.8208092486
 
 
 
 
 
322
  },
323
  "LAW": {
324
- "p": 0.375,
325
- "r": 0.3,
326
- "f": 0.3333333333
327
  },
328
  "LANGUAGE": {
329
- "p": 0.75,
330
- "r": 1.0,
331
- "f": 0.8571428571
332
  }
333
  },
334
- "speed": 3083.8656241516
335
  }
3
  "token_p": 0.9458325855,
4
  "token_r": 0.9136060443,
5
  "token_f": 0.9294400505,
6
+ "tag_acc": 0.9175332527,
7
+ "sents_p": 0.7092434038,
8
+ "sents_r": 0.6757116697,
9
+ "sents_f": 0.6920716113,
10
+ "dep_uas": 0.7572203056,
11
+ "dep_las": 0.7145288854,
12
  "dep_las_per_type": {
13
  "dep": {
14
+ "p": 0.5542676502,
15
+ "r": 0.4251793473,
16
+ "f": 0.4812167648
17
  },
18
  "case": {
19
+ "p": 0.9020435069,
20
+ "r": 0.8295344326,
21
+ "f": 0.8642708268
22
  },
23
  "nmod:tmod": {
24
+ "p": 0.7832446809,
25
+ "r": 0.8013605442,
26
+ "f": 0.7921990585
27
  },
28
  "nummod": {
29
+ "p": 0.8815789474,
30
+ "r": 0.5802798135,
31
+ "f": 0.6998794697
32
  },
33
  "mark:clf": {
34
+ "p": 0.9339393939,
35
+ "r": 0.5747855278,
36
+ "f": 0.711613946
37
  },
38
  "auxpass": {
39
+ "p": 0.9095744681,
40
  "r": 0.9243243243,
41
+ "f": 0.9168900804
42
  },
43
  "nsubj": {
44
+ "p": 0.8642424242,
45
+ "r": 0.7882324039,
46
+ "f": 0.8244892715
47
  },
48
  "acl": {
49
+ "p": 0.7845096814,
50
+ "r": 0.6966167499,
51
+ "f": 0.7379553467
52
  },
53
  "advmod": {
54
+ "p": 0.868605557,
55
+ "r": 0.7583314441,
56
+ "f": 0.8097312999
57
  },
58
  "mark": {
59
+ "p": 0.8348993289,
60
+ "r": 0.8177037686,
61
+ "f": 0.8262120877
62
  },
63
  "xcomp": {
64
+ "p": 0.8014981273,
65
+ "r": 0.6970684039,
66
+ "f": 0.7456445993
67
  },
68
  "nmod:assmod": {
69
+ "p": 0.8492146597,
70
+ "r": 0.7572362278,
71
+ "f": 0.8005923001
72
  },
73
  "det": {
74
+ "p": 0.8788617886,
75
+ "r": 0.633274751,
76
+ "f": 0.7361252979
77
  },
78
  "amod": {
79
+ "p": 0.8216442174,
80
+ "r": 0.6948153967,
81
+ "f": 0.7529261545
82
  },
83
  "nmod:prep": {
84
+ "p": 0.8173109819,
85
+ "r": 0.7226255293,
86
+ "f": 0.7670573126
87
  },
88
  "root": {
89
+ "p": 0.7621591746,
90
+ "r": 0.6886965207,
91
+ "f": 0.723567993
92
  },
93
  "aux:prtmod": {
94
+ "p": 0.9551020408,
95
+ "r": 0.8357142857,
96
+ "f": 0.8914285714
97
  },
98
  "compound:nn": {
99
+ "p": 0.7833185448,
100
+ "r": 0.7468697124,
101
+ "f": 0.764660026
102
  },
103
  "dobj": {
104
+ "p": 0.8932703275,
105
+ "r": 0.8120278477,
106
+ "f": 0.8507138423
107
  },
108
  "ccomp": {
109
+ "p": 0.7626977519,
110
+ "r": 0.7122861586,
111
+ "f": 0.7366304785
112
  },
113
  "advmod:rcomp": {
114
+ "p": 0.8369230769,
115
+ "r": 0.7534626039,
116
+ "f": 0.7930029155
117
  },
118
  "nmod:topic": {
119
+ "p": 0.4624505929,
120
+ "r": 0.3798701299,
121
+ "f": 0.4171122995
122
  },
123
  "cop": {
124
+ "p": 0.8350515464,
125
+ "r": 0.6254826255,
126
+ "f": 0.7152317881
127
  },
128
  "discourse": {
129
+ "p": 0.5836267606,
130
+ "r": 0.547029703,
131
+ "f": 0.5647359455
132
  },
133
  "neg": {
134
+ "p": 0.8730650155,
135
+ "r": 0.6706302021,
136
+ "f": 0.7585743107
137
  },
138
  "aux:modal": {
139
+ "p": 0.8915401302,
140
+ "r": 0.8500517063,
141
+ "f": 0.870301747
142
  },
143
  "nmod": {
144
+ "p": 0.7740524781,
145
+ "r": 0.7204884668,
146
+ "f": 0.7463106114
147
  },
148
  "aux:ba": {
149
+ "p": 0.9106145251,
150
+ "r": 0.8670212766,
151
+ "f": 0.8882833787
152
  },
153
  "advmod:loc": {
154
+ "p": 0.7519379845,
155
+ "r": 0.5756676558,
156
+ "f": 0.6521008403
157
  },
158
  "aux:asp": {
159
+ "p": 0.9163179916,
160
+ "r": 0.8732057416,
161
+ "f": 0.894242548
162
  },
163
  "conj": {
164
+ "p": 0.6111647672,
165
+ "r": 0.5981096408,
166
+ "f": 0.6045667335
167
  },
168
  "nsubjpass": {
169
+ "p": 0.9,
170
+ "r": 0.72,
171
+ "f": 0.8
172
  },
173
  "compound:vc": {
174
+ "p": 0.4628820961,
175
+ "r": 0.5492227979,
176
+ "f": 0.5023696682
177
  },
178
  "advcl:loc": {
179
+ "p": 0.6488549618,
180
+ "r": 0.6071428571,
181
+ "f": 0.6273062731
182
  },
183
  "cc": {
184
+ "p": 0.7943396226,
185
+ "r": 0.7471162378,
186
+ "f": 0.7700045725
187
  },
188
  "advmod:dvp": {
189
+ "p": 0.9212598425,
190
  "r": 0.7267080745,
191
+ "f": 0.8125
 
 
 
 
 
192
  },
193
  "appos": {
194
+ "p": 0.9382716049,
195
+ "r": 0.8735632184,
196
+ "f": 0.9047619048
197
  },
198
  "nmod:poss": {
199
+ "p": 0.7280701754,
200
+ "r": 0.6148148148,
201
+ "f": 0.6666666667
202
  },
203
  "name": {
204
+ "p": 0.6261682243,
205
+ "r": 0.4962962963,
206
+ "f": 0.5537190083
207
  },
208
  "nsubj:xsubj": {
209
  "p": 0.0,
211
  "f": 0.0
212
  },
213
  "nmod:range": {
214
+ "p": 0.8098859316,
215
+ "r": 0.7147651007,
216
+ "f": 0.7593582888
217
  },
218
  "parataxis:prnmod": {
219
+ "p": 0.3442622951,
220
+ "r": 0.1578947368,
221
+ "f": 0.2164948454
222
+ },
223
+ "amod:ordmod": {
224
+ "p": 0.7547169811,
225
+ "r": 0.625,
226
+ "f": 0.6837606838
227
  },
228
  "erased": {
229
  "p": 0.0,
231
  "f": 0.0
232
  },
233
  "etc": {
234
+ "p": 0.9277108434,
235
+ "r": 0.9166666667,
236
+ "f": 0.9221556886
237
  }
238
  },
239
+ "ents_p": 0.7608897127,
240
+ "ents_r": 0.7217582418,
241
+ "ents_f": 0.7408075795,
242
  "ents_per_type": {
243
  "DATE": {
244
+ "p": 0.7811607992,
245
+ "r": 0.8136769078,
246
+ "f": 0.7970873786
247
  },
248
  "GPE": {
249
+ "p": 0.8325837081,
250
+ "r": 0.8142717498,
251
+ "f": 0.8233259204
 
 
 
 
 
252
  },
253
  "ORDINAL": {
254
+ "p": 0.8488372093,
255
+ "r": 0.7684210526,
256
+ "f": 0.8066298343
257
  },
258
  "FAC": {
259
+ "p": 0.3906976744,
260
+ "r": 0.4516129032,
261
+ "f": 0.4189526185
 
 
 
 
 
 
 
 
 
 
262
  },
263
  "LOC": {
264
+ "p": 0.5012406948,
265
+ "r": 0.5430107527,
266
+ "f": 0.5212903226
267
  },
268
  "QUANTITY": {
269
+ "p": 0.696,
270
+ "r": 0.6444444444,
271
+ "f": 0.6692307692
272
  },
273
+ "ORG": {
274
+ "p": 0.7461476075,
275
+ "r": 0.700152207,
276
+ "f": 0.7224185316
277
+ },
278
+ "PERSON": {
279
+ "p": 0.8739386022,
280
+ "r": 0.8621134021,
281
+ "f": 0.8679857282
282
+ },
283
+ "CARDINAL": {
284
+ "p": 0.6729088639,
285
+ "r": 0.5433467742,
286
+ "f": 0.6012269939
287
+ },
288
+ "NORP": {
289
+ "p": 0.6961038961,
290
+ "r": 0.5630252101,
291
+ "f": 0.6225319396
292
  },
293
  "WORK_OF_ART": {
294
+ "p": 0.5625,
295
+ "r": 0.3,
296
+ "f": 0.3913043478
297
+ },
298
+ "TIME": {
299
+ "p": 0.7875647668,
300
+ "r": 0.7378640777,
301
+ "f": 0.7619047619
302
  },
303
  "MONEY": {
304
+ "p": 0.9256198347,
305
  "r": 0.8296296296,
306
+ "f": 0.875
307
  },
308
  "EVENT": {
309
+ "p": 0.5430463576,
310
+ "r": 0.6029411765,
311
+ "f": 0.5714285714
 
 
 
 
 
 
 
 
 
 
312
  },
313
  "PERCENT": {
314
+ "p": 0.869047619,
315
+ "r": 0.8795180723,
316
+ "f": 0.874251497
317
+ },
318
+ "PRODUCT": {
319
+ "p": 0.3793103448,
320
+ "r": 0.2244897959,
321
+ "f": 0.2820512821
322
  },
323
  "LAW": {
324
+ "p": 0.3571428571,
325
+ "r": 0.25,
326
+ "f": 0.2941176471
327
  },
328
  "LANGUAGE": {
329
+ "p": 0.4666666667,
330
+ "r": 0.7777777778,
331
+ "f": 0.5833333333
332
  }
333
  },
334
+ "speed": 2677.6055974261
335
  }
config.cfg CHANGED
@@ -16,6 +16,7 @@ before_creation = null
16
  after_creation = null
17
  after_pipeline_creation = null
18
  batch_size = 64
 
19
 
20
  [nlp.tokenizer]
21
  @tokenizers = "spacy.zh.ChineseTokenizer"
@@ -45,10 +46,11 @@ use_upper = false
45
  nO = null
46
 
47
  [components.ner.model.tok2vec]
48
- @architectures = "spacy-transformers.TransformerListener.v1"
49
- grad_factor = 1.0
50
  upstream = "transformer"
51
  pooling = {"@layers":"reduce_mean.v1"}
 
52
 
53
  [components.parser]
54
  factory = "parser"
@@ -68,10 +70,11 @@ use_upper = false
68
  nO = null
69
 
70
  [components.parser.model.tok2vec]
71
- @architectures = "spacy-transformers.TransformerListener.v1"
72
- grad_factor = 1.0
73
  upstream = "transformer"
74
  pooling = {"@layers":"reduce_mean.v1"}
 
75
 
76
  [components.tagger]
77
  factory = "tagger"
@@ -86,32 +89,44 @@ nO = null
86
  normalize = false
87
 
88
  [components.tagger.model.tok2vec]
89
- @architectures = "spacy-transformers.TransformerListener.v1"
90
- grad_factor = 1.0
91
  upstream = "transformer"
92
  pooling = {"@layers":"reduce_mean.v1"}
 
93
 
94
  [components.transformer]
95
- factory = "transformer"
96
- max_batch_items = 4096
97
- set_extra_annotations = {"@annotation_setters":"spacy-transformers.null_annotation_setter.v1"}
98
 
99
  [components.transformer.model]
100
- name = "bert-base-chinese"
101
- @architectures = "spacy-transformers.TransformerModel.v3"
 
 
 
 
 
 
 
 
 
 
 
 
 
 
102
  mixed_precision = false
103
-
104
- [components.transformer.model.get_spans]
105
- @span_getters = "spacy-transformers.strided_spans.v1"
106
- window = 128
107
- stride = 96
108
 
109
  [components.transformer.model.grad_scaler_config]
110
 
111
- [components.transformer.model.tokenizer_config]
112
- use_fast = true
113
-
114
- [components.transformer.model.transformer_config]
 
115
 
116
  [corpora]
117
 
@@ -148,11 +163,11 @@ annotating_components = []
148
  before_update = null
149
 
150
  [training.batcher]
151
- @batchers = "spacy.batch_by_padded.v1"
152
- discard_oversize = true
153
- get_length = null
154
  size = 2000
155
- buffer = 256
 
156
 
157
  [training.logger]
158
  @loggers = "spacy.ConsoleLogger.v1"
@@ -220,6 +235,18 @@ require = false
220
  path = "corpus/labels/tagger.json"
221
  require = false
222
 
 
 
 
 
 
 
 
 
 
 
 
 
223
  [initialize.lookups]
224
  @misc = "spacy.LookupsDataLoader.v1"
225
  lang = ${nlp.lang}
16
  after_creation = null
17
  after_pipeline_creation = null
18
  batch_size = 64
19
+ vectors = {"@vectors":"spacy.Vectors.v1"}
20
 
21
  [nlp.tokenizer]
22
  @tokenizers = "spacy.zh.ChineseTokenizer"
46
  nO = null
47
 
48
  [components.ner.model.tok2vec]
49
+ @architectures = "spacy-curated-transformers.LastTransformerLayerListener.v1"
50
+ width = ${components.transformer.model.hidden_width}
51
  upstream = "transformer"
52
  pooling = {"@layers":"reduce_mean.v1"}
53
+ grad_factor = 1.0
54
 
55
  [components.parser]
56
  factory = "parser"
70
  nO = null
71
 
72
  [components.parser.model.tok2vec]
73
+ @architectures = "spacy-curated-transformers.LastTransformerLayerListener.v1"
74
+ width = ${components.transformer.model.hidden_width}
75
  upstream = "transformer"
76
  pooling = {"@layers":"reduce_mean.v1"}
77
+ grad_factor = 1.0
78
 
79
  [components.tagger]
80
  factory = "tagger"
89
  normalize = false
90
 
91
  [components.tagger.model.tok2vec]
92
+ @architectures = "spacy-curated-transformers.LastTransformerLayerListener.v1"
93
+ width = ${components.transformer.model.hidden_width}
94
  upstream = "transformer"
95
  pooling = {"@layers":"reduce_mean.v1"}
96
+ grad_factor = 1.0
97
 
98
  [components.transformer]
99
+ factory = "curated_transformer"
100
+ all_layer_outputs = false
101
+ frozen = false
102
 
103
  [components.transformer.model]
104
+ @architectures = "spacy-curated-transformers.BertTransformer.v1"
105
+ vocab_size = 21128
106
+ hidden_width = 768
107
+ piece_encoder = {"@architectures":"spacy-curated-transformers.BertWordpieceEncoder.v1"}
108
+ attention_probs_dropout_prob = 0.1
109
+ hidden_act = "gelu"
110
+ hidden_dropout_prob = 0.1
111
+ intermediate_width = 3072
112
+ layer_norm_eps = 0.0
113
+ max_position_embeddings = 512
114
+ model_max_length = 512
115
+ num_attention_heads = 12
116
+ num_hidden_layers = 12
117
+ padding_idx = 0
118
+ type_vocab_size = 2
119
+ torchscript = false
120
  mixed_precision = false
121
+ wrapped_listener = null
 
 
 
 
122
 
123
  [components.transformer.model.grad_scaler_config]
124
 
125
+ [components.transformer.model.with_spans]
126
+ @architectures = "spacy-curated-transformers.WithStridedSpans.v1"
127
+ stride = 152
128
+ window = 208
129
+ batch_size = 384
130
 
131
  [corpora]
132
 
163
  before_update = null
164
 
165
  [training.batcher]
166
+ @batchers = "spacy.batch_by_words.v1"
167
+ discard_oversize = false
 
168
  size = 2000
169
+ tolerance = 0.2
170
+ get_length = null
171
 
172
  [training.logger]
173
  @loggers = "spacy.ConsoleLogger.v1"
235
  path = "corpus/labels/tagger.json"
236
  require = false
237
 
238
+ [initialize.components.transformer]
239
+
240
+ [initialize.components.transformer.encoder_loader]
241
+ @model_loaders = "spacy-curated-transformers.HFTransformerEncoderLoader.v1"
242
+ name = "bert-base-chinese"
243
+ revision = "main"
244
+
245
+ [initialize.components.transformer.piecer_loader]
246
+ @model_loaders = "spacy-curated-transformers.HFPieceEncoderLoader.v1"
247
+ name = "bert-base-chinese"
248
+ revision = "main"
249
+
250
  [initialize.lookups]
251
  @misc = "spacy.LookupsDataLoader.v1"
252
  lang = ${nlp.lang}
meta.json CHANGED
@@ -1,14 +1,14 @@
1
  {
2
  "lang":"zh",
3
  "name":"core_web_trf",
4
- "version":"3.6.1",
5
- "description":"Chinese transformer pipeline (bert-base-chinese). Components: transformer, tagger, parser, ner, attribute_ruler.",
6
  "author":"Explosion",
7
  "email":"contact@explosion.ai",
8
  "url":"https://explosion.ai",
9
  "license":"MIT",
10
- "spacy_version":">=3.6.0,<3.7.0",
11
- "spacy_git_version":"c067b5264",
12
  "vectors":{
13
  "width":0,
14
  "vectors":0,
@@ -150,212 +150,207 @@
150
  "token_p":0.9458325855,
151
  "token_r":0.9136060443,
152
  "token_f":0.9294400505,
153
- "tag_acc":0.9248343224,
154
- "sents_p":0.7267431276,
155
- "sents_r":0.6645580156,
156
- "sents_f":0.6942608696,
157
- "dep_uas":0.7702832979,
158
- "dep_las":0.7326537539,
159
  "dep_las_per_type":{
160
  "dep":{
161
- "p":0.5677689191,
162
- "r":0.4389208851,
163
- "f":0.4950991566
164
  },
165
  "case":{
166
- "p":0.9181494662,
167
- "r":0.8445683802,
168
- "f":0.8798231765
169
  },
170
  "nmod:tmod":{
171
- "p":0.8106995885,
172
- "r":0.8040816327,
173
- "f":0.8073770492
174
  },
175
  "nummod":{
176
- "p":0.9027635619,
177
- "r":0.5876082612,
178
- "f":0.7118644068
179
  },
180
  "mark:clf":{
181
- "p":0.9524691358,
182
- "r":0.5755315181,
183
- "f":0.7175075564
184
  },
185
  "auxpass":{
186
- "p":0.9243243243,
187
  "r":0.9243243243,
188
- "f":0.9243243243
189
  },
190
  "nsubj":{
191
- "p":0.8731413262,
192
- "r":0.8006387422,
193
- "f":0.8353197488
194
  },
195
  "acl":{
196
- "p":0.815270936,
197
- "r":0.7343316694,
198
- "f":0.7726874818
199
  },
200
  "advmod":{
201
- "p":0.8811971373,
202
- "r":0.7676263886,
203
- "f":0.8205003938
204
  },
205
  "mark":{
206
- "p":0.8466637207,
207
- "r":0.8396143734,
208
- "f":0.8431243124
209
  },
210
  "xcomp":{
211
- "p":0.8116760829,
212
- "r":0.7019543974,
213
- "f":0.7528384279
214
  },
215
  "nmod:assmod":{
216
- "p":0.8690516369,
217
- "r":0.8014316838,
218
- "f":0.833873057
219
  },
220
  "det":{
221
- "p":0.8931726908,
222
- "r":0.6514352665,
223
- "f":0.7533875339
224
  },
225
  "amod":{
226
- "p":0.8383475528,
227
- "r":0.7333071485,
228
- "f":0.7823172009
229
  },
230
  "nmod:prep":{
231
- "p":0.839443313,
232
- "r":0.7480338778,
233
- "f":0.7911068458
234
  },
235
  "root":{
236
- "p":0.7950441798,
237
- "r":0.6890294656,
238
- "f":0.7382502453
239
  },
240
  "aux:prtmod":{
241
- "p":0.9437751004,
242
- "r":0.8392857143,
243
- "f":0.8884688091
244
  },
245
  "compound:nn":{
246
- "p":0.8118741059,
247
- "r":0.7681895093,
248
- "f":0.7894279256
249
  },
250
  "dobj":{
251
- "p":0.9199408187,
252
- "r":0.8289142349,
253
- "f":0.8720585944
254
  },
255
  "ccomp":{
256
- "p":0.7878282618,
257
- "r":0.734836703,
258
- "f":0.7604103802
259
  },
260
  "advmod:rcomp":{
261
- "p":0.8501529052,
262
- "r":0.7700831025,
263
- "f":0.8081395349
264
  },
265
  "nmod:topic":{
266
- "p":0.5123674912,
267
- "r":0.4707792208,
268
- "f":0.4906937394
269
  },
270
  "cop":{
271
- "p":0.8493150685,
272
- "r":0.6383526384,
273
- "f":0.7288758266
274
  },
275
  "discourse":{
276
- "p":0.6115044248,
277
- "r":0.5701320132,
278
- "f":0.5900939368
279
  },
280
  "neg":{
281
- "p":0.8767334361,
282
- "r":0.6765755054,
283
- "f":0.7637583893
284
  },
285
  "aux:modal":{
286
- "p":0.9025191676,
287
- "r":0.8521199586,
288
- "f":0.8765957447
289
  },
290
  "nmod":{
291
- "p":0.8147612156,
292
- "r":0.7639077341,
293
- "f":0.7885154062
294
  },
295
  "aux:ba":{
296
- "p":0.9222222222,
297
- "r":0.8829787234,
298
- "f":0.902173913
299
  },
300
  "advmod:loc":{
301
- "p":0.8146718147,
302
- "r":0.6261127596,
303
- "f":0.7080536913
304
  },
305
  "aux:asp":{
306
- "p":0.930153322,
307
- "r":0.8708133971,
308
- "f":0.8995057661
309
  },
310
  "conj":{
311
- "p":0.6438065883,
312
- "r":0.631758034,
313
- "f":0.6377254079
314
  },
315
  "nsubjpass":{
316
- "p":0.8913043478,
317
- "r":0.82,
318
- "f":0.8541666667
319
  },
320
  "compound:vc":{
321
- "p":0.5483870968,
322
- "r":0.6165803109,
323
- "f":0.5804878049
324
  },
325
  "advcl:loc":{
326
- "p":0.7307692308,
327
- "r":0.6785714286,
328
- "f":0.7037037037
329
  },
330
  "cc":{
331
- "p":0.8328530259,
332
- "r":0.769299024,
333
- "f":0.7998154982
334
  },
335
  "advmod:dvp":{
336
- "p":0.893129771,
337
  "r":0.7267080745,
338
- "f":0.801369863
339
- },
340
- "amod:ordmod":{
341
- "p":0.6885245902,
342
- "r":0.65625,
343
- "f":0.672
344
  },
345
  "appos":{
346
- "p":0.9581280788,
347
- "r":0.8942528736,
348
- "f":0.9250891795
349
  },
350
  "nmod:poss":{
351
- "p":0.7807017544,
352
- "r":0.6592592593,
353
- "f":0.7148594378
354
  },
355
  "name":{
356
- "p":0.6517857143,
357
- "r":0.5407407407,
358
- "f":0.5910931174
359
  },
360
  "nsubj:xsubj":{
361
  "p":0.0,
@@ -363,14 +358,19 @@
363
  "f":0.0
364
  },
365
  "nmod:range":{
366
- "p":0.8301158301,
367
- "r":0.7214765101,
368
- "f":0.7719928187
369
  },
370
  "parataxis:prnmod":{
371
- "p":0.3647058824,
372
- "r":0.2330827068,
373
- "f":0.2844036697
 
 
 
 
 
374
  },
375
  "erased":{
376
  "p":0.0,
@@ -378,107 +378,107 @@
378
  "f":0.0
379
  },
380
  "etc":{
381
- "p":0.8965517241,
382
- "r":0.9285714286,
383
- "f":0.9122807018
384
  }
385
  },
386
- "ents_p":0.7588215895,
387
- "ents_r":0.7585714286,
388
- "ents_f":0.7586964884,
389
  "ents_per_type":{
390
  "DATE":{
391
- "p":0.7731568998,
392
- "r":0.810703667,
393
- "f":0.7914852443
394
  },
395
  "GPE":{
396
- "p":0.7989154993,
397
- "r":0.8641251222,
398
- "f":0.8302418408
399
- },
400
- "CARDINAL":{
401
- "p":0.649321267,
402
- "r":0.5786290323,
403
- "f":0.6119402985
404
  },
405
  "ORDINAL":{
406
- "p":0.8622754491,
407
- "r":0.7578947368,
408
- "f":0.8067226891
409
  },
410
  "FAC":{
411
- "p":0.4974358974,
412
- "r":0.5215053763,
413
- "f":0.5091863517
414
- },
415
- "ORG":{
416
- "p":0.749235474,
417
- "r":0.7458143075,
418
- "f":0.7475209764
419
- },
420
- "NORP":{
421
- "p":0.6605080831,
422
- "r":0.6008403361,
423
- "f":0.6292629263
424
  },
425
  "LOC":{
426
- "p":0.6323987539,
427
- "r":0.5456989247,
428
- "f":0.5858585859
429
  },
430
  "QUANTITY":{
431
- "p":0.7244094488,
432
- "r":0.6814814815,
433
- "f":0.7022900763
434
  },
435
- "TIME":{
436
- "p":0.7627906977,
437
- "r":0.7961165049,
438
- "f":0.7790973872
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
439
  },
440
  "WORK_OF_ART":{
441
- "p":0.4444444444,
442
- "r":0.32,
443
- "f":0.3720930233
 
 
 
 
 
444
  },
445
  "MONEY":{
446
- "p":0.896,
447
  "r":0.8296296296,
448
- "f":0.8615384615
449
  },
450
  "EVENT":{
451
- "p":0.6026490066,
452
- "r":0.6691176471,
453
- "f":0.6341463415
454
- },
455
- "PRODUCT":{
456
- "p":0.4722222222,
457
- "r":0.3469387755,
458
- "f":0.4
459
- },
460
- "PERSON":{
461
- "p":0.8785803238,
462
- "r":0.9091494845,
463
- "f":0.8936035465
464
  },
465
  "PERCENT":{
466
- "p":0.7888888889,
467
- "r":0.8554216867,
468
- "f":0.8208092486
 
 
 
 
 
469
  },
470
  "LAW":{
471
- "p":0.375,
472
- "r":0.3,
473
- "f":0.3333333333
474
  },
475
  "LANGUAGE":{
476
- "p":0.75,
477
- "r":1.0,
478
- "f":0.8571428571
479
  }
480
  },
481
- "speed":3083.8656241516
482
  },
483
  "sources":[
484
  {
@@ -501,7 +501,7 @@
501
  }
502
  ],
503
  "requirements":[
504
- "spacy-transformers>=1.2.2,<1.3.0",
505
  "spacy-pkuseg>=0.0.27,<0.1.0"
506
  ]
507
  }
1
  {
2
  "lang":"zh",
3
  "name":"core_web_trf",
4
+ "version":"3.7.2",
5
+ "description":"Chinese transformer pipeline (Transformer(name='bert-base-chinese', piece_encoder='bert-wordpiece', stride=152, type='bert', width=768, window=208, vocab_size=21128)). Components: transformer, tagger, parser, ner, attribute_ruler.",
6
  "author":"Explosion",
7
  "email":"contact@explosion.ai",
8
  "url":"https://explosion.ai",
9
  "license":"MIT",
10
+ "spacy_version":">=3.7.0,<3.8.0",
11
+ "spacy_git_version":"4ec41e98f",
12
  "vectors":{
13
  "width":0,
14
  "vectors":0,
150
  "token_p":0.9458325855,
151
  "token_r":0.9136060443,
152
  "token_f":0.9294400505,
153
+ "tag_acc":0.9175332527,
154
+ "sents_p":0.7092434038,
155
+ "sents_r":0.6757116697,
156
+ "sents_f":0.6920716113,
157
+ "dep_uas":0.7572203056,
158
+ "dep_las":0.7145288854,
159
  "dep_las_per_type":{
160
  "dep":{
161
+ "p":0.5542676502,
162
+ "r":0.4251793473,
163
+ "f":0.4812167648
164
  },
165
  "case":{
166
+ "p":0.9020435069,
167
+ "r":0.8295344326,
168
+ "f":0.8642708268
169
  },
170
  "nmod:tmod":{
171
+ "p":0.7832446809,
172
+ "r":0.8013605442,
173
+ "f":0.7921990585
174
  },
175
  "nummod":{
176
+ "p":0.8815789474,
177
+ "r":0.5802798135,
178
+ "f":0.6998794697
179
  },
180
  "mark:clf":{
181
+ "p":0.9339393939,
182
+ "r":0.5747855278,
183
+ "f":0.711613946
184
  },
185
  "auxpass":{
186
+ "p":0.9095744681,
187
  "r":0.9243243243,
188
+ "f":0.9168900804
189
  },
190
  "nsubj":{
191
+ "p":0.8642424242,
192
+ "r":0.7882324039,
193
+ "f":0.8244892715
194
  },
195
  "acl":{
196
+ "p":0.7845096814,
197
+ "r":0.6966167499,
198
+ "f":0.7379553467
199
  },
200
  "advmod":{
201
+ "p":0.868605557,
202
+ "r":0.7583314441,
203
+ "f":0.8097312999
204
  },
205
  "mark":{
206
+ "p":0.8348993289,
207
+ "r":0.8177037686,
208
+ "f":0.8262120877
209
  },
210
  "xcomp":{
211
+ "p":0.8014981273,
212
+ "r":0.6970684039,
213
+ "f":0.7456445993
214
  },
215
  "nmod:assmod":{
216
+ "p":0.8492146597,
217
+ "r":0.7572362278,
218
+ "f":0.8005923001
219
  },
220
  "det":{
221
+ "p":0.8788617886,
222
+ "r":0.633274751,
223
+ "f":0.7361252979
224
  },
225
  "amod":{
226
+ "p":0.8216442174,
227
+ "r":0.6948153967,
228
+ "f":0.7529261545
229
  },
230
  "nmod:prep":{
231
+ "p":0.8173109819,
232
+ "r":0.7226255293,
233
+ "f":0.7670573126
234
  },
235
  "root":{
236
+ "p":0.7621591746,
237
+ "r":0.6886965207,
238
+ "f":0.723567993
239
  },
240
  "aux:prtmod":{
241
+ "p":0.9551020408,
242
+ "r":0.8357142857,
243
+ "f":0.8914285714
244
  },
245
  "compound:nn":{
246
+ "p":0.7833185448,
247
+ "r":0.7468697124,
248
+ "f":0.764660026
249
  },
250
  "dobj":{
251
+ "p":0.8932703275,
252
+ "r":0.8120278477,
253
+ "f":0.8507138423
254
  },
255
  "ccomp":{
256
+ "p":0.7626977519,
257
+ "r":0.7122861586,
258
+ "f":0.7366304785
259
  },
260
  "advmod:rcomp":{
261
+ "p":0.8369230769,
262
+ "r":0.7534626039,
263
+ "f":0.7930029155
264
  },
265
  "nmod:topic":{
266
+ "p":0.4624505929,
267
+ "r":0.3798701299,
268
+ "f":0.4171122995
269
  },
270
  "cop":{
271
+ "p":0.8350515464,
272
+ "r":0.6254826255,
273
+ "f":0.7152317881
274
  },
275
  "discourse":{
276
+ "p":0.5836267606,
277
+ "r":0.547029703,
278
+ "f":0.5647359455
279
  },
280
  "neg":{
281
+ "p":0.8730650155,
282
+ "r":0.6706302021,
283
+ "f":0.7585743107
284
  },
285
  "aux:modal":{
286
+ "p":0.8915401302,
287
+ "r":0.8500517063,
288
+ "f":0.870301747
289
  },
290
  "nmod":{
291
+ "p":0.7740524781,
292
+ "r":0.7204884668,
293
+ "f":0.7463106114
294
  },
295
  "aux:ba":{
296
+ "p":0.9106145251,
297
+ "r":0.8670212766,
298
+ "f":0.8882833787
299
  },
300
  "advmod:loc":{
301
+ "p":0.7519379845,
302
+ "r":0.5756676558,
303
+ "f":0.6521008403
304
  },
305
  "aux:asp":{
306
+ "p":0.9163179916,
307
+ "r":0.8732057416,
308
+ "f":0.894242548
309
  },
310
  "conj":{
311
+ "p":0.6111647672,
312
+ "r":0.5981096408,
313
+ "f":0.6045667335
314
  },
315
  "nsubjpass":{
316
+ "p":0.9,
317
+ "r":0.72,
318
+ "f":0.8
319
  },
320
  "compound:vc":{
321
+ "p":0.4628820961,
322
+ "r":0.5492227979,
323
+ "f":0.5023696682
324
  },
325
  "advcl:loc":{
326
+ "p":0.6488549618,
327
+ "r":0.6071428571,
328
+ "f":0.6273062731
329
  },
330
  "cc":{
331
+ "p":0.7943396226,
332
+ "r":0.7471162378,
333
+ "f":0.7700045725
334
  },
335
  "advmod:dvp":{
336
+ "p":0.9212598425,
337
  "r":0.7267080745,
338
+ "f":0.8125
 
 
 
 
 
339
  },
340
  "appos":{
341
+ "p":0.9382716049,
342
+ "r":0.8735632184,
343
+ "f":0.9047619048
344
  },
345
  "nmod:poss":{
346
+ "p":0.7280701754,
347
+ "r":0.6148148148,
348
+ "f":0.6666666667
349
  },
350
  "name":{
351
+ "p":0.6261682243,
352
+ "r":0.4962962963,
353
+ "f":0.5537190083
354
  },
355
  "nsubj:xsubj":{
356
  "p":0.0,
358
  "f":0.0
359
  },
360
  "nmod:range":{
361
+ "p":0.8098859316,
362
+ "r":0.7147651007,
363
+ "f":0.7593582888
364
  },
365
  "parataxis:prnmod":{
366
+ "p":0.3442622951,
367
+ "r":0.1578947368,
368
+ "f":0.2164948454
369
+ },
370
+ "amod:ordmod":{
371
+ "p":0.7547169811,
372
+ "r":0.625,
373
+ "f":0.6837606838
374
  },
375
  "erased":{
376
  "p":0.0,
378
  "f":0.0
379
  },
380
  "etc":{
381
+ "p":0.9277108434,
382
+ "r":0.9166666667,
383
+ "f":0.9221556886
384
  }
385
  },
386
+ "ents_p":0.7608897127,
387
+ "ents_r":0.7217582418,
388
+ "ents_f":0.7408075795,
389
  "ents_per_type":{
390
  "DATE":{
391
+ "p":0.7811607992,
392
+ "r":0.8136769078,
393
+ "f":0.7970873786
394
  },
395
  "GPE":{
396
+ "p":0.8325837081,
397
+ "r":0.8142717498,
398
+ "f":0.8233259204
 
 
 
 
 
399
  },
400
  "ORDINAL":{
401
+ "p":0.8488372093,
402
+ "r":0.7684210526,
403
+ "f":0.8066298343
404
  },
405
  "FAC":{
406
+ "p":0.3906976744,
407
+ "r":0.4516129032,
408
+ "f":0.4189526185
 
 
 
 
 
 
 
 
 
 
409
  },
410
  "LOC":{
411
+ "p":0.5012406948,
412
+ "r":0.5430107527,
413
+ "f":0.5212903226
414
  },
415
  "QUANTITY":{
416
+ "p":0.696,
417
+ "r":0.6444444444,
418
+ "f":0.6692307692
419
  },
420
+ "ORG":{
421
+ "p":0.7461476075,
422
+ "r":0.700152207,
423
+ "f":0.7224185316
424
+ },
425
+ "PERSON":{
426
+ "p":0.8739386022,
427
+ "r":0.8621134021,
428
+ "f":0.8679857282
429
+ },
430
+ "CARDINAL":{
431
+ "p":0.6729088639,
432
+ "r":0.5433467742,
433
+ "f":0.6012269939
434
+ },
435
+ "NORP":{
436
+ "p":0.6961038961,
437
+ "r":0.5630252101,
438
+ "f":0.6225319396
439
  },
440
  "WORK_OF_ART":{
441
+ "p":0.5625,
442
+ "r":0.3,
443
+ "f":0.3913043478
444
+ },
445
+ "TIME":{
446
+ "p":0.7875647668,
447
+ "r":0.7378640777,
448
+ "f":0.7619047619
449
  },
450
  "MONEY":{
451
+ "p":0.9256198347,
452
  "r":0.8296296296,
453
+ "f":0.875
454
  },
455
  "EVENT":{
456
+ "p":0.5430463576,
457
+ "r":0.6029411765,
458
+ "f":0.5714285714
 
 
 
 
 
 
 
 
 
 
459
  },
460
  "PERCENT":{
461
+ "p":0.869047619,
462
+ "r":0.8795180723,
463
+ "f":0.874251497
464
+ },
465
+ "PRODUCT":{
466
+ "p":0.3793103448,
467
+ "r":0.2244897959,
468
+ "f":0.2820512821
469
  },
470
  "LAW":{
471
+ "p":0.3571428571,
472
+ "r":0.25,
473
+ "f":0.2941176471
474
  },
475
  "LANGUAGE":{
476
+ "p":0.4666666667,
477
+ "r":0.7777777778,
478
+ "f":0.5833333333
479
  }
480
  },
481
+ "speed":2677.6055974261
482
  },
483
  "sources":[
484
  {
501
  }
502
  ],
503
  "requirements":[
504
+ "spacy-curated-transformers>=0.2.0,<0.3.0",
505
  "spacy-pkuseg>=0.0.27,<0.1.0"
506
  ]
507
  }
ner/model CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:67c041beffde3016c8b575b9a83ee019899b3503663171c20b6ba8ffbea0cc44
3
- size 313773
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:aef2e9eb9ee946c4e7f7270a114a937153fc8dcc18940a71b8bda2b0c2966c2c
3
+ size 313857
parser/model CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f73d923619d1e64ff59d0b5611760ba5f70e377e3ebd41dfe5709fd8c237520b
3
- size 460325
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9abe94d98e205bedaf1ccc123a88fa576102e49645c5113d6f97a04174537f23
3
+ size 460409
tagger/model CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2df04965f6b319ed3f7e65ccc9b889db8d49eee38af6308eabd443ecc515ead6
3
- size 111378
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7b6510e3b24c0049faf0ab083518978008cce5a3f975e3391e1013c02ff83b72
3
+ size 111462
transformer/cfg CHANGED
@@ -1,3 +1,3 @@
1
  {
2
- "max_batch_items":4096
3
  }
1
  {
2
+
3
  }
transformer/model CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ef125549e20637cf0a9f3d8a36479576f66af72948d7a293e030b8c783810b51
3
- size 409701271
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bee996afd07caae39d7d3d89d1c6be8afc658688768f3aac411ed6ee32dbefd8
3
+ size 406876262
vocab/strings.json CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:fa4f41317b81e784ac4c657a83e98e7c6d18f44ff5d815800d67fa398182f621
3
- size 1216856
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:294990baaab33a255307e97829ac7de76d9f2f8a364fad0425007c11fa89c258
3
+ size 1216969
zh_core_web_trf-any-py3-none-any.whl CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:71fcb96195a86c06e8c59e7d487aa0d70e81064c9efbd00c5bfa26dd16d3b617
3
- size 417445033
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:16b8d4bf23d20a04cfcbe676ae1be2be4437b40cf8101c9f3e7f6db4674ec91d
3
+ size 415134745