adrianeboyd committed on
Commit
d9c0885
1 Parent(s): 1038cbb

Update spaCy pipeline

Browse files
README.md CHANGED
@@ -14,49 +14,49 @@ model-index:
14
  metrics:
15
  - name: TAG (XPOS) Accuracy
16
  type: accuracy
17
- value: 0.990643584
18
  - task:
19
  name: POS
20
  type: token-classification
21
  metrics:
22
  - name: POS (UPOS) Accuracy
23
  type: accuracy
24
- value: 0.9915288956
25
  - task:
26
  name: MORPH
27
  type: token-classification
28
  metrics:
29
  - name: Morph (UFeats) Accuracy
30
  type: accuracy
31
- value: 0.9699941191
32
  - task:
33
  name: LEMMA
34
  type: token-classification
35
  metrics:
36
  - name: Lemma Accuracy
37
  type: accuracy
38
- value: 0.9873800777
39
  - task:
40
  name: UNLABELED_DEPENDENCIES
41
  type: token-classification
42
  metrics:
43
  - name: Unlabeled Attachment Score (UAS)
44
  type: f_score
45
- value: 0.9593756103
46
  - task:
47
  name: LABELED_DEPENDENCIES
48
  type: token-classification
49
  metrics:
50
  - name: Labeled Attachment Score (LAS)
51
  type: f_score
52
- value: 0.9480405339
53
  - task:
54
  name: SENTS
55
  type: token-classification
56
  metrics:
57
  - name: Sentences F-Score
58
  type: f_score
59
- value: 0.9827461515
60
  ---
61
  ### Details: https://spacy.io/models/de#de_dep_news_trf
62
 
@@ -65,8 +65,8 @@ German transformer pipeline (bert-base-german-cased). Components: transformer, t
65
  | Feature | Description |
66
  | --- | --- |
67
  | **Name** | `de_dep_news_trf` |
68
- | **Version** | `3.5.0` |
69
- | **spaCy** | `>=3.5.0,<3.6.0` |
70
  | **Default Pipeline** | `transformer`, `tagger`, `morphologizer`, `parser`, `lemmatizer`, `attribute_ruler` |
71
  | **Components** | `transformer`, `tagger`, `morphologizer`, `parser`, `lemmatizer`, `attribute_ruler` |
72
  | **Vectors** | 0 keys, 0 unique vectors (0 dimensions) |
@@ -98,13 +98,13 @@ German transformer pipeline (bert-base-german-cased). Components: transformer, t
98
  | `TOKEN_F` | 99.91 |
99
  | `TAG_ACC` | 99.06 |
100
  | `POS_ACC` | 99.15 |
101
- | `MORPH_ACC` | 97.00 |
102
- | `MORPH_MICRO_P` | 98.83 |
103
- | `MORPH_MICRO_R` | 98.87 |
104
  | `MORPH_MICRO_F` | 98.85 |
105
- | `SENTS_P` | 98.26 |
106
- | `SENTS_R` | 98.28 |
107
- | `SENTS_F` | 98.27 |
108
- | `DEP_UAS` | 95.94 |
109
- | `DEP_LAS` | 94.80 |
110
- | `LEMMA_ACC` | 98.74 |
 
14
  metrics:
15
  - name: TAG (XPOS) Accuracy
16
  type: accuracy
17
+ value: 0.9905775076
18
  - task:
19
  name: POS
20
  type: token-classification
21
  metrics:
22
  - name: POS (UPOS) Accuracy
23
  type: accuracy
24
+ value: 0.9914628183
25
  - task:
26
  name: MORPH
27
  type: token-classification
28
  metrics:
29
  - name: Morph (UFeats) Accuracy
30
  type: accuracy
31
+ value: 0.9700866279
32
  - task:
33
  name: LEMMA
34
  type: token-classification
35
  metrics:
36
  - name: Lemma Accuracy
37
  type: accuracy
38
+ value: 0.9872611465
39
  - task:
40
  name: UNLABELED_DEPENDENCIES
41
  type: token-classification
42
  metrics:
43
  - name: Unlabeled Attachment Score (UAS)
44
  type: f_score
45
+ value: 0.9592566441
46
  - task:
47
  name: LABELED_DEPENDENCIES
48
  type: token-classification
49
  metrics:
50
  - name: Labeled Attachment Score (LAS)
51
  type: f_score
52
+ value: 0.9484326996
53
  - task:
54
  name: SENTS
55
  type: token-classification
56
  metrics:
57
  - name: Sentences F-Score
58
  type: f_score
59
+ value: 0.9797854785
60
  ---
61
  ### Details: https://spacy.io/models/de#de_dep_news_trf
62
 
 
65
  | Feature | Description |
66
  | --- | --- |
67
  | **Name** | `de_dep_news_trf` |
68
+ | **Version** | `3.6.1` |
69
+ | **spaCy** | `>=3.6.0,<3.7.0` |
70
  | **Default Pipeline** | `transformer`, `tagger`, `morphologizer`, `parser`, `lemmatizer`, `attribute_ruler` |
71
  | **Components** | `transformer`, `tagger`, `morphologizer`, `parser`, `lemmatizer`, `attribute_ruler` |
72
  | **Vectors** | 0 keys, 0 unique vectors (0 dimensions) |
 
98
  | `TOKEN_F` | 99.91 |
99
  | `TAG_ACC` | 99.06 |
100
  | `POS_ACC` | 99.15 |
101
+ | `MORPH_ACC` | 97.01 |
102
+ | `MORPH_MICRO_P` | 98.86 |
103
+ | `MORPH_MICRO_R` | 98.84 |
104
  | `MORPH_MICRO_F` | 98.85 |
105
+ | `SENTS_P` | 97.80 |
106
+ | `SENTS_R` | 98.16 |
107
+ | `SENTS_F` | 97.98 |
108
+ | `DEP_UAS` | 95.93 |
109
+ | `DEP_LAS` | 94.84 |
110
+ | `LEMMA_ACC` | 98.73 |
accuracy.json CHANGED
@@ -3,62 +3,62 @@
3
  "token_p": 0.9991808044,
4
  "token_r": 0.9990356034,
5
  "token_f": 0.9991081986,
6
- "tag_acc": 0.990643584,
7
- "pos_acc": 0.9915288956,
8
- "morph_acc": 0.9699941191,
9
- "morph_micro_p": 0.9883140406,
10
- "morph_micro_r": 0.9886871127,
11
- "morph_micro_f": 0.9885005414,
12
  "morph_per_feat": {
13
  "Case": {
14
- "p": 0.9764129352,
15
- "r": 0.9784679312,
16
- "f": 0.9774393531
17
  },
18
  "Definite": {
19
- "p": 0.9996579247,
20
- "r": 0.9998859489,
21
- "f": 0.9997719238
22
  },
23
  "Gender": {
24
- "p": 0.9838005353,
25
- "r": 0.9855497855,
26
- "f": 0.9846743835
27
  },
28
  "Number": {
29
- "p": 0.9914020247,
30
- "r": 0.9936066713,
31
- "f": 0.9925031237
32
  },
33
  "PronType": {
34
- "p": 0.9982144306,
35
- "r": 0.9972431687,
36
- "f": 0.9977285633
37
  },
38
  "Degree": {
39
- "p": 0.995600915,
40
- "r": 0.9876069122,
41
- "f": 0.9915878023
42
  },
43
  "VerbForm": {
44
- "p": 0.9951794322,
45
- "r": 0.9975303339,
46
- "f": 0.9963534964
47
  },
48
  "Mood": {
49
- "p": 0.9903893952,
50
- "r": 0.991046261,
51
- "f": 0.9907177192
52
  },
53
  "Person": {
54
- "p": 0.9988956378,
55
- "r": 0.9994475138,
56
- "f": 0.9991714996
57
  },
58
  "Tense": {
59
- "p": 0.9970074813,
60
- "r": 0.9976709366,
61
- "f": 0.9973390986
62
  },
63
  "Reflex": {
64
  "p": 0.9976359338,
@@ -71,66 +71,66 @@
71
  "f": 1.0
72
  },
73
  "Foreign": {
74
- "p": 0.7916666667,
75
- "r": 0.1909547739,
76
- "f": 0.3076923077
77
  }
78
  },
79
- "sents_p": 0.9826446281,
80
- "sents_r": 0.9828476958,
81
- "sents_f": 0.9827461515,
82
- "dep_uas": 0.9593756103,
83
- "dep_las": 0.9480405339,
84
  "dep_las_per_type": {
85
  "cp": {
86
- "p": 0.9926605505,
87
- "r": 0.9890310786,
88
- "f": 0.9908424908
89
  },
90
  "nk": {
91
- "p": 0.9882434302,
92
- "r": 0.9892897866,
93
- "f": 0.9887663316
94
  },
95
  "sb": {
96
- "p": 0.9784172662,
97
  "r": 0.9780740221,
98
- "f": 0.978245614
99
  },
100
  "ag": {
101
- "p": 0.9753018661,
102
- "r": 0.9823106689,
103
- "f": 0.9787937207
104
  },
105
  "mnr": {
106
- "p": 0.8681462141,
107
- "r": 0.8385876419,
108
- "f": 0.8531109686
109
  },
110
  "mo": {
111
- "p": 0.8696529459,
112
- "r": 0.8719401173,
113
- "f": 0.8707950298
114
  },
115
  "oc": {
116
- "p": 0.961423445,
117
- "r": 0.9677904877,
118
- "f": 0.9645964596
119
  },
120
  "root": {
121
- "p": 0.9894628099,
122
- "r": 0.9896672866,
123
- "f": 0.9895650377
124
  },
125
  "rc": {
126
- "p": 0.8440979955,
127
- "r": 0.8497757848,
128
- "f": 0.8469273743
129
  },
130
  "op": {
131
- "p": 0.8141843972,
132
- "r": 0.8554396423,
133
- "f": 0.8343023256
134
  },
135
  "pm": {
136
  "p": 1.0,
@@ -138,84 +138,84 @@
138
  "f": 1.0
139
  },
140
  "nmc": {
141
- "p": 0.9872611465,
142
- "r": 0.9794628752,
143
- "f": 0.9833465504
144
  },
145
  "oa": {
146
- "p": 0.965085639,
147
- "r": 0.9663588391,
148
- "f": 0.9657218194
149
  },
150
  "pd": {
151
- "p": 0.9118110236,
152
- "r": 0.8514705882,
153
- "f": 0.880608365
154
  },
155
  "ep": {
156
- "p": 0.9393939394,
157
- "r": 0.9323308271,
158
- "f": 0.9358490566
159
  },
160
  "cd": {
161
- "p": 0.9336340206,
162
- "r": 0.9360465116,
163
- "f": 0.9348387097
164
  },
165
  "cj": {
166
- "p": 0.9113060429,
167
- "r": 0.9220907298,
168
- "f": 0.9166666667
169
  },
170
  "par": {
171
- "p": 0.5454545455,
172
- "r": 0.4117647059,
173
- "f": 0.469273743
174
  },
175
  "svp": {
176
- "p": 0.9727626459,
177
- "r": 0.9615384615,
178
- "f": 0.9671179884
179
  },
180
  "pg": {
181
- "p": 0.9140127389,
182
- "r": 0.9140127389,
183
- "f": 0.9140127389
184
  },
185
  "da": {
186
- "p": 0.9214659686,
187
- "r": 0.8956743003,
188
- "f": 0.9083870968
189
  },
190
  "app": {
191
- "p": 0.8052805281,
192
- "r": 0.8215488215,
193
- "f": 0.8133333333
194
  },
195
  "ac": {
196
- "p": 0.972972973,
197
- "r": 0.9230769231,
198
- "f": 0.9473684211
199
  },
200
  "pnc": {
201
- "p": 0.9001349528,
202
  "r": 0.8662337662,
203
- "f": 0.8828590338
204
  },
205
  "ju": {
206
- "p": 0.9117647059,
207
  "r": 0.9393939394,
208
- "f": 0.9253731343
209
  },
210
  "ng": {
211
- "p": 0.8710526316,
212
- "r": 0.8803191489,
213
- "f": 0.8756613757
214
  },
215
  "re": {
216
- "p": 0.8117647059,
217
- "r": 0.8214285714,
218
- "f": 0.8165680473
219
  },
220
  "dep": {
221
  "p": 0.0,
@@ -223,44 +223,44 @@
223
  "f": 0.0
224
  },
225
  "cm": {
226
- "p": 0.9565217391,
227
- "r": 0.9519230769,
228
- "f": 0.9542168675
229
  },
230
  "cc": {
231
- "p": 0.7837837838,
232
- "r": 0.7286432161,
233
- "f": 0.7552083333
234
  },
235
  "sbp": {
236
- "p": 0.963963964,
237
- "r": 0.9224137931,
238
- "f": 0.9427312775
239
  },
240
  "uc": {
241
- "p": 0.6818181818,
242
- "r": 0.5,
243
- "f": 0.5769230769
244
  },
245
  "cvc": {
246
- "p": 0.7901234568,
247
- "r": 0.8101265823,
248
  "f": 0.8
249
  },
250
  "ams": {
251
- "p": 0.7948717949,
252
- "r": 0.9117647059,
253
- "f": 0.8493150685
254
  },
255
  "rs": {
256
- "p": 0.8235294118,
257
  "r": 0.4516129032,
258
- "f": 0.5833333333
259
  },
260
  "ph": {
261
- "p": 0.8571428571,
262
- "r": 0.8571428571,
263
- "f": 0.8571428571
264
  },
265
  "dm": {
266
  "p": 1.0,
@@ -278,9 +278,9 @@
278
  "f": 0.0
279
  },
280
  "og": {
281
- "p": 0.4545454545,
282
  "r": 0.7142857143,
283
- "f": 0.5555555556
284
  },
285
  "avc": {
286
  "p": 0.0,
@@ -293,6 +293,6 @@
293
  "f": 0.8571428571
294
  }
295
  },
296
- "lemma_acc": 0.9873800777,
297
- "speed": 5858.0470519607
298
  }
 
3
  "token_p": 0.9991808044,
4
  "token_r": 0.9990356034,
5
  "token_f": 0.9991081986,
6
+ "tag_acc": 0.9905775076,
7
+ "pos_acc": 0.9914628183,
8
+ "morph_acc": 0.9700866279,
9
+ "morph_micro_p": 0.9886266605,
10
+ "morph_micro_r": 0.9884199706,
11
+ "morph_micro_f": 0.9885233048,
12
  "morph_per_feat": {
13
  "Case": {
14
+ "p": 0.9763482571,
15
+ "r": 0.9779552629,
16
+ "f": 0.9771510993
17
  },
18
  "Definite": {
19
+ "p": 0.9996579637,
20
+ "r": 1.0,
21
+ "f": 0.9998289526
22
  },
23
  "Gender": {
24
+ "p": 0.9848792598,
25
+ "r": 0.9853240009,
26
+ "f": 0.9851015801
27
  },
28
  "Number": {
29
+ "p": 0.9918825162,
30
+ "r": 0.9934908501,
31
+ "f": 0.9926860317
32
  },
33
  "PronType": {
34
+ "p": 0.9982142857,
35
+ "r": 0.9971620855,
36
+ "f": 0.9976879082
37
  },
38
  "Degree": {
39
+ "p": 0.9956001408,
40
+ "r": 0.9874323617,
41
+ "f": 0.9914994304
42
  },
43
  "VerbForm": {
44
+ "p": 0.9950717806,
45
+ "r": 0.9973155804,
46
+ "f": 0.996192417
47
  },
48
  "Mood": {
49
+ "p": 0.9897197811,
50
+ "r": 0.9897197811,
51
+ "f": 0.9897197811
52
  },
53
  "Person": {
54
+ "p": 0.9991712707,
55
+ "r": 0.9991712707,
56
+ "f": 0.9991712707
57
  },
58
  "Tense": {
59
+ "p": 0.9973382133,
60
+ "r": 0.9973382133,
61
+ "f": 0.9973382133
62
  },
63
  "Reflex": {
64
  "p": 0.9976359338,
 
71
  "f": 1.0
72
  },
73
  "Foreign": {
74
+ "p": 0.7647058824,
75
+ "r": 0.1959798995,
76
+ "f": 0.312
77
  }
78
  },
79
+ "sents_p": 0.9779699403,
80
+ "sents_r": 0.9816077702,
81
+ "sents_f": 0.9797854785,
82
+ "dep_uas": 0.9592566441,
83
+ "dep_las": 0.9484326996,
84
  "dep_las_per_type": {
85
  "cp": {
86
+ "p": 0.9908256881,
87
+ "r": 0.987202925,
88
+ "f": 0.989010989
89
  },
90
  "nk": {
91
+ "p": 0.9891317621,
92
+ "r": 0.9895748493,
93
+ "f": 0.9893532561
94
  },
95
  "sb": {
96
+ "p": 0.9767034507,
97
  "r": 0.9780740221,
98
+ "f": 0.9773882559
99
  },
100
  "ag": {
101
+ "p": 0.9764125069,
102
+ "r": 0.9839690437,
103
+ "f": 0.9801762115
104
  },
105
  "mnr": {
106
+ "p": 0.8712352684,
107
+ "r": 0.8390079865,
108
+ "f": 0.8548179872
109
  },
110
  "mo": {
111
+ "p": 0.86918429,
112
+ "r": 0.8730528019,
113
+ "f": 0.8711142511
114
  },
115
  "oc": {
116
+ "p": 0.9640071986,
117
+ "r": 0.9674894642,
118
+ "f": 0.9657451923
119
  },
120
  "root": {
121
+ "p": 0.9857936998,
122
+ "r": 0.9894606324,
123
+ "f": 0.9876237624
124
  },
125
  "rc": {
126
+ "p": 0.8392857143,
127
+ "r": 0.8430493274,
128
+ "f": 0.841163311
129
  },
130
  "op": {
131
+ "p": 0.8259629101,
132
+ "r": 0.8628912072,
133
+ "f": 0.8440233236
134
  },
135
  "pm": {
136
  "p": 1.0,
 
138
  "f": 1.0
139
  },
140
  "nmc": {
141
+ "p": 0.9888178914,
142
+ "r": 0.9778830964,
143
+ "f": 0.9833200953
144
  },
145
  "oa": {
146
+ "p": 0.9628411707,
147
+ "r": 0.9656992084,
148
+ "f": 0.9642680718
149
  },
150
  "pd": {
151
+ "p": 0.9203125,
152
+ "r": 0.8661764706,
153
+ "f": 0.8924242424
154
  },
155
  "ep": {
156
+ "p": 0.9453125,
157
+ "r": 0.9097744361,
158
+ "f": 0.9272030651
159
  },
160
  "cd": {
161
+ "p": 0.9356499356,
162
+ "r": 0.9392764858,
163
+ "f": 0.9374597034
164
  },
165
  "cj": {
166
+ "p": 0.9112627986,
167
+ "r": 0.9215976331,
168
+ "f": 0.9164010787
169
  },
170
  "par": {
171
+ "p": 0.5279503106,
172
+ "r": 0.4166666667,
173
+ "f": 0.4657534247
174
  },
175
  "svp": {
176
+ "p": 0.9766990291,
177
+ "r": 0.9673076923,
178
+ "f": 0.9719806763
179
  },
180
  "pg": {
181
+ "p": 0.9220779221,
182
+ "r": 0.9044585987,
183
+ "f": 0.9131832797
184
  },
185
  "da": {
186
+ "p": 0.9153439153,
187
+ "r": 0.8804071247,
188
+ "f": 0.897535668
189
  },
190
  "app": {
191
+ "p": 0.81,
192
+ "r": 0.8181818182,
193
+ "f": 0.8140703518
194
  },
195
  "ac": {
196
+ "p": 0.9565217391,
197
+ "r": 0.9401709402,
198
+ "f": 0.9482758621
199
  },
200
  "pnc": {
201
+ "p": 0.9025710419,
202
  "r": 0.8662337662,
203
+ "f": 0.8840291584
204
  },
205
  "ju": {
206
+ "p": 0.93,
207
  "r": 0.9393939394,
208
+ "f": 0.9346733668
209
  },
210
  "ng": {
211
+ "p": 0.8839050132,
212
+ "r": 0.8909574468,
213
+ "f": 0.8874172185
214
  },
215
  "re": {
216
+ "p": 0.8224852071,
217
+ "r": 0.8273809524,
218
+ "f": 0.824925816
219
  },
220
  "dep": {
221
  "p": 0.0,
 
223
  "f": 0.0
224
  },
225
  "cm": {
226
+ "p": 0.9661835749,
227
+ "r": 0.9615384615,
228
+ "f": 0.9638554217
229
  },
230
  "cc": {
231
+ "p": 0.7759562842,
232
+ "r": 0.7135678392,
233
+ "f": 0.7434554974
234
  },
235
  "sbp": {
236
+ "p": 0.9734513274,
237
+ "r": 0.9482758621,
238
+ "f": 0.96069869
239
  },
240
  "uc": {
241
+ "p": 0.7619047619,
242
+ "r": 0.5333333333,
243
+ "f": 0.6274509804
244
  },
245
  "cvc": {
246
+ "p": 0.8157894737,
247
+ "r": 0.7848101266,
248
  "f": 0.8
249
  },
250
  "ams": {
251
+ "p": 0.75,
252
+ "r": 0.8823529412,
253
+ "f": 0.8108108108
254
  },
255
  "rs": {
256
+ "p": 0.7777777778,
257
  "r": 0.4516129032,
258
+ "f": 0.5714285714
259
  },
260
  "ph": {
261
+ "p": 0.8333333333,
262
+ "r": 0.7142857143,
263
+ "f": 0.7692307692
264
  },
265
  "dm": {
266
  "p": 1.0,
 
278
  "f": 0.0
279
  },
280
  "og": {
281
+ "p": 0.4166666667,
282
  "r": 0.7142857143,
283
+ "f": 0.5263157895
284
  },
285
  "avc": {
286
  "p": 0.0,
 
293
  "f": 0.8571428571
294
  }
295
  },
296
+ "lemma_acc": 0.9872611465,
297
+ "speed": 2933.9454548672
298
  }
config.cfg CHANGED
@@ -47,6 +47,7 @@ pooling = {"@layers":"reduce_mean.v1"}
47
  [components.morphologizer]
48
  factory = "morphologizer"
49
  extend = false
 
50
  overwrite = true
51
  scorer = {"@scorers":"spacy.morphologizer_scorer.v1"}
52
 
@@ -86,6 +87,7 @@ pooling = {"@layers":"reduce_mean.v1"}
86
 
87
  [components.tagger]
88
  factory = "tagger"
 
89
  neg_prefix = "!"
90
  overwrite = false
91
  scorer = {"@scorers":"spacy.tagger_scorer.v1"}
@@ -107,8 +109,8 @@ max_batch_items = 4096
107
  set_extra_annotations = {"@annotation_setters":"spacy-transformers.null_annotation_setter.v1"}
108
 
109
  [components.transformer.model]
110
- @architectures = "spacy-transformers.TransformerModel.v3"
111
  name = "bert-base-german-cased"
 
112
  mixed_precision = false
113
 
114
  [components.transformer.model.get_spans]
 
47
  [components.morphologizer]
48
  factory = "morphologizer"
49
  extend = false
50
+ label_smoothing = 0.0
51
  overwrite = true
52
  scorer = {"@scorers":"spacy.morphologizer_scorer.v1"}
53
 
 
87
 
88
  [components.tagger]
89
  factory = "tagger"
90
+ label_smoothing = 0.0
91
  neg_prefix = "!"
92
  overwrite = false
93
  scorer = {"@scorers":"spacy.tagger_scorer.v1"}
 
109
  set_extra_annotations = {"@annotation_setters":"spacy-transformers.null_annotation_setter.v1"}
110
 
111
  [components.transformer.model]
 
112
  name = "bert-base-german-cased"
113
+ @architectures = "spacy-transformers.TransformerModel.v3"
114
  mixed_precision = false
115
 
116
  [components.transformer.model.get_spans]
de_dep_news_trf-any-py3-none-any.whl CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4610d0f969bbb3aec37ab4bf935b0902695405025fce141e2246a75dab2f7c63
3
- size 412823460
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e7a018eb23ae715bbb44ae42f533d31a8f5083c13762899ba2d4b7ef424ad5d0
3
+ size 412822128
lemmatizer/model CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:39be23b7e998b2032c44e0bf9d22ff3791f50c891e4b97794ad17b4f83747f59
3
  size 3977921
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9635c87e56e769c00e07ac0ec8518e913ba6a21fc4b9bbd06b49c89132289692
3
  size 3977921
meta.json CHANGED
@@ -1,14 +1,14 @@
1
  {
2
  "lang":"de",
3
  "name":"dep_news_trf",
4
- "version":"3.5.0",
5
  "description":"German transformer pipeline (bert-base-german-cased). Components: transformer, tagger, morphologizer, parser, lemmatizer (trainable_lemmatizer).",
6
  "author":"Explosion",
7
  "email":"contact@explosion.ai",
8
  "url":"https://explosion.ai",
9
  "license":"MIT",
10
- "spacy_version":">=3.5.0,<3.6.0",
11
- "spacy_git_version":"9e0322de1",
12
  "vectors":{
13
  "width":0,
14
  "vectors":0,
@@ -819,62 +819,62 @@
819
  "token_p":0.9991808044,
820
  "token_r":0.9990356034,
821
  "token_f":0.9991081986,
822
- "tag_acc":0.990643584,
823
- "pos_acc":0.9915288956,
824
- "morph_acc":0.9699941191,
825
- "morph_micro_p":0.9883140406,
826
- "morph_micro_r":0.9886871127,
827
- "morph_micro_f":0.9885005414,
828
  "morph_per_feat":{
829
  "Case":{
830
- "p":0.9764129352,
831
- "r":0.9784679312,
832
- "f":0.9774393531
833
  },
834
  "Definite":{
835
- "p":0.9996579247,
836
- "r":0.9998859489,
837
- "f":0.9997719238
838
  },
839
  "Gender":{
840
- "p":0.9838005353,
841
- "r":0.9855497855,
842
- "f":0.9846743835
843
  },
844
  "Number":{
845
- "p":0.9914020247,
846
- "r":0.9936066713,
847
- "f":0.9925031237
848
  },
849
  "PronType":{
850
- "p":0.9982144306,
851
- "r":0.9972431687,
852
- "f":0.9977285633
853
  },
854
  "Degree":{
855
- "p":0.995600915,
856
- "r":0.9876069122,
857
- "f":0.9915878023
858
  },
859
  "VerbForm":{
860
- "p":0.9951794322,
861
- "r":0.9975303339,
862
- "f":0.9963534964
863
  },
864
  "Mood":{
865
- "p":0.9903893952,
866
- "r":0.991046261,
867
- "f":0.9907177192
868
  },
869
  "Person":{
870
- "p":0.9988956378,
871
- "r":0.9994475138,
872
- "f":0.9991714996
873
  },
874
  "Tense":{
875
- "p":0.9970074813,
876
- "r":0.9976709366,
877
- "f":0.9973390986
878
  },
879
  "Reflex":{
880
  "p":0.9976359338,
@@ -887,66 +887,66 @@
887
  "f":1.0
888
  },
889
  "Foreign":{
890
- "p":0.7916666667,
891
- "r":0.1909547739,
892
- "f":0.3076923077
893
  }
894
  },
895
- "sents_p":0.9826446281,
896
- "sents_r":0.9828476958,
897
- "sents_f":0.9827461515,
898
- "dep_uas":0.9593756103,
899
- "dep_las":0.9480405339,
900
  "dep_las_per_type":{
901
  "cp":{
902
- "p":0.9926605505,
903
- "r":0.9890310786,
904
- "f":0.9908424908
905
  },
906
  "nk":{
907
- "p":0.9882434302,
908
- "r":0.9892897866,
909
- "f":0.9887663316
910
  },
911
  "sb":{
912
- "p":0.9784172662,
913
  "r":0.9780740221,
914
- "f":0.978245614
915
  },
916
  "ag":{
917
- "p":0.9753018661,
918
- "r":0.9823106689,
919
- "f":0.9787937207
920
  },
921
  "mnr":{
922
- "p":0.8681462141,
923
- "r":0.8385876419,
924
- "f":0.8531109686
925
  },
926
  "mo":{
927
- "p":0.8696529459,
928
- "r":0.8719401173,
929
- "f":0.8707950298
930
  },
931
  "oc":{
932
- "p":0.961423445,
933
- "r":0.9677904877,
934
- "f":0.9645964596
935
  },
936
  "root":{
937
- "p":0.9894628099,
938
- "r":0.9896672866,
939
- "f":0.9895650377
940
  },
941
  "rc":{
942
- "p":0.8440979955,
943
- "r":0.8497757848,
944
- "f":0.8469273743
945
  },
946
  "op":{
947
- "p":0.8141843972,
948
- "r":0.8554396423,
949
- "f":0.8343023256
950
  },
951
  "pm":{
952
  "p":1.0,
@@ -954,84 +954,84 @@
954
  "f":1.0
955
  },
956
  "nmc":{
957
- "p":0.9872611465,
958
- "r":0.9794628752,
959
- "f":0.9833465504
960
  },
961
  "oa":{
962
- "p":0.965085639,
963
- "r":0.9663588391,
964
- "f":0.9657218194
965
  },
966
  "pd":{
967
- "p":0.9118110236,
968
- "r":0.8514705882,
969
- "f":0.880608365
970
  },
971
  "ep":{
972
- "p":0.9393939394,
973
- "r":0.9323308271,
974
- "f":0.9358490566
975
  },
976
  "cd":{
977
- "p":0.9336340206,
978
- "r":0.9360465116,
979
- "f":0.9348387097
980
  },
981
  "cj":{
982
- "p":0.9113060429,
983
- "r":0.9220907298,
984
- "f":0.9166666667
985
  },
986
  "par":{
987
- "p":0.5454545455,
988
- "r":0.4117647059,
989
- "f":0.469273743
990
  },
991
  "svp":{
992
- "p":0.9727626459,
993
- "r":0.9615384615,
994
- "f":0.9671179884
995
  },
996
  "pg":{
997
- "p":0.9140127389,
998
- "r":0.9140127389,
999
- "f":0.9140127389
1000
  },
1001
  "da":{
1002
- "p":0.9214659686,
1003
- "r":0.8956743003,
1004
- "f":0.9083870968
1005
  },
1006
  "app":{
1007
- "p":0.8052805281,
1008
- "r":0.8215488215,
1009
- "f":0.8133333333
1010
  },
1011
  "ac":{
1012
- "p":0.972972973,
1013
- "r":0.9230769231,
1014
- "f":0.9473684211
1015
  },
1016
  "pnc":{
1017
- "p":0.9001349528,
1018
  "r":0.8662337662,
1019
- "f":0.8828590338
1020
  },
1021
  "ju":{
1022
- "p":0.9117647059,
1023
  "r":0.9393939394,
1024
- "f":0.9253731343
1025
  },
1026
  "ng":{
1027
- "p":0.8710526316,
1028
- "r":0.8803191489,
1029
- "f":0.8756613757
1030
  },
1031
  "re":{
1032
- "p":0.8117647059,
1033
- "r":0.8214285714,
1034
- "f":0.8165680473
1035
  },
1036
  "dep":{
1037
  "p":0.0,
@@ -1039,44 +1039,44 @@
1039
  "f":0.0
1040
  },
1041
  "cm":{
1042
- "p":0.9565217391,
1043
- "r":0.9519230769,
1044
- "f":0.9542168675
1045
  },
1046
  "cc":{
1047
- "p":0.7837837838,
1048
- "r":0.7286432161,
1049
- "f":0.7552083333
1050
  },
1051
  "sbp":{
1052
- "p":0.963963964,
1053
- "r":0.9224137931,
1054
- "f":0.9427312775
1055
  },
1056
  "uc":{
1057
- "p":0.6818181818,
1058
- "r":0.5,
1059
- "f":0.5769230769
1060
  },
1061
  "cvc":{
1062
- "p":0.7901234568,
1063
- "r":0.8101265823,
1064
  "f":0.8
1065
  },
1066
  "ams":{
1067
- "p":0.7948717949,
1068
- "r":0.9117647059,
1069
- "f":0.8493150685
1070
  },
1071
  "rs":{
1072
- "p":0.8235294118,
1073
  "r":0.4516129032,
1074
- "f":0.5833333333
1075
  },
1076
  "ph":{
1077
- "p":0.8571428571,
1078
- "r":0.8571428571,
1079
- "f":0.8571428571
1080
  },
1081
  "dm":{
1082
  "p":1.0,
@@ -1094,9 +1094,9 @@
1094
  "f":0.0
1095
  },
1096
  "og":{
1097
- "p":0.4545454545,
1098
  "r":0.7142857143,
1099
- "f":0.5555555556
1100
  },
1101
  "avc":{
1102
  "p":0.0,
@@ -1109,8 +1109,8 @@
1109
  "f":0.8571428571
1110
  }
1111
  },
1112
- "lemma_acc":0.9873800777,
1113
- "speed":5858.0470519607
1114
  },
1115
  "sources":[
1116
  {
@@ -1133,6 +1133,6 @@
1133
  }
1134
  ],
1135
  "requirements":[
1136
- "spacy-transformers>=1.2.0.dev0,<1.3.0"
1137
  ]
1138
  }
 
1
  {
2
  "lang":"de",
3
  "name":"dep_news_trf",
4
+ "version":"3.6.1",
5
  "description":"German transformer pipeline (bert-base-german-cased). Components: transformer, tagger, morphologizer, parser, lemmatizer (trainable_lemmatizer).",
6
  "author":"Explosion",
7
  "email":"contact@explosion.ai",
8
  "url":"https://explosion.ai",
9
  "license":"MIT",
10
+ "spacy_version":">=3.6.0,<3.7.0",
11
+ "spacy_git_version":"c067b5264",
12
  "vectors":{
13
  "width":0,
14
  "vectors":0,
 
819
  "token_p":0.9991808044,
820
  "token_r":0.9990356034,
821
  "token_f":0.9991081986,
822
+ "tag_acc":0.9905775076,
823
+ "pos_acc":0.9914628183,
824
+ "morph_acc":0.9700866279,
825
+ "morph_micro_p":0.9886266605,
826
+ "morph_micro_r":0.9884199706,
827
+ "morph_micro_f":0.9885233048,
828
  "morph_per_feat":{
829
  "Case":{
830
+ "p":0.9763482571,
831
+ "r":0.9779552629,
832
+ "f":0.9771510993
833
  },
834
  "Definite":{
835
+ "p":0.9996579637,
836
+ "r":1.0,
837
+ "f":0.9998289526
838
  },
839
  "Gender":{
840
+ "p":0.9848792598,
841
+ "r":0.9853240009,
842
+ "f":0.9851015801
843
  },
844
  "Number":{
845
+ "p":0.9918825162,
846
+ "r":0.9934908501,
847
+ "f":0.9926860317
848
  },
849
  "PronType":{
850
+ "p":0.9982142857,
851
+ "r":0.9971620855,
852
+ "f":0.9976879082
853
  },
854
  "Degree":{
855
+ "p":0.9956001408,
856
+ "r":0.9874323617,
857
+ "f":0.9914994304
858
  },
859
  "VerbForm":{
860
+ "p":0.9950717806,
861
+ "r":0.9973155804,
862
+ "f":0.996192417
863
  },
864
  "Mood":{
865
+ "p":0.9897197811,
866
+ "r":0.9897197811,
867
+ "f":0.9897197811
868
  },
869
  "Person":{
870
+ "p":0.9991712707,
871
+ "r":0.9991712707,
872
+ "f":0.9991712707
873
  },
874
  "Tense":{
875
+ "p":0.9973382133,
876
+ "r":0.9973382133,
877
+ "f":0.9973382133
878
  },
879
  "Reflex":{
880
  "p":0.9976359338,
 
887
  "f":1.0
888
  },
889
  "Foreign":{
890
+ "p":0.7647058824,
891
+ "r":0.1959798995,
892
+ "f":0.312
893
  }
894
  },
895
+ "sents_p":0.9779699403,
896
+ "sents_r":0.9816077702,
897
+ "sents_f":0.9797854785,
898
+ "dep_uas":0.9592566441,
899
+ "dep_las":0.9484326996,
900
  "dep_las_per_type":{
901
  "cp":{
902
+ "p":0.9908256881,
903
+ "r":0.987202925,
904
+ "f":0.989010989
905
  },
906
  "nk":{
907
+ "p":0.9891317621,
908
+ "r":0.9895748493,
909
+ "f":0.9893532561
910
  },
911
  "sb":{
912
+ "p":0.9767034507,
913
  "r":0.9780740221,
914
+ "f":0.9773882559
915
  },
916
  "ag":{
917
+ "p":0.9764125069,
918
+ "r":0.9839690437,
919
+ "f":0.9801762115
920
  },
921
  "mnr":{
922
+ "p":0.8712352684,
923
+ "r":0.8390079865,
924
+ "f":0.8548179872
925
  },
926
  "mo":{
927
+ "p":0.86918429,
928
+ "r":0.8730528019,
929
+ "f":0.8711142511
930
  },
931
  "oc":{
932
+ "p":0.9640071986,
933
+ "r":0.9674894642,
934
+ "f":0.9657451923
935
  },
936
  "root":{
937
+ "p":0.9857936998,
938
+ "r":0.9894606324,
939
+ "f":0.9876237624
940
  },
941
  "rc":{
942
+ "p":0.8392857143,
943
+ "r":0.8430493274,
944
+ "f":0.841163311
945
  },
946
  "op":{
947
+ "p":0.8259629101,
948
+ "r":0.8628912072,
949
+ "f":0.8440233236
950
  },
951
  "pm":{
952
  "p":1.0,
 
954
  "f":1.0
955
  },
956
  "nmc":{
957
+ "p":0.9888178914,
958
+ "r":0.9778830964,
959
+ "f":0.9833200953
960
  },
961
  "oa":{
962
+ "p":0.9628411707,
963
+ "r":0.9656992084,
964
+ "f":0.9642680718
965
  },
966
  "pd":{
967
+ "p":0.9203125,
968
+ "r":0.8661764706,
969
+ "f":0.8924242424
970
  },
971
  "ep":{
972
+ "p":0.9453125,
973
+ "r":0.9097744361,
974
+ "f":0.9272030651
975
  },
976
  "cd":{
977
+ "p":0.9356499356,
978
+ "r":0.9392764858,
979
+ "f":0.9374597034
980
  },
981
  "cj":{
982
+ "p":0.9112627986,
983
+ "r":0.9215976331,
984
+ "f":0.9164010787
985
  },
986
  "par":{
987
+ "p":0.5279503106,
988
+ "r":0.4166666667,
989
+ "f":0.4657534247
990
  },
991
  "svp":{
992
+ "p":0.9766990291,
993
+ "r":0.9673076923,
994
+ "f":0.9719806763
995
  },
996
  "pg":{
997
+ "p":0.9220779221,
998
+ "r":0.9044585987,
999
+ "f":0.9131832797
1000
  },
1001
  "da":{
1002
+ "p":0.9153439153,
1003
+ "r":0.8804071247,
1004
+ "f":0.897535668
1005
  },
1006
  "app":{
1007
+ "p":0.81,
1008
+ "r":0.8181818182,
1009
+ "f":0.8140703518
1010
  },
1011
  "ac":{
1012
+ "p":0.9565217391,
1013
+ "r":0.9401709402,
1014
+ "f":0.9482758621
1015
  },
1016
  "pnc":{
1017
+ "p":0.9025710419,
1018
  "r":0.8662337662,
1019
+ "f":0.8840291584
1020
  },
1021
  "ju":{
1022
+ "p":0.93,
1023
  "r":0.9393939394,
1024
+ "f":0.9346733668
1025
  },
1026
  "ng":{
1027
+ "p":0.8839050132,
1028
+ "r":0.8909574468,
1029
+ "f":0.8874172185
1030
  },
1031
  "re":{
1032
+ "p":0.8224852071,
1033
+ "r":0.8273809524,
1034
+ "f":0.824925816
1035
  },
1036
  "dep":{
1037
  "p":0.0,
 
1039
  "f":0.0
1040
  },
1041
  "cm":{
1042
+ "p":0.9661835749,
1043
+ "r":0.9615384615,
1044
+ "f":0.9638554217
1045
  },
1046
  "cc":{
1047
+ "p":0.7759562842,
1048
+ "r":0.7135678392,
1049
+ "f":0.7434554974
1050
  },
1051
  "sbp":{
1052
+ "p":0.9734513274,
1053
+ "r":0.9482758621,
1054
+ "f":0.96069869
1055
  },
1056
  "uc":{
1057
+ "p":0.7619047619,
1058
+ "r":0.5333333333,
1059
+ "f":0.6274509804
1060
  },
1061
  "cvc":{
1062
+ "p":0.8157894737,
1063
+ "r":0.7848101266,
1064
  "f":0.8
1065
  },
1066
  "ams":{
1067
+ "p":0.75,
1068
+ "r":0.8823529412,
1069
+ "f":0.8108108108
1070
  },
1071
  "rs":{
1072
+ "p":0.7777777778,
1073
  "r":0.4516129032,
1074
+ "f":0.5714285714
1075
  },
1076
  "ph":{
1077
+ "p":0.8333333333,
1078
+ "r":0.7142857143,
1079
+ "f":0.7692307692
1080
  },
1081
  "dm":{
1082
  "p":1.0,
 
1094
  "f":0.0
1095
  },
1096
  "og":{
1097
+ "p":0.4166666667,
1098
  "r":0.7142857143,
1099
+ "f":0.5263157895
1100
  },
1101
  "avc":{
1102
  "p":0.0,
 
1109
  "f":0.8571428571
1110
  }
1111
  },
1112
+ "lemma_acc":0.9872611465,
1113
+ "speed":2933.9454548672
1114
  },
1115
  "sources":[
1116
  {
 
1133
  }
1134
  ],
1135
  "requirements":[
1136
+ "spacy-transformers>=1.2.2,<1.3.0"
1137
  ]
1138
  }
morphologizer/cfg CHANGED
@@ -1,5 +1,6 @@
1
  {
2
  "extend":false,
 
3
  "labels_morph":{
4
  "POS=PUNCT":"",
5
  "Case=Nom|Gender=Masc|Number=Sing|POS=PROPN":"Case=Nom|Gender=Masc|Number=Sing",
 
1
  {
2
  "extend":false,
3
+ "label_smoothing":0.0,
4
  "labels_morph":{
5
  "POS=PUNCT":"",
6
  "Case=Nom|Gender=Masc|Number=Sing|POS=PROPN":"Case=Nom|Gender=Masc|Number=Sing",
morphologizer/model CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:dcd0b37e93a4ed1273e678c6c8556930c642765dd4295f3b49d079162e734cbd
3
  size 2061573
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dafaa8f2141aba369eb18c3a6727746f13ecc43c975715c65fa0be05f6d65e82
3
  size 2061573
parser/model CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6cb7719cbc056b58d3e19a480625af6451b7eef6f456580f69394703d0e2ffb3
3
  size 768761
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8eec7f88b6a5e5244ba4ea9f103c1e7ca70c45bbb6406e5d0b12d9d2c4c06dfe
3
  size 768761
tagger/cfg CHANGED
@@ -1,4 +1,5 @@
1
  {
 
2
  "labels":[
3
  "$(",
4
  "$,",
 
1
  {
2
+ "label_smoothing":0.0,
3
  "labels":[
4
  "$(",
5
  "$,",
tagger/model CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c81a3419f48cb52dbfdc99f1aeec6c51084dcf73ceed0e5d87eee7ee853bf3ab
3
  size 166746
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cbbb191c59d892fc8135e553b55f152dd944d3f8d57f678b05e8f2a4d018063b
3
  size 166746
transformer/model CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:532a2d9bd48648667d6b93ba75188118f8f5e8f166adb802a925d85a5a904828
3
- size 437388334
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ef8c2744ef38035601218e95c13856630fccd542cd509f3bf474ed63e28dc44f
3
+ size 437388252
vocab/strings.json CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:799d2cddc3be0264980ae3de66edd48b8e0cebd216c5d94f458aa07bf02a0c96
3
- size 3040576
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a6a2bd3d2d62b594c5a1859c8a4a86a3cc82b314b27c93e5859aad8503a45455
3
+ size 3040776