adrianeboyd committed on
Commit
7381706
1 Parent(s): ed3a84e

Update spaCy pipeline

Browse files
README.md CHANGED
@@ -14,62 +14,62 @@ model-index:
14
  metrics:
15
  - name: NER Precision
16
  type: precision
17
- value: 0.9520121233
18
  - name: NER Recall
19
  type: recall
20
- value: 0.9516916344
21
  - name: NER F Score
22
  type: f_score
23
- value: 0.9518518519
24
  - task:
25
  name: TAG
26
  type: token-classification
27
  metrics:
28
  - name: TAG (XPOS) Accuracy
29
  type: accuracy
30
- value: 0.9889933439
31
  - task:
32
  name: POS
33
  type: token-classification
34
  metrics:
35
  - name: POS (UPOS) Accuracy
36
  type: accuracy
37
- value: 0.9889933439
38
  - task:
39
  name: MORPH
40
  type: token-classification
41
  metrics:
42
  - name: Morph (UFeats) Accuracy
43
  type: accuracy
44
- value: 0.9747833538
45
  - task:
46
  name: LEMMA
47
  type: token-classification
48
  metrics:
49
  - name: Lemma Accuracy
50
  type: accuracy
51
- value: 2.15292e-05
52
  - task:
53
  name: UNLABELED_DEPENDENCIES
54
  type: token-classification
55
  metrics:
56
  - name: Unlabeled Attachment Score (UAS)
57
  type: f_score
58
- value: 0.9630346126
59
  - task:
60
  name: LABELED_DEPENDENCIES
61
  type: token-classification
62
  metrics:
63
  - name: Labeled Attachment Score (LAS)
64
  type: f_score
65
- value: 0.9520673253
66
  - task:
67
  name: SENTS
68
  type: token-classification
69
  metrics:
70
  - name: Sentences F-Score
71
  type: f_score
72
- value: 0.9987634357
73
  ---
74
  ### Details: https://spacy.io/models/ru#ru_core_news_lg
75
 
@@ -78,8 +78,8 @@ Russian pipeline optimized for CPU. Components: tok2vec, morphologizer, parser,
78
  | Feature | Description |
79
  | --- | --- |
80
  | **Name** | `ru_core_news_lg` |
81
- | **Version** | `3.4.0` |
82
- | **spaCy** | `>=3.4.0,<3.5.0` |
83
  | **Default Pipeline** | `tok2vec`, `morphologizer`, `parser`, `attribute_ruler`, `lemmatizer`, `ner` |
84
  | **Components** | `tok2vec`, `morphologizer`, `parser`, `senter`, `attribute_ruler`, `lemmatizer`, `ner` |
85
  | **Vectors** | 500002 keys, 500002 unique vectors (300 dimensions) |
@@ -105,22 +105,22 @@ Russian pipeline optimized for CPU. Components: tok2vec, morphologizer, parser,
105
 
106
  | Type | Score |
107
  | --- | --- |
108
- | `TOKEN_ACC` | 99.84 |
109
  | `TOKEN_P` | 97.28 |
110
- | `TOKEN_R` | 98.32 |
111
  | `TOKEN_F` | 97.79 |
112
- | `POS_ACC` | 98.90 |
113
- | `MORPH_ACC` | 97.48 |
114
  | `MORPH_MICRO_P` | 98.97 |
115
- | `MORPH_MICRO_R` | 98.33 |
116
- | `MORPH_MICRO_F` | 98.65 |
117
  | `SENTS_P` | 99.87 |
118
- | `SENTS_R` | 99.89 |
119
- | `SENTS_F` | 99.88 |
120
- | `DEP_UAS` | 96.30 |
121
- | `DEP_LAS` | 95.21 |
122
- | `TAG_ACC` | 98.90 |
123
  | `LEMMA_ACC` | 0.00 |
124
- | `ENTS_P` | 95.20 |
125
- | `ENTS_R` | 95.17 |
126
- | `ENTS_F` | 95.19 |
14
  metrics:
15
  - name: NER Precision
16
  type: precision
17
+ value: 0.9524209818
18
  - name: NER Recall
19
  type: recall
20
+ value: 0.9535431745
21
  - name: NER F Score
22
  type: f_score
23
+ value: 0.9529817478
24
  - task:
25
  name: TAG
26
  type: token-classification
27
  metrics:
28
  - name: TAG (XPOS) Accuracy
29
  type: accuracy
30
+ value: 0.989280677
31
  - task:
32
  name: POS
33
  type: token-classification
34
  metrics:
35
  - name: POS (UPOS) Accuracy
36
  type: accuracy
37
+ value: 0.989280677
38
  - task:
39
  name: MORPH
40
  type: token-classification
41
  metrics:
42
  - name: Morph (UFeats) Accuracy
43
  type: accuracy
44
+ value: 0.9749177029
45
  - task:
46
  name: LEMMA
47
  type: token-classification
48
  metrics:
49
  - name: Lemma Accuracy
50
  type: accuracy
51
+ value: 2.15295e-05
52
  - task:
53
  name: UNLABELED_DEPENDENCIES
54
  type: token-classification
55
  metrics:
56
  - name: Unlabeled Attachment Score (UAS)
57
  type: f_score
58
+ value: 0.962198055
59
  - task:
60
  name: LABELED_DEPENDENCIES
61
  type: token-classification
62
  metrics:
63
  - name: Labeled Attachment Score (LAS)
64
  type: f_score
65
+ value: 0.9511948091
66
  - task:
67
  name: SENTS
68
  type: token-classification
69
  metrics:
70
  - name: Sentences F-Score
71
  type: f_score
72
+ value: 0.9985729236
73
  ---
74
  ### Details: https://spacy.io/models/ru#ru_core_news_lg
75
 
78
  | Feature | Description |
79
  | --- | --- |
80
  | **Name** | `ru_core_news_lg` |
81
+ | **Version** | `3.5.0` |
82
+ | **spaCy** | `>=3.5.0,<3.6.0` |
83
  | **Default Pipeline** | `tok2vec`, `morphologizer`, `parser`, `attribute_ruler`, `lemmatizer`, `ner` |
84
  | **Components** | `tok2vec`, `morphologizer`, `parser`, `senter`, `attribute_ruler`, `lemmatizer`, `ner` |
85
  | **Vectors** | 500002 keys, 500002 unique vectors (300 dimensions) |
105
 
106
  | Type | Score |
107
  | --- | --- |
108
+ | `TOKEN_ACC` | 99.68 |
109
  | `TOKEN_P` | 97.28 |
110
+ | `TOKEN_R` | 98.31 |
111
  | `TOKEN_F` | 97.79 |
112
+ | `POS_ACC` | 98.93 |
113
+ | `MORPH_ACC` | 97.49 |
114
  | `MORPH_MICRO_P` | 98.97 |
115
+ | `MORPH_MICRO_R` | 98.30 |
116
+ | `MORPH_MICRO_F` | 98.64 |
117
  | `SENTS_P` | 99.87 |
118
+ | `SENTS_R` | 99.85 |
119
+ | `SENTS_F` | 99.86 |
120
+ | `DEP_UAS` | 96.22 |
121
+ | `DEP_LAS` | 95.12 |
122
+ | `TAG_ACC` | 98.93 |
123
  | `LEMMA_ACC` | 0.00 |
124
+ | `ENTS_P` | 95.24 |
125
+ | `ENTS_R` | 95.35 |
126
+ | `ENTS_F` | 95.30 |
accuracy.json CHANGED
@@ -1,68 +1,68 @@
1
  {
2
- "token_acc": 0.9984047451,
3
- "token_p": 0.9727635194,
4
- "token_r": 0.9831678569,
5
- "token_f": 0.9779380158,
6
- "pos_acc": 0.9889933439,
7
- "morph_acc": 0.9747833538,
8
- "morph_micro_p": 0.9896991632,
9
- "morph_micro_r": 0.9832782178,
10
- "morph_micro_f": 0.9864782422,
11
  "morph_per_feat": {
12
  "Animacy": {
13
- "p": 0.9896970764,
14
- "r": 0.980088367,
15
- "f": 0.9848692858
16
  },
17
  "Case": {
18
- "p": 0.9789719626,
19
- "r": 0.9722662264,
20
- "f": 0.9756075718
21
  },
22
  "Gender": {
23
- "p": 0.9880955025,
24
- "r": 0.9819453948,
25
- "f": 0.9850108489
26
  },
27
  "Number": {
28
- "p": 0.9960197873,
29
- "r": 0.9897728557,
30
- "f": 0.9928864957
31
  },
32
  "Degree": {
33
- "p": 0.9885778967,
34
- "r": 0.9863449692,
35
- "f": 0.9874601706
36
  },
37
  "Aspect": {
38
- "p": 0.9905277402,
39
- "r": 0.9869662921,
40
- "f": 0.9887438091
41
  },
42
  "Mood": {
43
- "p": 0.9986340494,
44
- "r": 0.9970245475,
45
- "f": 0.9978286494
46
  },
47
  "Tense": {
48
- "p": 0.9932989691,
49
- "r": 0.9896261298,
50
- "f": 0.991459148
51
  },
52
  "VerbForm": {
53
- "p": 0.9952187641,
54
- "r": 0.9916404494,
55
- "f": 0.9934263845
56
  },
57
  "Voice": {
58
- "p": 0.9910690122,
59
- "r": 0.987505618,
60
- "f": 0.9892841063
61
  },
62
  "StyleVariant": {
63
- "p": 0.9931170108,
64
- "r": 0.9960552268,
65
- "f": 0.9945839488
66
  },
67
  "Polarity": {
68
  "p": 1.0,
@@ -70,14 +70,14 @@
70
  "f": 1.0
71
  },
72
  "Person": {
73
- "p": 0.9997729852,
74
- "r": 0.9934581547,
75
- "f": 0.9966055669
76
  },
77
  "Foreign": {
78
- "p": 0.9700483092,
79
- "r": 0.8685121107,
80
- "f": 0.9164764948
81
  },
82
  "Hyph": {
83
  "p": 0.0,
@@ -85,186 +85,186 @@
85
  "f": 0.0
86
  }
87
  },
88
- "sents_p": 0.9986684421,
89
- "sents_r": 0.9988584475,
90
- "sents_f": 0.9987634357,
91
- "dep_uas": 0.9630346126,
92
- "dep_las": 0.9520673253,
93
  "dep_las_per_type": {
94
  "case": {
95
- "p": 0.9938650307,
96
- "r": 0.9893826928,
97
- "f": 0.9916187965
98
  },
99
  "parataxis": {
100
- "p": 0.878342246,
101
- "r": 0.8499353169,
102
- "f": 0.8639053254
103
  },
104
  "nmod": {
105
- "p": 0.9342683497,
106
- "r": 0.9280208043,
107
- "f": 0.9311340975
108
  },
109
  "advmod": {
110
- "p": 0.9611451943,
111
- "r": 0.9530246705,
112
- "f": 0.9570677074
113
  },
114
  "obl": {
115
- "p": 0.9446489434,
116
- "r": 0.9377452971,
117
- "f": 0.9411844607
118
  },
119
  "amod": {
120
- "p": 0.9890609462,
121
- "r": 0.9844457014,
122
- "f": 0.9867479271
123
  },
124
  "nsubj": {
125
- "p": 0.9695295232,
126
- "r": 0.9696826149,
127
- "f": 0.969606063
128
  },
129
  "root": {
130
- "p": 0.9899066844,
131
- "r": 0.9889649924,
132
- "f": 0.9894356144
133
  },
134
  "xcomp": {
135
- "p": 0.9630188679,
136
- "r": 0.9696048632,
137
- "f": 0.9663006437
138
  },
139
  "conj": {
140
- "p": 0.8997961957,
141
- "r": 0.9090597117,
142
- "f": 0.9044042335
143
  },
144
  "cc": {
145
- "p": 0.9761235955,
146
- "r": 0.9752104771,
147
- "f": 0.9756668226
148
  },
149
  "fixed": {
150
- "p": 0.9860228717,
151
- "r": 0.9872773537,
152
- "f": 0.9866497139
153
  },
154
  "mark": {
155
- "p": 0.9674690956,
156
- "r": 0.9706266319,
157
- "f": 0.9690452916
158
  },
159
  "ccomp": {
160
- "p": 0.976016684,
161
- "r": 0.9790794979,
162
- "f": 0.9775456919
163
  },
164
  "nummod:gov": {
165
- "p": 0.9726315789,
166
- "r": 0.9625,
167
- "f": 0.967539267
168
  },
169
  "nummod": {
170
- "p": 0.9629310345,
171
- "r": 0.9482173175,
172
- "f": 0.9555175364
173
  },
174
  "obj": {
175
- "p": 0.9708791209,
176
- "r": 0.9655737705,
177
- "f": 0.9682191781
178
  },
179
  "det": {
180
- "p": 0.9680696662,
181
- "r": 0.9638728324,
182
- "f": 0.9659666908
183
  },
184
  "appos": {
185
- "p": 0.8946873531,
186
- "r": 0.8174398625,
187
- "f": 0.8543209877
188
  },
189
  "aux": {
190
- "p": 0.9714285714,
191
- "r": 0.9714285714,
192
- "f": 0.9714285714
193
  },
194
  "flat": {
195
- "p": 0.9952718676,
196
- "r": 0.9589977221,
197
- "f": 0.9767981439
198
  },
199
  "flat:name": {
200
- "p": 0.976016684,
201
- "r": 0.9669421488,
202
- "f": 0.9714582252
203
  },
204
  "iobj": {
205
- "p": 0.9184782609,
206
- "r": 0.8492462312,
207
- "f": 0.8825065274
208
  },
209
  "acl": {
210
- "p": 0.9164524422,
211
- "r": 0.8901373283,
212
- "f": 0.9031032299
213
  },
214
  "obl:agent": {
215
- "p": 0.7125,
216
- "r": 0.75,
217
- "f": 0.7307692308
218
  },
219
  "advcl": {
220
- "p": 0.8886310905,
221
  "r": 0.8744292237,
222
- "f": 0.8814729574
223
  },
224
  "cop": {
225
- "p": 0.9361702128,
226
- "r": 0.9166666667,
227
- "f": 0.9263157895
228
  },
229
  "flat:foreign": {
230
- "p": 0.949602122,
231
- "r": 0.8136363636,
232
- "f": 0.876376989
233
  },
234
  "aux:pass": {
235
- "p": 0.9884393064,
236
- "r": 0.9799426934,
237
- "f": 0.9841726619
238
  },
239
  "nsubj:pass": {
240
- "p": 0.9588235294,
241
- "r": 0.9518248175,
242
- "f": 0.9553113553
243
  },
244
  "acl:relcl": {
245
- "p": 0.8252631579,
246
- "r": 0.8049281314,
247
- "f": 0.814968815
248
  },
249
  "orphan": {
250
- "p": 0.78125,
251
  "r": 0.6944444444,
252
- "f": 0.7352941176
253
  },
254
  "discourse": {
255
- "p": 0.75,
256
- "r": 0.9230769231,
257
- "f": 0.8275862069
258
  },
259
  "csubj": {
260
- "p": 0.9705882353,
261
- "r": 0.9295774648,
262
- "f": 0.9496402878
263
  },
264
  "expl": {
265
- "p": 0.7894736842,
266
  "r": 0.7894736842,
267
- "f": 0.7894736842
268
  },
269
  "compound": {
270
  "p": 1.0,
@@ -272,9 +272,9 @@
272
  "f": 0.4615384615
273
  },
274
  "csubj:pass": {
275
- "p": 0.9,
276
  "r": 0.8181818182,
277
- "f": 0.8571428571
278
  },
279
  "nummod:entity": {
280
  "p": 1.0,
@@ -287,27 +287,27 @@
287
  "f": 0.0
288
  }
289
  },
290
- "tag_acc": 0.9889933439,
291
- "lemma_acc": 2.15292e-05,
292
- "ents_p": 0.9520121233,
293
- "ents_r": 0.9516916344,
294
- "ents_f": 0.9518518519,
295
  "ents_per_type": {
296
  "PER": {
297
- "p": 0.9595278246,
298
- "r": 0.9584503088,
299
- "f": 0.958988764
300
  },
301
  "LOC": {
302
- "p": 0.9754485364,
303
- "r": 0.9759093056,
304
- "f": 0.9756788666
305
  },
306
  "ORG": {
307
- "p": 0.9211557297,
308
- "r": 0.9207048458,
309
- "f": 0.9209302326
310
  }
311
  },
312
- "speed": 3393.7960657989
313
  }
1
  {
2
+ "token_acc": 0.9968038482,
3
+ "token_p": 0.9727525387,
4
+ "token_r": 0.9831462495,
5
+ "token_f": 0.9779217779,
6
+ "pos_acc": 0.989280677,
7
+ "morph_acc": 0.9749177029,
8
+ "morph_micro_p": 0.9897327316,
9
+ "morph_micro_r": 0.9829975554,
10
+ "morph_micro_f": 0.9863536461,
11
  "morph_per_feat": {
12
  "Animacy": {
13
+ "p": 0.9905472053,
14
+ "r": 0.9808150689,
15
+ "f": 0.9856571145
16
  },
17
  "Case": {
18
+ "p": 0.9776694449,
19
+ "r": 0.9709944443,
20
+ "f": 0.9743205122
21
  },
22
  "Gender": {
23
+ "p": 0.9884699976,
24
+ "r": 0.982055753,
25
+ "f": 0.9852524358
26
  },
27
  "Number": {
28
+ "p": 0.9958673769,
29
+ "r": 0.9894338343,
30
+ "f": 0.9926401814
31
  },
32
  "Degree": {
33
+ "p": 0.9884927566,
34
+ "r": 0.9877823409,
35
+ "f": 0.988137421
36
  },
37
  "Aspect": {
38
+ "p": 0.9913263462,
39
+ "r": 0.986247191,
40
+ "f": 0.988780246
41
  },
42
  "Mood": {
43
+ "p": 0.9990060877,
44
+ "r": 0.9969005703,
45
+ "f": 0.9979522184
46
  },
47
  "Tense": {
48
+ "p": 0.99442264,
49
+ "r": 0.9889071487,
50
+ "f": 0.9916572253
51
  },
52
  "VerbForm": {
53
+ "p": 0.9958438742,
54
+ "r": 0.990741573,
55
+ "f": 0.9932861713
56
  },
57
  "Voice": {
58
+ "p": 0.9914166968,
59
+ "r": 0.9863370787,
60
+ "f": 0.9888703645
61
  },
62
  "StyleVariant": {
63
+ "p": 0.989194499,
64
+ "r": 0.9930966469,
65
+ "f": 0.9911417323
66
  },
67
  "Polarity": {
68
  "p": 1.0,
70
  "f": 1.0
71
  },
72
  "Person": {
73
+ "p": 0.9995459705,
74
+ "r": 0.9932325739,
75
+ "f": 0.9963792713
76
  },
77
  "Foreign": {
78
+ "p": 0.9711260828,
79
+ "r": 0.8728373702,
80
+ "f": 0.9193621868
81
  },
82
  "Hyph": {
83
  "p": 0.0,
85
  "f": 0.0
86
  }
87
  },
88
+ "sents_p": 0.9986679353,
89
+ "sents_r": 0.99847793,
90
+ "sents_f": 0.9985729236,
91
+ "dep_uas": 0.962198055,
92
+ "dep_las": 0.9511948091,
93
  "dep_las_per_type": {
94
  "case": {
95
+ "p": 0.9918025064,
96
+ "r": 0.989006859,
97
+ "f": 0.9904027098
98
  },
99
  "parataxis": {
100
+ "p": 0.8842034806,
101
+ "r": 0.8544631307,
102
+ "f": 0.8690789474
103
  },
104
  "nmod": {
105
+ "p": 0.9328846513,
106
+ "r": 0.9269062877,
107
+ "f": 0.9298858607
108
  },
109
  "advmod": {
110
+ "p": 0.9554118448,
111
+ "r": 0.9486312944,
112
+ "f": 0.9520094964
113
  },
114
  "obl": {
115
+ "p": 0.9425224734,
116
+ "r": 0.9365272703,
117
+ "f": 0.9395153079
118
  },
119
  "amod": {
120
+ "p": 0.9893299189,
121
+ "r": 0.9833144796,
122
+ "f": 0.9863130274
123
  },
124
  "nsubj": {
125
+ "p": 0.9722486521,
126
+ "r": 0.9681035844,
127
+ "f": 0.9701716908
128
  },
129
  "root": {
130
+ "p": 0.9893313012,
131
+ "r": 0.9880136986,
132
+ "f": 0.9886720609
133
  },
134
  "xcomp": {
135
+ "p": 0.9570135747,
136
+ "r": 0.9642857143,
137
+ "f": 0.9606358819
138
  },
139
  "conj": {
140
+ "p": 0.8906144497,
141
+ "r": 0.9052848318,
142
+ "f": 0.8978897209
143
  },
144
  "cc": {
145
+ "p": 0.9746597841,
146
+ "r": 0.9714686623,
147
+ "f": 0.9730616069
148
  },
149
  "fixed": {
150
+ "p": 0.9835025381,
151
+ "r": 0.9860050891,
152
+ "f": 0.9847522236
153
  },
154
  "mark": {
155
+ "p": 0.9681197137,
156
+ "r": 0.9712793734,
157
+ "f": 0.9696969697
158
  },
159
  "ccomp": {
160
+ "p": 0.978125,
161
+ "r": 0.9822175732,
162
+ "f": 0.9801670146
163
  },
164
  "nummod:gov": {
165
+ "p": 0.9684210526,
166
+ "r": 0.9583333333,
167
+ "f": 0.9633507853
168
  },
169
  "nummod": {
170
+ "p": 0.9664948454,
171
+ "r": 0.955008489,
172
+ "f": 0.9607173356
173
  },
174
  "obj": {
175
+ "p": 0.9738364087,
176
+ "r": 0.9661202186,
177
+ "f": 0.969962968
178
  },
179
  "det": {
180
+ "p": 0.976,
181
+ "r": 0.9696531792,
182
+ "f": 0.9728162378
183
  },
184
  "appos": {
185
+ "p": 0.8951881848,
186
+ "r": 0.8071305842,
187
+ "f": 0.8488818613
188
  },
189
  "aux": {
190
+ "p": 0.9619047619,
191
+ "r": 0.9619047619,
192
+ "f": 0.9619047619
193
  },
194
  "flat": {
195
+ "p": 0.9929411765,
196
+ "r": 0.9612756264,
197
+ "f": 0.9768518519
198
  },
199
  "flat:name": {
200
+ "p": 0.9759665622,
201
+ "r": 0.9648760331,
202
+ "f": 0.9703896104
203
  },
204
  "iobj": {
205
+ "p": 0.9176788124,
206
+ "r": 0.8542713568,
207
+ "f": 0.8848405986
208
  },
209
  "acl": {
210
+ "p": 0.9232769831,
211
+ "r": 0.88639201,
212
+ "f": 0.9044585987
213
  },
214
  "obl:agent": {
215
+ "p": 0.7792207792,
216
+ "r": 0.7894736842,
217
+ "f": 0.7843137255
218
  },
219
  "advcl": {
220
+ "p": 0.8665158371,
221
  "r": 0.8744292237,
222
+ "f": 0.8704545455
223
  },
224
  "cop": {
225
+ "p": 0.9246575342,
226
+ "r": 0.9375,
227
+ "f": 0.9310344828
228
  },
229
  "flat:foreign": {
230
+ "p": 0.963060686,
231
+ "r": 0.8295454545,
232
+ "f": 0.8913308913
233
  },
234
  "aux:pass": {
235
+ "p": 0.9913294798,
236
+ "r": 0.9828080229,
237
+ "f": 0.9870503597
238
  },
239
  "nsubj:pass": {
240
+ "p": 0.9505813953,
241
+ "r": 0.9547445255,
242
+ "f": 0.9526584122
243
  },
244
  "acl:relcl": {
245
+ "p": 0.8177966102,
246
+ "r": 0.7926078029,
247
+ "f": 0.8050052138
248
  },
249
  "orphan": {
250
+ "p": 0.7352941176,
251
  "r": 0.6944444444,
252
+ "f": 0.7142857143
253
  },
254
  "discourse": {
255
+ "p": 0.9117647059,
256
+ "r": 0.9538461538,
257
+ "f": 0.9323308271
258
  },
259
  "csubj": {
260
+ "p": 0.964028777,
261
+ "r": 0.9436619718,
262
+ "f": 0.9537366548
263
  },
264
  "expl": {
265
+ "p": 0.8823529412,
266
  "r": 0.7894736842,
267
+ "f": 0.8333333333
268
  },
269
  "compound": {
270
  "p": 1.0,
272
  "f": 0.4615384615
273
  },
274
  "csubj:pass": {
275
+ "p": 0.8181818182,
276
  "r": 0.8181818182,
277
+ "f": 0.8181818182
278
  },
279
  "nummod:entity": {
280
  "p": 1.0,
287
  "f": 0.0
288
  }
289
  },
290
+ "tag_acc": 0.989280677,
291
+ "lemma_acc": 2.15295e-05,
292
+ "ents_p": 0.9524209818,
293
+ "ents_r": 0.9535431745,
294
+ "ents_f": 0.9529817478,
295
  "ents_per_type": {
296
  "PER": {
297
+ "p": 0.9641456583,
298
+ "r": 0.9663110612,
299
+ "f": 0.9652271453
300
  },
301
  "LOC": {
302
+ "p": 0.9740566038,
303
+ "r": 0.9754369391,
304
+ "f": 0.9747462827
305
  },
306
  "ORG": {
307
+ "p": 0.9197258933,
308
+ "r": 0.9197258933,
309
+ "f": 0.9197258933
310
  }
311
  },
312
+ "speed": 2459.2661417009
313
  }
attribute_ruler/patterns CHANGED
Binary files a/attribute_ruler/patterns and b/attribute_ruler/patterns differ
config.cfg CHANGED
@@ -27,7 +27,7 @@ validate = false
27
 
28
  [components.lemmatizer]
29
  factory = "lemmatizer"
30
- mode = "pymorphy2"
31
  model = null
32
  overwrite = false
33
  scorer = {"@scorers":"spacy.lemmatizer_scorer.v1"}
@@ -70,8 +70,8 @@ nO = null
70
  [components.ner.model.tok2vec.embed]
71
  @architectures = "spacy.MultiHashEmbed.v2"
72
  width = 96
73
- attrs = ["NORM","PREFIX","SUFFIX","SHAPE","SPACY"]
74
- rows = [5000,1000,2500,2500,50]
75
  include_static_vectors = true
76
 
77
  [components.ner.model.tok2vec.encode]
@@ -139,8 +139,8 @@ factory = "tok2vec"
139
  [components.tok2vec.model.embed]
140
  @architectures = "spacy.MultiHashEmbed.v2"
141
  width = ${components.tok2vec.model.encode:width}
142
- attrs = ["NORM","PREFIX","SUFFIX","SHAPE","SPACY"]
143
- rows = [5000,1000,2500,2500,50]
144
  include_static_vectors = true
145
 
146
  [components.tok2vec.model.encode]
@@ -182,6 +182,7 @@ eval_frequency = 1000
182
  frozen_components = []
183
  before_to_disk = null
184
  annotating_components = []
 
185
 
186
  [training.batcher]
187
  @batchers = "spacy.batch_by_words.v1"
27
 
28
  [components.lemmatizer]
29
  factory = "lemmatizer"
30
+ mode = "pymorphy3"
31
  model = null
32
  overwrite = false
33
  scorer = {"@scorers":"spacy.lemmatizer_scorer.v1"}
70
  [components.ner.model.tok2vec.embed]
71
  @architectures = "spacy.MultiHashEmbed.v2"
72
  width = 96
73
+ attrs = ["NORM","PREFIX","SUFFIX","SHAPE"]
74
+ rows = [5000,1000,2500,2500]
75
  include_static_vectors = true
76
 
77
  [components.ner.model.tok2vec.encode]
139
  [components.tok2vec.model.embed]
140
  @architectures = "spacy.MultiHashEmbed.v2"
141
  width = ${components.tok2vec.model.encode:width}
142
+ attrs = ["NORM","PREFIX","SUFFIX","SHAPE","SPACY","IS_SPACE"]
143
+ rows = [5000,1000,2500,2500,50,50]
144
  include_static_vectors = true
145
 
146
  [components.tok2vec.model.encode]
182
  frozen_components = []
183
  before_to_disk = null
184
  annotating_components = []
185
+ before_update = null
186
 
187
  [training.batcher]
188
  @batchers = "spacy.batch_by_words.v1"
meta.json CHANGED
@@ -1,14 +1,14 @@
1
  {
2
  "lang":"ru",
3
  "name":"core_news_lg",
4
- "version":"3.4.0",
5
  "description":"Russian pipeline optimized for CPU. Components: tok2vec, morphologizer, parser, senter, ner, attribute_ruler, lemmatizer.",
6
  "author":"Explosion",
7
  "email":"contact@explosion.ai",
8
  "url":"https://explosion.ai",
9
  "license":"MIT",
10
- "spacy_version":">=3.4.0,<3.5.0",
11
- "spacy_git_version":"dd038b536",
12
  "vectors":{
13
  "width":300,
14
  "vectors":500002,
@@ -953,70 +953,70 @@
953
  "senter"
954
  ],
955
  "performance":{
956
- "token_acc":0.9984047451,
957
- "token_p":0.9727635194,
958
- "token_r":0.9831678569,
959
- "token_f":0.9779380158,
960
- "pos_acc":0.9889933439,
961
- "morph_acc":0.9747833538,
962
- "morph_micro_p":0.9896991632,
963
- "morph_micro_r":0.9832782178,
964
- "morph_micro_f":0.9864782422,
965
  "morph_per_feat":{
966
  "Animacy":{
967
- "p":0.9896970764,
968
- "r":0.980088367,
969
- "f":0.9848692858
970
  },
971
  "Case":{
972
- "p":0.9789719626,
973
- "r":0.9722662264,
974
- "f":0.9756075718
975
  },
976
  "Gender":{
977
- "p":0.9880955025,
978
- "r":0.9819453948,
979
- "f":0.9850108489
980
  },
981
  "Number":{
982
- "p":0.9960197873,
983
- "r":0.9897728557,
984
- "f":0.9928864957
985
  },
986
  "Degree":{
987
- "p":0.9885778967,
988
- "r":0.9863449692,
989
- "f":0.9874601706
990
  },
991
  "Aspect":{
992
- "p":0.9905277402,
993
- "r":0.9869662921,
994
- "f":0.9887438091
995
  },
996
  "Mood":{
997
- "p":0.9986340494,
998
- "r":0.9970245475,
999
- "f":0.9978286494
1000
  },
1001
  "Tense":{
1002
- "p":0.9932989691,
1003
- "r":0.9896261298,
1004
- "f":0.991459148
1005
  },
1006
  "VerbForm":{
1007
- "p":0.9952187641,
1008
- "r":0.9916404494,
1009
- "f":0.9934263845
1010
  },
1011
  "Voice":{
1012
- "p":0.9910690122,
1013
- "r":0.987505618,
1014
- "f":0.9892841063
1015
  },
1016
  "StyleVariant":{
1017
- "p":0.9931170108,
1018
- "r":0.9960552268,
1019
- "f":0.9945839488
1020
  },
1021
  "Polarity":{
1022
  "p":1.0,
@@ -1024,14 +1024,14 @@
1024
  "f":1.0
1025
  },
1026
  "Person":{
1027
- "p":0.9997729852,
1028
- "r":0.9934581547,
1029
- "f":0.9966055669
1030
  },
1031
  "Foreign":{
1032
- "p":0.9700483092,
1033
- "r":0.8685121107,
1034
- "f":0.9164764948
1035
  },
1036
  "Hyph":{
1037
  "p":0.0,
@@ -1039,186 +1039,186 @@
1039
  "f":0.0
1040
  }
1041
  },
1042
- "sents_p":0.9986684421,
1043
- "sents_r":0.9988584475,
1044
- "sents_f":0.9987634357,
1045
- "dep_uas":0.9630346126,
1046
- "dep_las":0.9520673253,
1047
  "dep_las_per_type":{
1048
  "case":{
1049
- "p":0.9938650307,
1050
- "r":0.9893826928,
1051
- "f":0.9916187965
1052
  },
1053
  "parataxis":{
1054
- "p":0.878342246,
1055
- "r":0.8499353169,
1056
- "f":0.8639053254
1057
  },
1058
  "nmod":{
1059
- "p":0.9342683497,
1060
- "r":0.9280208043,
1061
- "f":0.9311340975
1062
  },
1063
  "advmod":{
1064
- "p":0.9611451943,
1065
- "r":0.9530246705,
1066
- "f":0.9570677074
1067
  },
1068
  "obl":{
1069
- "p":0.9446489434,
1070
- "r":0.9377452971,
1071
- "f":0.9411844607
1072
  },
1073
  "amod":{
1074
- "p":0.9890609462,
1075
- "r":0.9844457014,
1076
- "f":0.9867479271
1077
  },
1078
  "nsubj":{
1079
- "p":0.9695295232,
1080
- "r":0.9696826149,
1081
- "f":0.969606063
1082
  },
1083
  "root":{
1084
- "p":0.9899066844,
1085
- "r":0.9889649924,
1086
- "f":0.9894356144
1087
  },
1088
  "xcomp":{
1089
- "p":0.9630188679,
1090
- "r":0.9696048632,
1091
- "f":0.9663006437
1092
  },
1093
  "conj":{
1094
- "p":0.8997961957,
1095
- "r":0.9090597117,
1096
- "f":0.9044042335
1097
  },
1098
  "cc":{
1099
- "p":0.9761235955,
1100
- "r":0.9752104771,
1101
- "f":0.9756668226
1102
  },
1103
  "fixed":{
1104
- "p":0.9860228717,
1105
- "r":0.9872773537,
1106
- "f":0.9866497139
1107
  },
1108
  "mark":{
1109
- "p":0.9674690956,
1110
- "r":0.9706266319,
1111
- "f":0.9690452916
1112
  },
1113
  "ccomp":{
1114
- "p":0.976016684,
1115
- "r":0.9790794979,
1116
- "f":0.9775456919
1117
  },
1118
  "nummod:gov":{
1119
- "p":0.9726315789,
1120
- "r":0.9625,
1121
- "f":0.967539267
1122
  },
1123
  "nummod":{
1124
- "p":0.9629310345,
1125
- "r":0.9482173175,
1126
- "f":0.9555175364
1127
  },
1128
  "obj":{
1129
- "p":0.9708791209,
1130
- "r":0.9655737705,
1131
- "f":0.9682191781
1132
  },
1133
  "det":{
1134
- "p":0.9680696662,
1135
- "r":0.9638728324,
1136
- "f":0.9659666908
1137
  },
1138
  "appos":{
1139
- "p":0.8946873531,
1140
- "r":0.8174398625,
1141
- "f":0.8543209877
1142
  },
1143
  "aux":{
1144
- "p":0.9714285714,
1145
- "r":0.9714285714,
1146
- "f":0.9714285714
1147
  },
1148
  "flat":{
1149
- "p":0.9952718676,
1150
- "r":0.9589977221,
1151
- "f":0.9767981439
1152
  },
1153
  "flat:name":{
1154
- "p":0.976016684,
1155
- "r":0.9669421488,
1156
- "f":0.9714582252
1157
  },
1158
  "iobj":{
1159
- "p":0.9184782609,
1160
- "r":0.8492462312,
1161
- "f":0.8825065274
1162
  },
1163
  "acl":{
1164
- "p":0.9164524422,
1165
- "r":0.8901373283,
1166
- "f":0.9031032299
1167
  },
1168
  "obl:agent":{
1169
- "p":0.7125,
1170
- "r":0.75,
1171
- "f":0.7307692308
1172
  },
1173
  "advcl":{
1174
- "p":0.8886310905,
1175
  "r":0.8744292237,
1176
- "f":0.8814729574
1177
  },
1178
  "cop":{
1179
- "p":0.9361702128,
1180
- "r":0.9166666667,
1181
- "f":0.9263157895
1182
  },
1183
  "flat:foreign":{
1184
- "p":0.949602122,
1185
- "r":0.8136363636,
1186
- "f":0.876376989
1187
  },
1188
  "aux:pass":{
1189
- "p":0.9884393064,
1190
- "r":0.9799426934,
1191
- "f":0.9841726619
1192
  },
1193
  "nsubj:pass":{
1194
- "p":0.9588235294,
1195
- "r":0.9518248175,
1196
- "f":0.9553113553
1197
  },
1198
  "acl:relcl":{
1199
- "p":0.8252631579,
1200
- "r":0.8049281314,
1201
- "f":0.814968815
1202
  },
1203
  "orphan":{
1204
- "p":0.78125,
1205
  "r":0.6944444444,
1206
- "f":0.7352941176
1207
  },
1208
  "discourse":{
1209
- "p":0.75,
1210
- "r":0.9230769231,
1211
- "f":0.8275862069
1212
  },
1213
  "csubj":{
1214
- "p":0.9705882353,
1215
- "r":0.9295774648,
1216
- "f":0.9496402878
1217
  },
1218
  "expl":{
1219
- "p":0.7894736842,
1220
  "r":0.7894736842,
1221
- "f":0.7894736842
1222
  },
1223
  "compound":{
1224
  "p":1.0,
@@ -1226,9 +1226,9 @@
1226
  "f":0.4615384615
1227
  },
1228
  "csubj:pass":{
1229
- "p":0.9,
1230
  "r":0.8181818182,
1231
- "f":0.8571428571
1232
  },
1233
  "nummod:entity":{
1234
  "p":1.0,
@@ -1241,29 +1241,29 @@
1241
  "f":0.0
1242
  }
1243
  },
1244
- "tag_acc":0.9889933439,
1245
- "lemma_acc":0.0000215292,
1246
- "ents_p":0.9520121233,
1247
- "ents_r":0.9516916344,
1248
- "ents_f":0.9518518519,
1249
  "ents_per_type":{
1250
  "PER":{
1251
- "p":0.9595278246,
1252
- "r":0.9584503088,
1253
- "f":0.958988764
1254
  },
1255
  "LOC":{
1256
- "p":0.9754485364,
1257
- "r":0.9759093056,
1258
- "f":0.9756788666
1259
  },
1260
  "ORG":{
1261
- "p":0.9211557297,
1262
- "r":0.9207048458,
1263
- "f":0.9209302326
1264
  }
1265
  },
1266
- "speed":3393.7960657989
1267
  },
1268
  "sources":[
1269
  {
@@ -1280,6 +1280,6 @@
1280
  }
1281
  ],
1282
  "requirements":[
1283
- "pymorphy2>=0.9"
1284
  ]
1285
  }
1
  {
2
  "lang":"ru",
3
  "name":"core_news_lg",
4
+ "version":"3.5.0",
5
  "description":"Russian pipeline optimized for CPU. Components: tok2vec, morphologizer, parser, senter, ner, attribute_ruler, lemmatizer.",
6
  "author":"Explosion",
7
  "email":"contact@explosion.ai",
8
  "url":"https://explosion.ai",
9
  "license":"MIT",
10
+ "spacy_version":">=3.5.0,<3.6.0",
11
+ "spacy_git_version":"9e0322de1",
12
  "vectors":{
13
  "width":300,
14
  "vectors":500002,
953
  "senter"
954
  ],
955
  "performance":{
956
+ "token_acc":0.9968038482,
957
+ "token_p":0.9727525387,
958
+ "token_r":0.9831462495,
959
+ "token_f":0.9779217779,
960
+ "pos_acc":0.989280677,
961
+ "morph_acc":0.9749177029,
962
+ "morph_micro_p":0.9897327316,
963
+ "morph_micro_r":0.9829975554,
964
+ "morph_micro_f":0.9863536461,
965
  "morph_per_feat":{
966
  "Animacy":{
967
+ "p":0.9905472053,
968
+ "r":0.9808150689,
969
+ "f":0.9856571145
970
  },
971
  "Case":{
972
+ "p":0.9776694449,
973
+ "r":0.9709944443,
974
+ "f":0.9743205122
975
  },
976
  "Gender":{
977
+ "p":0.9884699976,
978
+ "r":0.982055753,
979
+ "f":0.9852524358
980
  },
981
  "Number":{
982
+ "p":0.9958673769,
983
+ "r":0.9894338343,
984
+ "f":0.9926401814
985
  },
986
  "Degree":{
987
+ "p":0.9884927566,
988
+ "r":0.9877823409,
989
+ "f":0.988137421
990
  },
991
  "Aspect":{
992
+ "p":0.9913263462,
993
+ "r":0.986247191,
994
+ "f":0.988780246
995
  },
996
  "Mood":{
997
+ "p":0.9990060877,
998
+ "r":0.9969005703,
999
+ "f":0.9979522184
1000
  },
1001
  "Tense":{
1002
+ "p":0.99442264,
1003
+ "r":0.9889071487,
1004
+ "f":0.9916572253
1005
  },
1006
  "VerbForm":{
1007
+ "p":0.9958438742,
1008
+ "r":0.990741573,
1009
+ "f":0.9932861713
1010
  },
1011
  "Voice":{
1012
+ "p":0.9914166968,
1013
+ "r":0.9863370787,
1014
+ "f":0.9888703645
1015
  },
1016
  "StyleVariant":{
1017
+ "p":0.989194499,
1018
+ "r":0.9930966469,
1019
+ "f":0.9911417323
1020
  },
1021
  "Polarity":{
1022
  "p":1.0,
1024
  "f":1.0
1025
  },
1026
  "Person":{
1027
+ "p":0.9995459705,
1028
+ "r":0.9932325739,
1029
+ "f":0.9963792713
1030
  },
1031
  "Foreign":{
1032
+ "p":0.9711260828,
1033
+ "r":0.8728373702,
1034
+ "f":0.9193621868
1035
  },
1036
  "Hyph":{
1037
  "p":0.0,
1039
  "f":0.0
1040
  }
1041
  },
1042
+ "sents_p":0.9986679353,
1043
+ "sents_r":0.99847793,
1044
+ "sents_f":0.9985729236,
1045
+ "dep_uas":0.962198055,
1046
+ "dep_las":0.9511948091,
1047
  "dep_las_per_type":{
1048
  "case":{
1049
+ "p":0.9918025064,
1050
+ "r":0.989006859,
1051
+ "f":0.9904027098
1052
  },
1053
  "parataxis":{
1054
+ "p":0.8842034806,
1055
+ "r":0.8544631307,
1056
+ "f":0.8690789474
1057
  },
1058
  "nmod":{
1059
+ "p":0.9328846513,
1060
+ "r":0.9269062877,
1061
+ "f":0.9298858607
1062
  },
1063
  "advmod":{
1064
+ "p":0.9554118448,
1065
+ "r":0.9486312944,
1066
+ "f":0.9520094964
1067
  },
1068
  "obl":{
1069
+ "p":0.9425224734,
1070
+ "r":0.9365272703,
1071
+ "f":0.9395153079
1072
  },
1073
  "amod":{
1074
+ "p":0.9893299189,
1075
+ "r":0.9833144796,
1076
+ "f":0.9863130274
1077
  },
1078
  "nsubj":{
1079
+ "p":0.9722486521,
1080
+ "r":0.9681035844,
1081
+ "f":0.9701716908
1082
  },
1083
  "root":{
1084
+ "p":0.9893313012,
1085
+ "r":0.9880136986,
1086
+ "f":0.9886720609
1087
  },
1088
  "xcomp":{
1089
+ "p":0.9570135747,
1090
+ "r":0.9642857143,
1091
+ "f":0.9606358819
1092
  },
1093
  "conj":{
1094
+ "p":0.8906144497,
1095
+ "r":0.9052848318,
1096
+ "f":0.8978897209
1097
  },
1098
  "cc":{
1099
+ "p":0.9746597841,
1100
+ "r":0.9714686623,
1101
+ "f":0.9730616069
1102
  },
1103
  "fixed":{
1104
+ "p":0.9835025381,
1105
+ "r":0.9860050891,
1106
+ "f":0.9847522236
1107
  },
1108
  "mark":{
1109
+ "p":0.9681197137,
1110
+ "r":0.9712793734,
1111
+ "f":0.9696969697
1112
  },
1113
  "ccomp":{
1114
+ "p":0.978125,
1115
+ "r":0.9822175732,
1116
+ "f":0.9801670146
1117
  },
1118
  "nummod:gov":{
1119
+ "p":0.9684210526,
1120
+ "r":0.9583333333,
1121
+ "f":0.9633507853
1122
  },
1123
  "nummod":{
1124
+ "p":0.9664948454,
1125
+ "r":0.955008489,
1126
+ "f":0.9607173356
1127
  },
1128
  "obj":{
1129
+ "p":0.9738364087,
1130
+ "r":0.9661202186,
1131
+ "f":0.969962968
1132
  },
1133
  "det":{
1134
+ "p":0.976,
1135
+ "r":0.9696531792,
1136
+ "f":0.9728162378
1137
  },
1138
  "appos":{
1139
+ "p":0.8951881848,
1140
+ "r":0.8071305842,
1141
+ "f":0.8488818613
1142
  },
1143
  "aux":{
1144
+ "p":0.9619047619,
1145
+ "r":0.9619047619,
1146
+ "f":0.9619047619
1147
  },
1148
  "flat":{
1149
+ "p":0.9929411765,
1150
+ "r":0.9612756264,
1151
+ "f":0.9768518519
1152
  },
1153
  "flat:name":{
1154
+ "p":0.9759665622,
1155
+ "r":0.9648760331,
1156
+ "f":0.9703896104
1157
  },
1158
  "iobj":{
1159
+ "p":0.9176788124,
1160
+ "r":0.8542713568,
1161
+ "f":0.8848405986
1162
  },
1163
  "acl":{
1164
+ "p":0.9232769831,
1165
+ "r":0.88639201,
1166
+ "f":0.9044585987
1167
  },
1168
  "obl:agent":{
1169
+ "p":0.7792207792,
1170
+ "r":0.7894736842,
1171
+ "f":0.7843137255
1172
  },
1173
  "advcl":{
1174
+ "p":0.8665158371,
1175
  "r":0.8744292237,
1176
+ "f":0.8704545455
1177
  },
1178
  "cop":{
1179
+ "p":0.9246575342,
1180
+ "r":0.9375,
1181
+ "f":0.9310344828
1182
  },
1183
  "flat:foreign":{
1184
+ "p":0.963060686,
1185
+ "r":0.8295454545,
1186
+ "f":0.8913308913
1187
  },
1188
  "aux:pass":{
1189
+ "p":0.9913294798,
1190
+ "r":0.9828080229,
1191
+ "f":0.9870503597
1192
  },
1193
  "nsubj:pass":{
1194
+ "p":0.9505813953,
1195
+ "r":0.9547445255,
1196
+ "f":0.9526584122
1197
  },
1198
  "acl:relcl":{
1199
+ "p":0.8177966102,
1200
+ "r":0.7926078029,
1201
+ "f":0.8050052138
1202
  },
1203
  "orphan":{
1204
+ "p":0.7352941176,
1205
  "r":0.6944444444,
1206
+ "f":0.7142857143
1207
  },
1208
  "discourse":{
1209
+ "p":0.9117647059,
1210
+ "r":0.9538461538,
1211
+ "f":0.9323308271
1212
  },
1213
  "csubj":{
1214
+ "p":0.964028777,
1215
+ "r":0.9436619718,
1216
+ "f":0.9537366548
1217
  },
1218
  "expl":{
1219
+ "p":0.8823529412,
1220
  "r":0.7894736842,
1221
+ "f":0.8333333333
1222
  },
1223
  "compound":{
1224
  "p":1.0,
1226
  "f":0.4615384615
1227
  },
1228
  "csubj:pass":{
1229
+ "p":0.8181818182,
1230
  "r":0.8181818182,
1231
+ "f":0.8181818182
1232
  },
1233
  "nummod:entity":{
1234
  "p":1.0,
1241
  "f":0.0
1242
  }
1243
  },
1244
+ "tag_acc":0.989280677,
1245
+ "lemma_acc":0.0000215295,
1246
+ "ents_p":0.9524209818,
1247
+ "ents_r":0.9535431745,
1248
+ "ents_f":0.9529817478,
1249
  "ents_per_type":{
1250
  "PER":{
1251
+ "p":0.9641456583,
1252
+ "r":0.9663110612,
1253
+ "f":0.9652271453
1254
  },
1255
  "LOC":{
1256
+ "p":0.9740566038,
1257
+ "r":0.9754369391,
1258
+ "f":0.9747462827
1259
  },
1260
  "ORG":{
1261
+ "p":0.9197258933,
1262
+ "r":0.9197258933,
1263
+ "f":0.9197258933
1264
  }
1265
  },
1266
+ "speed":2459.2661417009
1267
  },
1268
  "sources":[
1269
  {
1280
  }
1281
  ],
1282
  "requirements":[
1283
+ "pymorphy3>=1.0.0"
1284
  ]
1285
  }
morphologizer/model CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f863c33a7169482d14f6310893490b5fe24ad46559b5798a2aa13d6685d20083
3
  size 332570
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9f2c87e0709abfb93ecf0f0cd6699fe96e1d0b7b2e932fe8cd94db75792184f2
3
  size 332570
ner/model CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e2b969fb90be6de0016d964f0ee60706f2eea662ada8be0fcb477bda322fe94d
3
- size 6495552
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:57ad451f06a4bf3df4481e1cbadd41ac2ab565c54f00ad54048704bc82a15802
3
+ size 6365342
parser/model CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:29eef671a005be011caa904efffbf30c833ff645b59c8b0be5d001124b5b2c9d
3
  size 312369
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:55b78e21229a03b2a66256305fceefb42a4fc1f7d36305fd41106e6ea1ada13c
3
  size 312369
ru_core_news_lg-any-py3-none-any.whl CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e982fb05f90f9343c5e722758e996200c56850c566fb892ff0d87e7908180e38
3
- size 513366919
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5e76e86d4c5008296cf77c9080269908ea4097794585f6e956b3462ad5e8c037
3
+ size 513368441
senter/model CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:44d0c0bc2a42385486383f5aad47d29ef07fbe53b63d19cb3ec2a34289a47e7b
3
  size 219953
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c54de08c5e463cd9f40db227ebe0ebb153c0cfc1646b2d2b8ac74bed18120fdf
3
  size 219953
tok2vec/model CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0808477cbbbede63a990cb66bf83a08e155c06b6970d4c345ad34f5873351c6c
3
- size 6365604
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:155130b76ccce19a638c3c2464aa8b5554f6131c72e2b2b87974a00d70308250
3
+ size 6495793
tokenizer CHANGED
The diff for this file is too large to render. See raw diff
vocab/strings.json CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:80a194c976452ce9e08dcbb3e0cc44dbe4e3e55b9306749dd798b9396e9ab477
3
- size 49011229
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:967899b299d4c01affbceff241c8c8546b171c66d05a57fe8dc078c192759284
3
+ size 49011292