adrianeboyd commited on
Commit
7538d68
1 Parent(s): 7069fb2

Update spaCy pipeline

Browse files
README.md CHANGED
@@ -14,27 +14,27 @@ model-index:
14
  metrics:
15
  - name: NER Precision
16
  type: precision
17
- value: 0.754691689
18
  - name: NER Recall
19
  type: recall
20
- value: 0.7081761006
21
  - name: NER F Score
22
  type: f_score
23
- value: 0.7306943543
24
  - task:
25
  name: TAG
26
  type: token-classification
27
  metrics:
28
  - name: TAG (XPOS) Accuracy
29
  type: accuracy
30
- value: 0.9712488769
31
  - task:
32
  name: POS
33
  type: token-classification
34
  metrics:
35
  - name: POS (UPOS) Accuracy
36
  type: accuracy
37
- value: 0.9749672775
38
  - task:
39
  name: MORPH
40
  type: token-classification
@@ -55,21 +55,21 @@ model-index:
55
  metrics:
56
  - name: Unlabeled Attachment Score (UAS)
57
  type: f_score
58
- value: 0.9233540485
59
  - task:
60
  name: LABELED_DEPENDENCIES
61
  type: token-classification
62
  metrics:
63
  - name: Labeled Attachment Score (LAS)
64
  type: f_score
65
- value: 0.9101052821
66
  - task:
67
  name: SENTS
68
  type: token-classification
69
  metrics:
70
  - name: Sentences F-Score
71
  type: f_score
72
- value: 0.9658536585
73
  ---
74
  ### Details: https://spacy.io/models/ja#ja_core_news_lg
75
 
@@ -78,8 +78,8 @@ Japanese pipeline optimized for CPU. Components: tok2vec, morphologizer, parser,
78
  | Feature | Description |
79
  | --- | --- |
80
  | **Name** | `ja_core_news_lg` |
81
- | **Version** | `3.5.0` |
82
- | **spaCy** | `>=3.5.0,<3.6.0` |
83
  | **Default Pipeline** | `tok2vec`, `morphologizer`, `parser`, `attribute_ruler`, `ner` |
84
  | **Components** | `tok2vec`, `morphologizer`, `parser`, `senter`, `attribute_ruler`, `ner` |
85
  | **Vectors** | 480443 keys, 480443 unique vectors (300 dimensions) |
@@ -109,18 +109,18 @@ Japanese pipeline optimized for CPU. Components: tok2vec, morphologizer, parser,
109
  | `TOKEN_P` | 97.65 |
110
  | `TOKEN_R` | 97.90 |
111
  | `TOKEN_F` | 97.77 |
112
- | `POS_ACC` | 97.50 |
113
  | `MORPH_ACC` | 0.00 |
114
  | `MORPH_MICRO_P` | 34.01 |
115
  | `MORPH_MICRO_R` | 98.04 |
116
  | `MORPH_MICRO_F` | 50.51 |
117
- | `SENTS_P` | 95.56 |
118
- | `SENTS_R` | 97.63 |
119
- | `SENTS_F` | 96.59 |
120
- | `DEP_UAS` | 92.34 |
121
- | `DEP_LAS` | 91.01 |
122
- | `TAG_ACC` | 97.12 |
123
  | `LEMMA_ACC` | 96.71 |
124
- | `ENTS_P` | 75.47 |
125
- | `ENTS_R` | 70.82 |
126
- | `ENTS_F` | 73.07 |
 
14
  metrics:
15
  - name: NER Precision
16
  type: precision
17
+ value: 0.749661705
18
  - name: NER Recall
19
  type: recall
20
+ value: 0.6968553459
21
  - name: NER F Score
22
  type: f_score
23
+ value: 0.7222946545
24
  - task:
25
  name: TAG
26
  type: token-classification
27
  metrics:
28
  - name: TAG (XPOS) Accuracy
29
  type: accuracy
30
+ value: 0.9713305562
31
  - task:
32
  name: POS
33
  type: token-classification
34
  metrics:
35
  - name: POS (UPOS) Accuracy
36
  type: accuracy
37
+ value: 0.9730437272
38
  - task:
39
  name: MORPH
40
  type: token-classification
 
55
  metrics:
56
  - name: Unlabeled Attachment Score (UAS)
57
  type: f_score
58
+ value: 0.9221626975
59
  - task:
60
  name: LABELED_DEPENDENCIES
61
  type: token-classification
62
  metrics:
63
  - name: Labeled Attachment Score (LAS)
64
  type: f_score
65
+ value: 0.9081013
66
  - task:
67
  name: SENTS
68
  type: token-classification
69
  metrics:
70
  - name: Sentences F-Score
71
  type: f_score
72
+ value: 0.9716520039
73
  ---
74
  ### Details: https://spacy.io/models/ja#ja_core_news_lg
75
 
 
78
  | Feature | Description |
79
  | --- | --- |
80
  | **Name** | `ja_core_news_lg` |
81
+ | **Version** | `3.6.0` |
82
+ | **spaCy** | `>=3.6.0,<3.7.0` |
83
  | **Default Pipeline** | `tok2vec`, `morphologizer`, `parser`, `attribute_ruler`, `ner` |
84
  | **Components** | `tok2vec`, `morphologizer`, `parser`, `senter`, `attribute_ruler`, `ner` |
85
  | **Vectors** | 480443 keys, 480443 unique vectors (300 dimensions) |
 
109
  | `TOKEN_P` | 97.65 |
110
  | `TOKEN_R` | 97.90 |
111
  | `TOKEN_F` | 97.77 |
112
+ | `POS_ACC` | 97.30 |
113
  | `MORPH_ACC` | 0.00 |
114
  | `MORPH_MICRO_P` | 34.01 |
115
  | `MORPH_MICRO_R` | 98.04 |
116
  | `MORPH_MICRO_F` | 50.51 |
117
+ | `SENTS_P` | 96.32 |
118
+ | `SENTS_R` | 98.03 |
119
+ | `SENTS_F` | 97.17 |
120
+ | `DEP_UAS` | 92.22 |
121
+ | `DEP_LAS` | 90.81 |
122
+ | `TAG_ACC` | 97.13 |
123
  | `LEMMA_ACC` | 96.71 |
124
+ | `ENTS_P` | 74.97 |
125
+ | `ENTS_R` | 69.69 |
126
+ | `ENTS_F` | 72.23 |
accuracy.json CHANGED
@@ -3,7 +3,7 @@
3
  "token_p": 0.9764591282,
4
  "token_r": 0.9790021974,
5
  "token_f": 0.9777290092,
6
- "pos_acc": 0.9749672775,
7
  "morph_acc": 0.0,
8
  "morph_micro_p": 0.3401360544,
9
  "morph_micro_r": 0.9803921569,
@@ -25,81 +25,81 @@
25
  "f": 0.0
26
  }
27
  },
28
- "sents_p": 0.9555984556,
29
- "sents_r": 0.9763313609,
30
- "sents_f": 0.9658536585,
31
- "dep_uas": 0.9233540485,
32
- "dep_las": 0.9101052821,
33
  "dep_las_per_type": {
34
  "cc": {
35
- "p": 0.7826086957,
36
- "r": 0.75,
37
- "f": 0.7659574468
38
  },
39
  "compound": {
40
- "p": 0.9399066511,
41
- "r": 0.9081172492,
42
- "f": 0.9237385321
43
  },
44
  "obl": {
45
- "p": 0.8310038119,
46
- "r": 0.8164794007,
47
- "f": 0.8236775819
48
  },
49
  "case": {
50
- "p": 0.9907940161,
51
- "r": 0.9813829787,
52
- "f": 0.9860660431
53
  },
54
  "dislocated": {
55
- "p": 0.5454545455,
56
- "r": 0.4615384615,
57
- "f": 0.5
58
  },
59
  "nsubj": {
60
- "p": 0.8359073359,
61
- "r": 0.8310940499,
62
- "f": 0.833493744
63
  },
64
  "nmod": {
65
- "p": 0.8835192069,
66
- "r": 0.8339181287,
67
- "f": 0.8580024067
68
  },
69
  "root": {
70
- "p": 0.9569471624,
71
  "r": 0.9644970414,
72
- "f": 0.9607072692
73
  },
74
  "aux": {
75
- "p": 0.9796672828,
76
- "r": 0.9842154132,
77
- "f": 0.9819360815
78
  },
79
  "advcl": {
80
- "p": 0.6888888889,
81
- "r": 0.6966292135,
82
- "f": 0.6927374302
83
  },
84
  "mark": {
85
- "p": 0.9777777778,
86
- "r": 0.968,
87
- "f": 0.9728643216
88
  },
89
  "fixed": {
90
- "p": 0.9621621622,
91
- "r": 0.9709090909,
92
- "f": 0.9665158371
93
  },
94
  "acl": {
95
- "p": 0.8422222222,
96
- "r": 0.832967033,
97
- "f": 0.8375690608
98
  },
99
  "obj": {
100
- "p": 0.9476923077,
101
- "r": 0.9305135952,
102
- "f": 0.9390243902
103
  },
104
  "nummod": {
105
  "p": 0.9805194805,
@@ -107,34 +107,34 @@
107
  "f": 0.9349845201
108
  },
109
  "advmod": {
110
- "p": 0.6739130435,
111
- "r": 0.6642857143,
112
- "f": 0.6690647482
113
  },
114
  "amod": {
115
- "p": 0.8709677419,
116
  "r": 0.7297297297,
117
- "f": 0.7941176471
118
  },
119
  "cop": {
120
- "p": 0.9640718563,
121
- "r": 0.9360465116,
122
- "f": 0.9498525074
123
  },
124
  "ccomp": {
125
- "p": 1.0,
126
- "r": 0.9545454545,
127
- "f": 0.976744186
128
  },
129
  "det": {
130
- "p": 1.0,
131
- "r": 0.9811320755,
132
- "f": 0.9904761905
133
  },
134
  "csubj": {
135
- "p": 0.6153846154,
136
- "r": 0.6666666667,
137
- "f": 0.64
138
  },
139
  "dep": {
140
  "p": 0.25,
@@ -142,101 +142,101 @@
142
  "f": 0.1818181818
143
  }
144
  },
145
- "tag_acc": 0.9712488769,
146
  "lemma_acc": 0.9670526831,
147
- "ents_p": 0.754691689,
148
- "ents_r": 0.7081761006,
149
- "ents_f": 0.7306943543,
150
  "ents_per_type": {
151
  "DATE": {
152
- "p": 0.9363636364,
153
- "r": 0.9449541284,
154
- "f": 0.9406392694
155
  },
156
  "ORG": {
157
- "p": 0.6456692913,
158
- "r": 0.598540146,
159
- "f": 0.6212121212
160
  },
161
  "PERSON": {
162
- "p": 0.7666666667,
163
- "r": 0.8273381295,
164
- "f": 0.7958477509
165
  },
166
  "GPE": {
167
- "p": 0.7386363636,
168
  "r": 0.6914893617,
169
- "f": 0.7142857143
170
  },
171
  "TIME": {
172
- "p": 0.5,
173
  "r": 1.0,
174
- "f": 0.6666666667
175
  },
176
  "QUANTITY": {
177
- "p": 0.8923076923,
178
- "r": 0.8787878788,
179
- "f": 0.8854961832
180
  },
181
  "NORP": {
182
- "p": 0.7037037037,
183
  "r": 0.59375,
184
- "f": 0.6440677966
185
  },
186
  "TITLE_AFFIX": {
187
- "p": 0.8,
188
- "r": 0.6666666667,
189
- "f": 0.7272727273
190
  },
191
  "ORDINAL": {
192
- "p": 0.5652173913,
193
- "r": 0.5909090909,
194
- "f": 0.5777777778
195
  },
196
  "WORK_OF_ART": {
197
- "p": 0.75,
198
- "r": 0.7058823529,
199
- "f": 0.7272727273
200
  },
201
  "CARDINAL": {
202
- "p": 0.5,
203
  "r": 0.5,
204
- "f": 0.5
205
  },
206
- "FAC": {
207
  "p": 0.6666666667,
208
- "r": 0.4324324324,
209
- "f": 0.5245901639
210
  },
211
  "EVENT": {
212
- "p": 0.6956521739,
213
- "r": 0.6153846154,
214
- "f": 0.6530612245
215
- },
216
- "PERCENT": {
217
- "p": 1.0,
218
- "r": 0.2857142857,
219
- "f": 0.4444444444
220
  },
221
  "LOC": {
222
- "p": 0.75,
223
- "r": 0.9,
224
- "f": 0.8181818182
225
  },
226
- "PRODUCT": {
227
- "p": 0.5384615385,
228
- "r": 0.3333333333,
229
- "f": 0.4117647059
230
  },
231
  "MOVEMENT": {
232
  "p": 0.0,
233
  "r": 0.0,
234
  "f": 0.0
235
  },
 
 
 
 
 
236
  "LAW": {
237
- "p": 1.0,
238
- "r": 0.3333333333,
239
- "f": 0.5
240
  },
241
  "MONEY": {
242
  "p": 1.0,
@@ -247,12 +247,7 @@
247
  "p": 1.0,
248
  "r": 1.0,
249
  "f": 1.0
250
- },
251
- "PET_NAME": {
252
- "p": 0.0,
253
- "r": 0.0,
254
- "f": 0.0
255
  }
256
  },
257
- "speed": 9928.6122863321
258
  }
 
3
  "token_p": 0.9764591282,
4
  "token_r": 0.9790021974,
5
  "token_f": 0.9777290092,
6
+ "pos_acc": 0.9730437272,
7
  "morph_acc": 0.0,
8
  "morph_micro_p": 0.3401360544,
9
  "morph_micro_r": 0.9803921569,
 
25
  "f": 0.0
26
  }
27
  },
28
+ "sents_p": 0.9631782946,
29
+ "sents_r": 0.9802761341,
30
+ "sents_f": 0.9716520039,
31
+ "dep_uas": 0.9221626975,
32
+ "dep_las": 0.9081013,
33
  "dep_las_per_type": {
34
  "cc": {
35
+ "p": 0.847826087,
36
+ "r": 0.8125,
37
+ "f": 0.829787234
38
  },
39
  "compound": {
40
+ "p": 0.9406976744,
41
+ "r": 0.9120631342,
42
+ "f": 0.9261591299
43
  },
44
  "obl": {
45
+ "p": 0.8122653317,
46
+ "r": 0.8102372035,
47
+ "f": 0.81125
48
  },
49
  "case": {
50
+ "p": 0.990403071,
51
+ "r": 0.9802431611,
52
+ "f": 0.9852969257
53
  },
54
  "dislocated": {
55
+ "p": 0.5882352941,
56
+ "r": 0.7692307692,
57
+ "f": 0.6666666667
58
  },
59
  "nsubj": {
60
+ "p": 0.8307392996,
61
+ "r": 0.8195777351,
62
+ "f": 0.8251207729
63
  },
64
  "nmod": {
65
+ "p": 0.8955974843,
66
+ "r": 0.832748538,
67
+ "f": 0.863030303
68
  },
69
  "root": {
70
+ "p": 0.9607072692,
71
  "r": 0.9644970414,
72
+ "f": 0.9625984252
73
  },
74
  "aux": {
75
+ "p": 0.9832713755,
76
+ "r": 0.982358403,
77
+ "f": 0.9828146772
78
  },
79
  "advcl": {
80
+ "p": 0.6614349776,
81
+ "r": 0.6629213483,
82
+ "f": 0.6621773288
83
  },
84
  "mark": {
85
+ "p": 0.9658634538,
86
+ "r": 0.962,
87
+ "f": 0.9639278557
88
  },
89
  "fixed": {
90
+ "p": 0.9550359712,
91
+ "r": 0.9654545455,
92
+ "f": 0.9602169982
93
  },
94
  "acl": {
95
+ "p": 0.8377192982,
96
+ "r": 0.8395604396,
97
+ "f": 0.8386388584
98
  },
99
  "obj": {
100
+ "p": 0.9661538462,
101
+ "r": 0.9486404834,
102
+ "f": 0.9573170732
103
  },
104
  "nummod": {
105
  "p": 0.9805194805,
 
107
  "f": 0.9349845201
108
  },
109
  "advmod": {
110
+ "p": 0.6474820144,
111
+ "r": 0.6428571429,
112
+ "f": 0.6451612903
113
  },
114
  "amod": {
115
+ "p": 0.9,
116
  "r": 0.7297297297,
117
+ "f": 0.8059701493
118
  },
119
  "cop": {
120
+ "p": 0.9467455621,
121
+ "r": 0.9302325581,
122
+ "f": 0.9384164223
123
  },
124
  "ccomp": {
125
+ "p": 0.95,
126
+ "r": 0.8636363636,
127
+ "f": 0.9047619048
128
  },
129
  "det": {
130
+ "p": 0.9807692308,
131
+ "r": 0.9622641509,
132
+ "f": 0.9714285714
133
  },
134
  "csubj": {
135
+ "p": 0.6666666667,
136
+ "r": 0.8333333333,
137
+ "f": 0.7407407407
138
  },
139
  "dep": {
140
  "p": 0.25,
 
142
  "f": 0.1818181818
143
  }
144
  },
145
+ "tag_acc": 0.9713305562,
146
  "lemma_acc": 0.9670526831,
147
+ "ents_p": 0.749661705,
148
+ "ents_r": 0.6968553459,
149
+ "ents_f": 0.7222946545,
150
  "ents_per_type": {
151
  "DATE": {
152
+ "p": 0.9459459459,
153
+ "r": 0.9633027523,
154
+ "f": 0.9545454545
155
  },
156
  "ORG": {
157
+ "p": 0.6209677419,
158
+ "r": 0.5620437956,
159
+ "f": 0.5900383142
160
  },
161
  "PERSON": {
162
+ "p": 0.7622377622,
163
+ "r": 0.7841726619,
164
+ "f": 0.7730496454
165
  },
166
  "GPE": {
167
+ "p": 0.7738095238,
168
  "r": 0.6914893617,
169
+ "f": 0.7303370787
170
  },
171
  "TIME": {
172
+ "p": 0.5714285714,
173
  "r": 1.0,
174
+ "f": 0.7272727273
175
  },
176
  "QUANTITY": {
177
+ "p": 0.921875,
178
+ "r": 0.8939393939,
179
+ "f": 0.9076923077
180
  },
181
  "NORP": {
182
+ "p": 0.6785714286,
183
  "r": 0.59375,
184
+ "f": 0.6333333333
185
  },
186
  "TITLE_AFFIX": {
187
+ "p": 0.72,
188
+ "r": 0.6,
189
+ "f": 0.6545454545
190
  },
191
  "ORDINAL": {
192
+ "p": 0.6,
193
+ "r": 0.6818181818,
194
+ "f": 0.6382978723
195
  },
196
  "WORK_OF_ART": {
197
+ "p": 0.7857142857,
198
+ "r": 0.6470588235,
199
+ "f": 0.7096774194
200
  },
201
  "CARDINAL": {
202
+ "p": 1.0,
203
  "r": 0.5,
204
+ "f": 0.6666666667
205
  },
206
+ "PERCENT": {
207
  "p": 0.6666666667,
208
+ "r": 0.2857142857,
209
+ "f": 0.4
210
  },
211
  "EVENT": {
212
+ "p": 0.7894736842,
213
+ "r": 0.5769230769,
214
+ "f": 0.6666666667
 
 
 
 
 
215
  },
216
  "LOC": {
217
+ "p": 0.5333333333,
218
+ "r": 0.8,
219
+ "f": 0.64
220
  },
221
+ "FAC": {
222
+ "p": 0.5862068966,
223
+ "r": 0.4594594595,
224
+ "f": 0.5151515152
225
  },
226
  "MOVEMENT": {
227
  "p": 0.0,
228
  "r": 0.0,
229
  "f": 0.0
230
  },
231
+ "PRODUCT": {
232
+ "p": 0.5517241379,
233
+ "r": 0.380952381,
234
+ "f": 0.4507042254
235
+ },
236
  "LAW": {
237
+ "p": 0.0,
238
+ "r": 0.0,
239
+ "f": 0.0
240
  },
241
  "MONEY": {
242
  "p": 1.0,
 
247
  "p": 1.0,
248
  "r": 1.0,
249
  "f": 1.0
 
 
 
 
 
250
  }
251
  },
252
+ "speed": 8423.8901639919
253
  }
ja_core_news_lg-any-py3-none-any.whl CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:457d095ddd2243b4546fa5188a9ebd1ac622ba1178ecf0d8517b7334241b4c2c
3
- size 555256203
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:db8020348eb16bd4ce01db1a0dcde65b40f7c95c7aa6235d501f0801ca0eb556
3
+ size 555248990
meta.json CHANGED
@@ -1,14 +1,14 @@
1
  {
2
  "lang":"ja",
3
  "name":"core_news_lg",
4
- "version":"3.5.0",
5
  "description":"Japanese pipeline optimized for CPU. Components: tok2vec, morphologizer, parser, senter, ner, attribute_ruler.",
6
  "author":"Explosion",
7
  "email":"contact@explosion.ai",
8
  "url":"https://explosion.ai",
9
  "license":"CC BY-SA 4.0",
10
- "spacy_version":">=3.5.0,<3.6.0",
11
- "spacy_git_version":"9e0322de1",
12
  "vectors":{
13
  "width":300,
14
  "vectors":480443,
@@ -117,7 +117,7 @@
117
  "token_p":0.9764591282,
118
  "token_r":0.9790021974,
119
  "token_f":0.9777290092,
120
- "pos_acc":0.9749672775,
121
  "morph_acc":0.0,
122
  "morph_micro_p":0.3401360544,
123
  "morph_micro_r":0.9803921569,
@@ -139,81 +139,81 @@
139
  "f":0.0
140
  }
141
  },
142
- "sents_p":0.9555984556,
143
- "sents_r":0.9763313609,
144
- "sents_f":0.9658536585,
145
- "dep_uas":0.9233540485,
146
- "dep_las":0.9101052821,
147
  "dep_las_per_type":{
148
  "cc":{
149
- "p":0.7826086957,
150
- "r":0.75,
151
- "f":0.7659574468
152
  },
153
  "compound":{
154
- "p":0.9399066511,
155
- "r":0.9081172492,
156
- "f":0.9237385321
157
  },
158
  "obl":{
159
- "p":0.8310038119,
160
- "r":0.8164794007,
161
- "f":0.8236775819
162
  },
163
  "case":{
164
- "p":0.9907940161,
165
- "r":0.9813829787,
166
- "f":0.9860660431
167
  },
168
  "dislocated":{
169
- "p":0.5454545455,
170
- "r":0.4615384615,
171
- "f":0.5
172
  },
173
  "nsubj":{
174
- "p":0.8359073359,
175
- "r":0.8310940499,
176
- "f":0.833493744
177
  },
178
  "nmod":{
179
- "p":0.8835192069,
180
- "r":0.8339181287,
181
- "f":0.8580024067
182
  },
183
  "root":{
184
- "p":0.9569471624,
185
  "r":0.9644970414,
186
- "f":0.9607072692
187
  },
188
  "aux":{
189
- "p":0.9796672828,
190
- "r":0.9842154132,
191
- "f":0.9819360815
192
  },
193
  "advcl":{
194
- "p":0.6888888889,
195
- "r":0.6966292135,
196
- "f":0.6927374302
197
  },
198
  "mark":{
199
- "p":0.9777777778,
200
- "r":0.968,
201
- "f":0.9728643216
202
  },
203
  "fixed":{
204
- "p":0.9621621622,
205
- "r":0.9709090909,
206
- "f":0.9665158371
207
  },
208
  "acl":{
209
- "p":0.8422222222,
210
- "r":0.832967033,
211
- "f":0.8375690608
212
  },
213
  "obj":{
214
- "p":0.9476923077,
215
- "r":0.9305135952,
216
- "f":0.9390243902
217
  },
218
  "nummod":{
219
  "p":0.9805194805,
@@ -221,34 +221,34 @@
221
  "f":0.9349845201
222
  },
223
  "advmod":{
224
- "p":0.6739130435,
225
- "r":0.6642857143,
226
- "f":0.6690647482
227
  },
228
  "amod":{
229
- "p":0.8709677419,
230
  "r":0.7297297297,
231
- "f":0.7941176471
232
  },
233
  "cop":{
234
- "p":0.9640718563,
235
- "r":0.9360465116,
236
- "f":0.9498525074
237
  },
238
  "ccomp":{
239
- "p":1.0,
240
- "r":0.9545454545,
241
- "f":0.976744186
242
  },
243
  "det":{
244
- "p":1.0,
245
- "r":0.9811320755,
246
- "f":0.9904761905
247
  },
248
  "csubj":{
249
- "p":0.6153846154,
250
- "r":0.6666666667,
251
- "f":0.64
252
  },
253
  "dep":{
254
  "p":0.25,
@@ -256,101 +256,101 @@
256
  "f":0.1818181818
257
  }
258
  },
259
- "tag_acc":0.9712488769,
260
  "lemma_acc":0.9670526831,
261
- "ents_p":0.754691689,
262
- "ents_r":0.7081761006,
263
- "ents_f":0.7306943543,
264
  "ents_per_type":{
265
  "DATE":{
266
- "p":0.9363636364,
267
- "r":0.9449541284,
268
- "f":0.9406392694
269
  },
270
  "ORG":{
271
- "p":0.6456692913,
272
- "r":0.598540146,
273
- "f":0.6212121212
274
  },
275
  "PERSON":{
276
- "p":0.7666666667,
277
- "r":0.8273381295,
278
- "f":0.7958477509
279
  },
280
  "GPE":{
281
- "p":0.7386363636,
282
  "r":0.6914893617,
283
- "f":0.7142857143
284
  },
285
  "TIME":{
286
- "p":0.5,
287
  "r":1.0,
288
- "f":0.6666666667
289
  },
290
  "QUANTITY":{
291
- "p":0.8923076923,
292
- "r":0.8787878788,
293
- "f":0.8854961832
294
  },
295
  "NORP":{
296
- "p":0.7037037037,
297
  "r":0.59375,
298
- "f":0.6440677966
299
  },
300
  "TITLE_AFFIX":{
301
- "p":0.8,
302
- "r":0.6666666667,
303
- "f":0.7272727273
304
  },
305
  "ORDINAL":{
306
- "p":0.5652173913,
307
- "r":0.5909090909,
308
- "f":0.5777777778
309
  },
310
  "WORK_OF_ART":{
311
- "p":0.75,
312
- "r":0.7058823529,
313
- "f":0.7272727273
314
  },
315
  "CARDINAL":{
316
- "p":0.5,
317
  "r":0.5,
318
- "f":0.5
319
  },
320
- "FAC":{
321
  "p":0.6666666667,
322
- "r":0.4324324324,
323
- "f":0.5245901639
324
  },
325
  "EVENT":{
326
- "p":0.6956521739,
327
- "r":0.6153846154,
328
- "f":0.6530612245
329
- },
330
- "PERCENT":{
331
- "p":1.0,
332
- "r":0.2857142857,
333
- "f":0.4444444444
334
  },
335
  "LOC":{
336
- "p":0.75,
337
- "r":0.9,
338
- "f":0.8181818182
339
  },
340
- "PRODUCT":{
341
- "p":0.5384615385,
342
- "r":0.3333333333,
343
- "f":0.4117647059
344
  },
345
  "MOVEMENT":{
346
  "p":0.0,
347
  "r":0.0,
348
  "f":0.0
349
  },
 
 
 
 
 
350
  "LAW":{
351
- "p":1.0,
352
- "r":0.3333333333,
353
- "f":0.5
354
  },
355
  "MONEY":{
356
  "p":1.0,
@@ -361,14 +361,9 @@
361
  "p":1.0,
362
  "r":1.0,
363
  "f":1.0
364
- },
365
- "PET_NAME":{
366
- "p":0.0,
367
- "r":0.0,
368
- "f":0.0
369
  }
370
  },
371
- "speed":9928.6122863321
372
  },
373
  "sources":[
374
  {
 
1
  {
2
  "lang":"ja",
3
  "name":"core_news_lg",
4
+ "version":"3.6.0",
5
  "description":"Japanese pipeline optimized for CPU. Components: tok2vec, morphologizer, parser, senter, ner, attribute_ruler.",
6
  "author":"Explosion",
7
  "email":"contact@explosion.ai",
8
  "url":"https://explosion.ai",
9
  "license":"CC BY-SA 4.0",
10
+ "spacy_version":">=3.6.0,<3.7.0",
11
+ "spacy_git_version":"cb4fdc83e",
12
  "vectors":{
13
  "width":300,
14
  "vectors":480443,
 
117
  "token_p":0.9764591282,
118
  "token_r":0.9790021974,
119
  "token_f":0.9777290092,
120
+ "pos_acc":0.9730437272,
121
  "morph_acc":0.0,
122
  "morph_micro_p":0.3401360544,
123
  "morph_micro_r":0.9803921569,
 
139
  "f":0.0
140
  }
141
  },
142
+ "sents_p":0.9631782946,
143
+ "sents_r":0.9802761341,
144
+ "sents_f":0.9716520039,
145
+ "dep_uas":0.9221626975,
146
+ "dep_las":0.9081013,
147
  "dep_las_per_type":{
148
  "cc":{
149
+ "p":0.847826087,
150
+ "r":0.8125,
151
+ "f":0.829787234
152
  },
153
  "compound":{
154
+ "p":0.9406976744,
155
+ "r":0.9120631342,
156
+ "f":0.9261591299
157
  },
158
  "obl":{
159
+ "p":0.8122653317,
160
+ "r":0.8102372035,
161
+ "f":0.81125
162
  },
163
  "case":{
164
+ "p":0.990403071,
165
+ "r":0.9802431611,
166
+ "f":0.9852969257
167
  },
168
  "dislocated":{
169
+ "p":0.5882352941,
170
+ "r":0.7692307692,
171
+ "f":0.6666666667
172
  },
173
  "nsubj":{
174
+ "p":0.8307392996,
175
+ "r":0.8195777351,
176
+ "f":0.8251207729
177
  },
178
  "nmod":{
179
+ "p":0.8955974843,
180
+ "r":0.832748538,
181
+ "f":0.863030303
182
  },
183
  "root":{
184
+ "p":0.9607072692,
185
  "r":0.9644970414,
186
+ "f":0.9625984252
187
  },
188
  "aux":{
189
+ "p":0.9832713755,
190
+ "r":0.982358403,
191
+ "f":0.9828146772
192
  },
193
  "advcl":{
194
+ "p":0.6614349776,
195
+ "r":0.6629213483,
196
+ "f":0.6621773288
197
  },
198
  "mark":{
199
+ "p":0.9658634538,
200
+ "r":0.962,
201
+ "f":0.9639278557
202
  },
203
  "fixed":{
204
+ "p":0.9550359712,
205
+ "r":0.9654545455,
206
+ "f":0.9602169982
207
  },
208
  "acl":{
209
+ "p":0.8377192982,
210
+ "r":0.8395604396,
211
+ "f":0.8386388584
212
  },
213
  "obj":{
214
+ "p":0.9661538462,
215
+ "r":0.9486404834,
216
+ "f":0.9573170732
217
  },
218
  "nummod":{
219
  "p":0.9805194805,
 
221
  "f":0.9349845201
222
  },
223
  "advmod":{
224
+ "p":0.6474820144,
225
+ "r":0.6428571429,
226
+ "f":0.6451612903
227
  },
228
  "amod":{
229
+ "p":0.9,
230
  "r":0.7297297297,
231
+ "f":0.8059701493
232
  },
233
  "cop":{
234
+ "p":0.9467455621,
235
+ "r":0.9302325581,
236
+ "f":0.9384164223
237
  },
238
  "ccomp":{
239
+ "p":0.95,
240
+ "r":0.8636363636,
241
+ "f":0.9047619048
242
  },
243
  "det":{
244
+ "p":0.9807692308,
245
+ "r":0.9622641509,
246
+ "f":0.9714285714
247
  },
248
  "csubj":{
249
+ "p":0.6666666667,
250
+ "r":0.8333333333,
251
+ "f":0.7407407407
252
  },
253
  "dep":{
254
  "p":0.25,
 
256
  "f":0.1818181818
257
  }
258
  },
259
+ "tag_acc":0.9713305562,
260
  "lemma_acc":0.9670526831,
261
+ "ents_p":0.749661705,
262
+ "ents_r":0.6968553459,
263
+ "ents_f":0.7222946545,
264
  "ents_per_type":{
265
  "DATE":{
266
+ "p":0.9459459459,
267
+ "r":0.9633027523,
268
+ "f":0.9545454545
269
  },
270
  "ORG":{
271
+ "p":0.6209677419,
272
+ "r":0.5620437956,
273
+ "f":0.5900383142
274
  },
275
  "PERSON":{
276
+ "p":0.7622377622,
277
+ "r":0.7841726619,
278
+ "f":0.7730496454
279
  },
280
  "GPE":{
281
+ "p":0.7738095238,
282
  "r":0.6914893617,
283
+ "f":0.7303370787
284
  },
285
  "TIME":{
286
+ "p":0.5714285714,
287
  "r":1.0,
288
+ "f":0.7272727273
289
  },
290
  "QUANTITY":{
291
+ "p":0.921875,
292
+ "r":0.8939393939,
293
+ "f":0.9076923077
294
  },
295
  "NORP":{
296
+ "p":0.6785714286,
297
  "r":0.59375,
298
+ "f":0.6333333333
299
  },
300
  "TITLE_AFFIX":{
301
+ "p":0.72,
302
+ "r":0.6,
303
+ "f":0.6545454545
304
  },
305
  "ORDINAL":{
306
+ "p":0.6,
307
+ "r":0.6818181818,
308
+ "f":0.6382978723
309
  },
310
  "WORK_OF_ART":{
311
+ "p":0.7857142857,
312
+ "r":0.6470588235,
313
+ "f":0.7096774194
314
  },
315
  "CARDINAL":{
316
+ "p":1.0,
317
  "r":0.5,
318
+ "f":0.6666666667
319
  },
320
+ "PERCENT":{
321
  "p":0.6666666667,
322
+ "r":0.2857142857,
323
+ "f":0.4
324
  },
325
  "EVENT":{
326
+ "p":0.7894736842,
327
+ "r":0.5769230769,
328
+ "f":0.6666666667
 
 
 
 
 
329
  },
330
  "LOC":{
331
+ "p":0.5333333333,
332
+ "r":0.8,
333
+ "f":0.64
334
  },
335
+ "FAC":{
336
+ "p":0.5862068966,
337
+ "r":0.4594594595,
338
+ "f":0.5151515152
339
  },
340
  "MOVEMENT":{
341
  "p":0.0,
342
  "r":0.0,
343
  "f":0.0
344
  },
345
+ "PRODUCT":{
346
+ "p":0.5517241379,
347
+ "r":0.380952381,
348
+ "f":0.4507042254
349
+ },
350
  "LAW":{
351
+ "p":0.0,
352
+ "r":0.0,
353
+ "f":0.0
354
  },
355
  "MONEY":{
356
  "p":1.0,
 
361
  "p":1.0,
362
  "r":1.0,
363
  "f":1.0
 
 
 
 
 
364
  }
365
  },
366
+ "speed":8423.8901639919
367
  },
368
  "sources":[
369
  {
morphologizer/cfg CHANGED
@@ -1,5 +1,6 @@
1
  {
2
  "extend":true,
 
3
  "labels_morph":{
4
  "POS=NOUN":"",
5
  "POS=ADP":"",
 
1
  {
2
  "extend":true,
3
+ "label_smoothing":0.0,
4
  "labels_morph":{
5
  "POS=NOUN":"",
6
  "POS=ADP":"",
morphologizer/model CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c8d23551cf53ffa3585e26fc8e06d3e3a7265b8ad7a73f8a63b8eee2bf42f78b
3
  size 8189
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ba73a5fc52c85cdae9dc748b9c766dc9eeb6d942ea37d356696ba4022ef6f427
3
  size 8189
ner/model CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:58802755429b2dc7306702fa82fe1c85080c286173b95fa1afed63bde43c2403
3
  size 6385103
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a1d7f76c9f06478c318b77405f45c9985bc96fa0b9c6457cdd125149f8515de0
3
  size 6385103
parser/model CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e216c21ed16e491746e35ff4f12cef0d1ca23442bbf6554e269fef6f6785a0c4
3
  size 299888
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2b0a2af074bd3ab6412614938c3ee3448413d2104fee916d70364ac0db9c07c5
3
  size 299888
senter/model CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9e72d004aa89e236df87ab02681650d2e964e53711fd8b20822c52fa91648c4c
3
  size 213263
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:125a7ab7d66fbd2d7b2aefd2cdc02d3954af055fe33da4a8b470141e00e9d58d
3
  size 213263
tok2vec/model CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7ad60f2fd971cbf79314623752998752df0952bde7227145ff6491777747dd08
3
  size 6365607
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:04e3b80a1c0c76e3aaa1c597fe45d6eed8585b48c8a49bd2c7ea19d3911a122f
3
  size 6365607
vocab/strings.json CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8a947c6843c5d34ba6cc46d45c3e198363bfa9f0e9385b21ec04468ebe7e810b
3
- size 15614147
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6f67c86d2bc7e7798c79b7bee36f353eecfafd604e6133471cc5409c0f22dc34
3
+ size 15613833