adrianeboyd committed on
Commit
ff7fd35
1 Parent(s): 8ea0943

Update spaCy pipeline

Browse files
README.md CHANGED
@@ -14,49 +14,49 @@ model-index:
14
  metrics:
15
  - name: TAG (XPOS) Accuracy
16
  type: accuracy
17
- value: 0.9577726218
18
  - task:
19
  name: POS
20
  type: token-classification
21
  metrics:
22
  - name: POS (UPOS) Accuracy
23
  type: accuracy
24
- value: 0.9868522815
25
  - task:
26
  name: MORPH
27
  type: token-classification
28
  metrics:
29
  - name: Morph (UFeats) Accuracy
30
  type: accuracy
31
- value: 0.9794319295
32
  - task:
33
  name: LEMMA
34
  type: token-classification
35
  metrics:
36
  - name: Lemma Accuracy
37
  type: accuracy
38
- value: 0.9122482532
39
  - task:
40
  name: UNLABELED_DEPENDENCIES
41
  type: token-classification
42
  metrics:
43
  - name: Unlabeled Attachment Score (UAS)
44
  type: f_score
45
- value: 0.946357271
46
  - task:
47
  name: LABELED_DEPENDENCIES
48
  type: token-classification
49
  metrics:
50
  - name: Labeled Attachment Score (LAS)
51
  type: f_score
52
- value: 0.9249725227
53
  - task:
54
  name: SENTS
55
  type: token-classification
56
  metrics:
57
  - name: Sentences F-Score
58
  type: f_score
59
- value: 0.9447115385
60
  ---
61
  ### Details: https://spacy.io/models/fr#fr_dep_news_trf
62
 
@@ -65,8 +65,8 @@ French transformer pipeline (camembert-base). Components: transformer, morpholog
65
  | Feature | Description |
66
  | --- | --- |
67
  | **Name** | `fr_dep_news_trf` |
68
- | **Version** | `3.4.0` |
69
- | **spaCy** | `>=3.4.0,<3.5.0` |
70
  | **Default Pipeline** | `transformer`, `morphologizer`, `parser`, `attribute_ruler`, `lemmatizer` |
71
  | **Components** | `transformer`, `morphologizer`, `parser`, `attribute_ruler`, `lemmatizer` |
72
  | **Vectors** | 0 keys, 0 unique vectors (0 dimensions) |
@@ -91,19 +91,19 @@ French transformer pipeline (camembert-base). Components: transformer, morpholog
91
 
92
  | Type | Score |
93
  | --- | --- |
94
- | `TOKEN_ACC` | 99.90 |
95
  | `TOKEN_P` | 98.44 |
96
  | `TOKEN_R` | 98.96 |
97
  | `TOKEN_F` | 98.70 |
98
- | `POS_ACC` | 98.69 |
99
- | `MORPH_ACC` | 97.94 |
100
- | `MORPH_MICRO_P` | 99.37 |
101
- | `MORPH_MICRO_R` | 99.10 |
102
- | `MORPH_MICRO_F` | 99.23 |
103
- | `SENTS_P` | 93.57 |
104
- | `SENTS_R` | 95.39 |
105
- | `SENTS_F` | 94.47 |
106
- | `DEP_UAS` | 94.64 |
107
- | `DEP_LAS` | 92.50 |
108
- | `TAG_ACC` | 95.78 |
109
- | `LEMMA_ACC` | 91.22 |
14
  metrics:
15
  - name: TAG (XPOS) Accuracy
16
  type: accuracy
17
+ value: 0.9579788605
18
  - task:
19
  name: POS
20
  type: token-classification
21
  metrics:
22
  - name: POS (UPOS) Accuracy
23
  type: accuracy
24
+ value: 0.9870585202
25
  - task:
26
  name: MORPH
27
  type: token-classification
28
  metrics:
29
  - name: Morph (UFeats) Accuracy
30
  type: accuracy
31
+ value: 0.9784491648
32
  - task:
33
  name: LEMMA
34
  type: token-classification
35
  metrics:
36
  - name: Lemma Accuracy
37
  type: accuracy
38
+ value: 0.9167694205
39
  - task:
40
  name: UNLABELED_DEPENDENCIES
41
  type: token-classification
42
  metrics:
43
  - name: Unlabeled Attachment Score (UAS)
44
  type: f_score
45
+ value: 0.9441518606
46
  - task:
47
  name: LABELED_DEPENDENCIES
48
  type: token-classification
49
  metrics:
50
  - name: Labeled Attachment Score (LAS)
51
  type: f_score
52
+ value: 0.9235307728
53
  - task:
54
  name: SENTS
55
  type: token-classification
56
  metrics:
57
  - name: Sentences F-Score
58
  type: f_score
59
+ value: 0.9410348977
60
  ---
61
  ### Details: https://spacy.io/models/fr#fr_dep_news_trf
62
 
65
  | Feature | Description |
66
  | --- | --- |
67
  | **Name** | `fr_dep_news_trf` |
68
+ | **Version** | `3.5.0` |
69
+ | **spaCy** | `>=3.5.0,<3.6.0` |
70
  | **Default Pipeline** | `transformer`, `morphologizer`, `parser`, `attribute_ruler`, `lemmatizer` |
71
  | **Components** | `transformer`, `morphologizer`, `parser`, `attribute_ruler`, `lemmatizer` |
72
  | **Vectors** | 0 keys, 0 unique vectors (0 dimensions) |
91
 
92
  | Type | Score |
93
  | --- | --- |
94
+ | `TOKEN_ACC` | 99.80 |
95
  | `TOKEN_P` | 98.44 |
96
  | `TOKEN_R` | 98.96 |
97
  | `TOKEN_F` | 98.70 |
98
+ | `POS_ACC` | 98.71 |
99
+ | `MORPH_ACC` | 97.84 |
100
+ | `MORPH_MICRO_P` | 99.36 |
101
+ | `MORPH_MICRO_R` | 99.01 |
102
+ | `MORPH_MICRO_F` | 99.19 |
103
+ | `SENTS_P` | 93.32 |
104
+ | `SENTS_R` | 94.90 |
105
+ | `SENTS_F` | 94.10 |
106
+ | `DEP_UAS` | 94.42 |
107
+ | `DEP_LAS` | 92.35 |
108
+ | `TAG_ACC` | 95.80 |
109
+ | `LEMMA_ACC` | 91.68 |
accuracy.json CHANGED
@@ -1,58 +1,58 @@
1
  {
2
- "token_acc": 0.9989751998,
3
  "token_p": 0.9844389844,
4
  "token_r": 0.9896058454,
5
  "token_f": 0.9870156531,
6
- "pos_acc": 0.9868522815,
7
- "morph_acc": 0.9794319295,
8
- "morph_micro_p": 0.9937076181,
9
- "morph_micro_r": 0.9909833069,
10
- "morph_micro_f": 0.9923435927,
11
  "morph_per_feat": {
12
  "Definite": {
13
- "p": 0.9985358712,
14
  "r": 0.995620438,
15
- "f": 0.9970760234
16
  },
17
  "Number": {
18
- "p": 0.9957533235,
19
- "r": 0.992820324,
20
- "f": 0.9942846608
21
  },
22
  "PronType": {
23
- "p": 0.9987138264,
24
- "r": 0.9936020473,
25
- "f": 0.9961513791
26
  },
27
  "Gender": {
28
- "p": 0.988974359,
29
- "r": 0.9856887299,
30
- "f": 0.987328811
31
  },
32
  "Mood": {
33
- "p": 0.9982238011,
34
- "r": 0.9982238011,
35
- "f": 0.9982238011
36
  },
37
  "Person": {
38
- "p": 0.9974779319,
39
- "r": 0.9949685535,
40
- "f": 0.9962216625
41
  },
42
  "Tense": {
43
- "p": 0.987854251,
44
- "r": 0.9969356486,
45
- "f": 0.9923741739
46
  },
47
  "VerbForm": {
48
- "p": 0.9917627677,
49
- "r": 0.9966887417,
50
- "f": 0.9942196532
51
  },
52
  "NumType": {
53
- "p": 1.0,
54
- "r": 0.9180887372,
55
- "f": 0.9572953737
56
  },
57
  "Reflex": {
58
  "p": 1.0,
@@ -60,9 +60,9 @@
60
  "f": 1.0
61
  },
62
  "Voice": {
63
- "p": 0.9327731092,
64
  "r": 0.9910714286,
65
- "f": 0.961038961
66
  },
67
  "Poss": {
68
  "p": 1.0,
@@ -75,21 +75,21 @@
75
  "f": 1.0
76
  }
77
  },
78
- "sents_p": 0.9357142857,
79
- "sents_r": 0.9538834951,
80
- "sents_f": 0.9447115385,
81
- "dep_uas": 0.946357271,
82
- "dep_las": 0.9249725227,
83
  "dep_las_per_type": {
84
  "det": {
85
- "p": 0.9887278583,
86
  "r": 0.9911218725,
87
- "f": 0.989923418
88
  },
89
  "nsubj": {
90
- "p": 0.9498806683,
91
- "r": 0.9590361446,
92
- "f": 0.9544364508
93
  },
94
  "aux:tense": {
95
  "p": 0.9609375,
@@ -97,154 +97,154 @@
97
  "f": 0.9723320158
98
  },
99
  "root": {
100
- "p": 0.9547619048,
101
- "r": 0.9733009709,
102
- "f": 0.9639423077
103
  },
104
  "obj": {
105
- "p": 0.9422492401,
106
- "r": 0.9198813056,
107
- "f": 0.9309309309
108
  },
109
  "cc": {
110
- "p": 0.9406392694,
111
- "r": 0.9493087558,
112
- "f": 0.9449541284
113
  },
114
  "case": {
115
- "p": 0.9849931787,
116
- "r": 0.9836512262,
117
- "f": 0.9843217451
118
  },
119
  "obl:mod": {
120
- "p": 0.8163265306,
121
- "r": 0.8358208955,
122
- "f": 0.8259587021
123
  },
124
  "nmod": {
125
- "p": 0.9057171515,
126
- "r": 0.9020979021,
127
- "f": 0.9039039039
128
  },
129
  "conj": {
130
- "p": 0.7557251908,
131
- "r": 0.7795275591,
132
- "f": 0.7674418605
133
  },
134
  "nummod": {
135
- "p": 0.9074074074,
136
- "r": 0.8698224852,
137
- "f": 0.8882175227
138
  },
139
  "amod": {
140
- "p": 0.9522058824,
141
- "r": 0.9435336976,
142
- "f": 0.9478499543
143
  },
144
  "acl": {
145
- "p": 0.8612716763,
146
- "r": 0.8612716763,
147
- "f": 0.8612716763
148
  },
149
  "mark": {
150
- "p": 0.9603524229,
151
- "r": 0.9603524229,
152
- "f": 0.9603524229
153
  },
154
  "xcomp": {
155
- "p": 0.9044585987,
156
- "r": 0.940397351,
157
- "f": 0.9220779221
158
  },
159
  "flat:name": {
160
- "p": 0.9622641509,
161
- "r": 0.9714285714,
162
- "f": 0.9668246445
163
  },
164
  "cop": {
165
- "p": 0.9659090909,
166
- "r": 0.9444444444,
167
- "f": 0.9550561798
168
  },
169
  "advmod": {
170
- "p": 0.9326923077,
171
- "r": 0.9122257053,
172
- "f": 0.9223454834
173
  },
174
  "obl:arg": {
175
- "p": 0.9061032864,
176
- "r": 0.8772727273,
177
- "f": 0.8914549654
178
  },
179
  "appos": {
180
- "p": 0.6785714286,
181
- "r": 0.686746988,
182
- "f": 0.6826347305
183
  },
184
  "nsubj:pass": {
185
- "p": 0.9879518072,
186
- "r": 0.9647058824,
187
- "f": 0.9761904762
188
  },
189
  "aux:pass": {
190
- "p": 0.982300885,
191
  "r": 0.9910714286,
192
- "f": 0.9866666667
193
  },
194
  "acl:relcl": {
195
- "p": 0.7954545455,
196
  "r": 0.8139534884,
197
- "f": 0.8045977011
198
  },
199
  "advcl": {
200
- "p": 0.7142857143,
201
- "r": 0.7692307692,
202
- "f": 0.7407407407
203
  },
204
  "fixed": {
205
- "p": 0.9294117647,
206
- "r": 0.79,
207
- "f": 0.8540540541
208
  },
209
  "dep": {
210
- "p": 0.2711864407,
211
  "r": 0.5517241379,
212
- "f": 0.3636363636
213
  },
214
  "expl:subj": {
215
- "p": 0.8181818182,
216
- "r": 0.84375,
217
- "f": 0.8307692308
218
  },
219
  "expl:comp": {
220
- "p": 0.7435897436,
221
- "r": 0.9666666667,
222
- "f": 0.8405797101
223
  },
224
  "expl:pass": {
225
- "p": 0.75,
226
  "r": 0.4285714286,
227
- "f": 0.5454545455
228
  },
229
  "obl:agent": {
230
- "p": 0.9285714286,
231
- "r": 0.9285714286,
232
- "f": 0.9285714286
233
  },
234
  "ccomp": {
235
- "p": 0.96,
236
  "r": 0.9411764706,
237
- "f": 0.9504950495
238
  },
239
  "parataxis": {
240
- "p": 0.6923076923,
241
  "r": 0.6428571429,
242
- "f": 0.6666666667
243
  },
244
  "iobj": {
245
- "p": 0.8235294118,
246
- "r": 0.56,
247
- "f": 0.6666666667
248
  },
249
  "nsubj:caus": {
250
  "p": 0.0,
@@ -277,9 +277,9 @@
277
  "f": 0.0
278
  },
279
  "flat:foreign": {
280
- "p": 0.5,
281
- "r": 0.1428571429,
282
- "f": 0.2222222222
283
  },
284
  "orphan": {
285
  "p": 0.0,
@@ -297,7 +297,7 @@
297
  "f": 0.0
298
  }
299
  },
300
- "tag_acc": 0.9577726218,
301
- "lemma_acc": 0.9122482532,
302
- "speed": 3069.1330090473
303
  }
1
  {
2
+ "token_acc": 0.997952498,
3
  "token_p": 0.9844389844,
4
  "token_r": 0.9896058454,
5
  "token_f": 0.9870156531,
6
+ "pos_acc": 0.9870585202,
7
+ "morph_acc": 0.9784491648,
8
+ "morph_micro_p": 0.9936410884,
9
+ "morph_micro_r": 0.9900694529,
10
+ "morph_micro_f": 0.9918520553,
11
  "morph_per_feat": {
12
  "Definite": {
13
+ "p": 0.9992673993,
14
  "r": 0.995620438,
15
+ "f": 0.997440585
16
  },
17
  "Number": {
18
+ "p": 0.9957517547,
19
+ "r": 0.9924521355,
20
+ "f": 0.9940992071
21
  },
22
  "PronType": {
23
+ "p": 0.999356085,
24
+ "r": 0.9929622521,
25
+ "f": 0.9961489089
26
  },
27
  "Gender": {
28
+ "p": 0.9876859928,
29
+ "r": 0.9838998211,
30
+ "f": 0.9857892715
31
  },
32
  "Mood": {
33
+ "p": 0.9982206406,
34
+ "r": 0.9964476021,
35
+ "f": 0.9973333333
36
  },
37
  "Person": {
38
+ "p": 0.9962121212,
39
+ "r": 0.9924528302,
40
+ "f": 0.9943289225
41
  },
42
  "Tense": {
43
+ "p": 0.9878296146,
44
+ "r": 0.9948927477,
45
+ "f": 0.9913486005
46
  },
47
  "VerbForm": {
48
+ "p": 0.9917491749,
49
+ "r": 0.9950331126,
50
+ "f": 0.9933884298
51
  },
52
  "NumType": {
53
+ "p": 0.9963235294,
54
+ "r": 0.9249146758,
55
+ "f": 0.9592920354
56
  },
57
  "Reflex": {
58
  "p": 1.0,
60
  "f": 1.0
61
  },
62
  "Voice": {
63
+ "p": 0.9652173913,
64
  "r": 0.9910714286,
65
+ "f": 0.9779735683
66
  },
67
  "Poss": {
68
  "p": 1.0,
75
  "f": 1.0
76
  }
77
  },
78
+ "sents_p": 0.9331742243,
79
+ "sents_r": 0.9490291262,
80
+ "sents_f": 0.9410348977,
81
+ "dep_uas": 0.9441518606,
82
+ "dep_las": 0.9235307728,
83
  "dep_las_per_type": {
84
  "det": {
85
+ "p": 0.9879324216,
86
  "r": 0.9911218725,
87
+ "f": 0.989524577
88
  },
89
  "nsubj": {
90
+ "p": 0.9427207637,
91
+ "r": 0.9518072289,
92
+ "f": 0.9472422062
93
  },
94
  "aux:tense": {
95
  "p": 0.9609375,
97
  "f": 0.9723320158
98
  },
99
  "root": {
100
+ "p": 0.9429928741,
101
+ "r": 0.963592233,
102
+ "f": 0.9531812725
103
  },
104
  "obj": {
105
+ "p": 0.9537037037,
106
+ "r": 0.9169139466,
107
+ "f": 0.9349470499
108
  },
109
  "cc": {
110
+ "p": 0.9539170507,
111
+ "r": 0.9539170507,
112
+ "f": 0.9539170507
113
  },
114
  "case": {
115
+ "p": 0.9863852961,
116
+ "r": 0.9870572207,
117
+ "f": 0.986721144
118
  },
119
  "obl:mod": {
120
+ "p": 0.8126888218,
121
+ "r": 0.8029850746,
122
+ "f": 0.8078078078
123
  },
124
  "nmod": {
125
+ "p": 0.8984924623,
126
+ "r": 0.8931068931,
127
+ "f": 0.8957915832
128
  },
129
  "conj": {
130
+ "p": 0.7707509881,
131
+ "r": 0.7677165354,
132
+ "f": 0.7692307692
133
  },
134
  "nummod": {
135
+ "p": 0.921686747,
136
+ "r": 0.9053254438,
137
+ "f": 0.9134328358
138
  },
139
  "amod": {
140
+ "p": 0.9611829945,
141
+ "r": 0.9471766849,
142
+ "f": 0.9541284404
143
  },
144
  "acl": {
145
+ "p": 0.8222222222,
146
+ "r": 0.8554913295,
147
+ "f": 0.8385269122
148
  },
149
  "mark": {
150
+ "p": 0.9733333333,
151
+ "r": 0.9647577093,
152
+ "f": 0.9690265487
153
  },
154
  "xcomp": {
155
+ "p": 0.898089172,
156
+ "r": 0.9337748344,
157
+ "f": 0.9155844156
158
  },
159
  "flat:name": {
160
+ "p": 0.9363636364,
161
+ "r": 0.980952381,
162
+ "f": 0.9581395349
163
  },
164
  "cop": {
165
+ "p": 0.9555555556,
166
+ "r": 0.9555555556,
167
+ "f": 0.9555555556
168
  },
169
  "advmod": {
170
+ "p": 0.9483870968,
171
+ "r": 0.921630094,
172
+ "f": 0.9348171701
173
  },
174
  "obl:arg": {
175
+ "p": 0.8818181818,
176
+ "r": 0.8818181818,
177
+ "f": 0.8818181818
178
  },
179
  "appos": {
180
+ "p": 0.6666666667,
181
+ "r": 0.6987951807,
182
+ "f": 0.6823529412
183
  },
184
  "nsubj:pass": {
185
+ "p": 0.987804878,
186
+ "r": 0.9529411765,
187
+ "f": 0.9700598802
188
  },
189
  "aux:pass": {
190
+ "p": 0.9910714286,
191
  "r": 0.9910714286,
192
+ "f": 0.9910714286
193
  },
194
  "acl:relcl": {
195
+ "p": 0.8235294118,
196
  "r": 0.8139534884,
197
+ "f": 0.8187134503
198
  },
199
  "advcl": {
200
+ "p": 0.7,
201
+ "r": 0.7179487179,
202
+ "f": 0.7088607595
203
  },
204
  "fixed": {
205
+ "p": 0.9090909091,
206
+ "r": 0.8,
207
+ "f": 0.8510638298
208
  },
209
  "dep": {
210
+ "p": 0.253968254,
211
  "r": 0.5517241379,
212
+ "f": 0.347826087
213
  },
214
  "expl:subj": {
215
+ "p": 0.875,
216
+ "r": 0.875,
217
+ "f": 0.875
218
  },
219
  "expl:comp": {
220
+ "p": 0.7368421053,
221
+ "r": 0.9333333333,
222
+ "f": 0.8235294118
223
  },
224
  "expl:pass": {
225
+ "p": 0.5,
226
  "r": 0.4285714286,
227
+ "f": 0.4615384615
228
  },
229
  "obl:agent": {
230
+ "p": 0.95,
231
+ "r": 0.9047619048,
232
+ "f": 0.9268292683
233
  },
234
  "ccomp": {
235
+ "p": 0.9411764706,
236
  "r": 0.9411764706,
237
+ "f": 0.9411764706
238
  },
239
  "parataxis": {
240
+ "p": 0.6428571429,
241
  "r": 0.6428571429,
242
+ "f": 0.6428571429
243
  },
244
  "iobj": {
245
+ "p": 0.7894736842,
246
+ "r": 0.6,
247
+ "f": 0.6818181818
248
  },
249
  "nsubj:caus": {
250
  "p": 0.0,
277
  "f": 0.0
278
  },
279
  "flat:foreign": {
280
+ "p": 0.6666666667,
281
+ "r": 0.5714285714,
282
+ "f": 0.6153846154
283
  },
284
  "orphan": {
285
  "p": 0.0,
297
  "f": 0.0
298
  }
299
  },
300
+ "tag_acc": 0.9579788605,
301
+ "lemma_acc": 0.9167694205,
302
+ "speed": 2617.175124839
303
  }
attribute_ruler/patterns CHANGED
Binary files a/attribute_ruler/patterns and b/attribute_ruler/patterns differ
config.cfg CHANGED
@@ -121,11 +121,12 @@ dropout = 0.1
121
  accumulate_gradient = 3
122
  patience = 5000
123
  max_epochs = 0
124
- max_steps = 16000
125
  eval_frequency = 1000
126
  frozen_components = []
127
  before_to_disk = null
128
  annotating_components = []
 
129
 
130
  [training.batcher]
131
  @batchers = "spacy.batch_by_padded.v1"
121
  accumulate_gradient = 3
122
  patience = 5000
123
  max_epochs = 0
124
+ max_steps = 20000
125
  eval_frequency = 1000
126
  frozen_components = []
127
  before_to_disk = null
128
  annotating_components = []
129
+ before_update = null
130
 
131
  [training.batcher]
132
  @batchers = "spacy.batch_by_padded.v1"
fr_dep_news_trf-any-py3-none-any.whl CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e724f775dec890cbb203f769b35864765ccc126d4dcc1fe1d01c91cd704319f3
3
- size 400751833
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c670005de650a9d1c6360e59cff832f85af5392d6396f01421670a1e74e0ab8f
3
+ size 400734236
meta.json CHANGED
@@ -1,14 +1,14 @@
1
  {
2
  "lang":"fr",
3
  "name":"dep_news_trf",
4
- "version":"3.4.0",
5
  "description":"French transformer pipeline (camembert-base). Components: transformer, morphologizer, parser, attribute_ruler, lemmatizer.",
6
  "author":"Explosion",
7
  "email":"contact@explosion.ai",
8
  "url":"https://explosion.ai",
9
  "license":"LGPL-LR",
10
- "spacy_version":">=3.4.0,<3.5.0",
11
- "spacy_git_version":"dd038b536",
12
  "vectors":{
13
  "width":0,
14
  "vectors":0,
@@ -280,60 +280,60 @@
280
 
281
  ],
282
  "performance":{
283
- "token_acc":0.9989751998,
284
  "token_p":0.9844389844,
285
  "token_r":0.9896058454,
286
  "token_f":0.9870156531,
287
- "pos_acc":0.9868522815,
288
- "morph_acc":0.9794319295,
289
- "morph_micro_p":0.9937076181,
290
- "morph_micro_r":0.9909833069,
291
- "morph_micro_f":0.9923435927,
292
  "morph_per_feat":{
293
  "Definite":{
294
- "p":0.9985358712,
295
  "r":0.995620438,
296
- "f":0.9970760234
297
  },
298
  "Number":{
299
- "p":0.9957533235,
300
- "r":0.992820324,
301
- "f":0.9942846608
302
  },
303
  "PronType":{
304
- "p":0.9987138264,
305
- "r":0.9936020473,
306
- "f":0.9961513791
307
  },
308
  "Gender":{
309
- "p":0.988974359,
310
- "r":0.9856887299,
311
- "f":0.987328811
312
  },
313
  "Mood":{
314
- "p":0.9982238011,
315
- "r":0.9982238011,
316
- "f":0.9982238011
317
  },
318
  "Person":{
319
- "p":0.9974779319,
320
- "r":0.9949685535,
321
- "f":0.9962216625
322
  },
323
  "Tense":{
324
- "p":0.987854251,
325
- "r":0.9969356486,
326
- "f":0.9923741739
327
  },
328
  "VerbForm":{
329
- "p":0.9917627677,
330
- "r":0.9966887417,
331
- "f":0.9942196532
332
  },
333
  "NumType":{
334
- "p":1.0,
335
- "r":0.9180887372,
336
- "f":0.9572953737
337
  },
338
  "Reflex":{
339
  "p":1.0,
@@ -341,9 +341,9 @@
341
  "f":1.0
342
  },
343
  "Voice":{
344
- "p":0.9327731092,
345
  "r":0.9910714286,
346
- "f":0.961038961
347
  },
348
  "Poss":{
349
  "p":1.0,
@@ -356,21 +356,21 @@
356
  "f":1.0
357
  }
358
  },
359
- "sents_p":0.9357142857,
360
- "sents_r":0.9538834951,
361
- "sents_f":0.9447115385,
362
- "dep_uas":0.946357271,
363
- "dep_las":0.9249725227,
364
  "dep_las_per_type":{
365
  "det":{
366
- "p":0.9887278583,
367
  "r":0.9911218725,
368
- "f":0.989923418
369
  },
370
  "nsubj":{
371
- "p":0.9498806683,
372
- "r":0.9590361446,
373
- "f":0.9544364508
374
  },
375
  "aux:tense":{
376
  "p":0.9609375,
@@ -378,154 +378,154 @@
378
  "f":0.9723320158
379
  },
380
  "root":{
381
- "p":0.9547619048,
382
- "r":0.9733009709,
383
- "f":0.9639423077
384
  },
385
  "obj":{
386
- "p":0.9422492401,
387
- "r":0.9198813056,
388
- "f":0.9309309309
389
  },
390
  "cc":{
391
- "p":0.9406392694,
392
- "r":0.9493087558,
393
- "f":0.9449541284
394
  },
395
  "case":{
396
- "p":0.9849931787,
397
- "r":0.9836512262,
398
- "f":0.9843217451
399
  },
400
  "obl:mod":{
401
- "p":0.8163265306,
402
- "r":0.8358208955,
403
- "f":0.8259587021
404
  },
405
  "nmod":{
406
- "p":0.9057171515,
407
- "r":0.9020979021,
408
- "f":0.9039039039
409
  },
410
  "conj":{
411
- "p":0.7557251908,
412
- "r":0.7795275591,
413
- "f":0.7674418605
414
  },
415
  "nummod":{
416
- "p":0.9074074074,
417
- "r":0.8698224852,
418
- "f":0.8882175227
419
  },
420
  "amod":{
421
- "p":0.9522058824,
422
- "r":0.9435336976,
423
- "f":0.9478499543
424
  },
425
  "acl":{
426
- "p":0.8612716763,
427
- "r":0.8612716763,
428
- "f":0.8612716763
429
  },
430
  "mark":{
431
- "p":0.9603524229,
432
- "r":0.9603524229,
433
- "f":0.9603524229
434
  },
435
  "xcomp":{
436
- "p":0.9044585987,
437
- "r":0.940397351,
438
- "f":0.9220779221
439
  },
440
  "flat:name":{
441
- "p":0.9622641509,
442
- "r":0.9714285714,
443
- "f":0.9668246445
444
  },
445
  "cop":{
446
- "p":0.9659090909,
447
- "r":0.9444444444,
448
- "f":0.9550561798
449
  },
450
  "advmod":{
451
- "p":0.9326923077,
452
- "r":0.9122257053,
453
- "f":0.9223454834
454
  },
455
  "obl:arg":{
456
- "p":0.9061032864,
457
- "r":0.8772727273,
458
- "f":0.8914549654
459
  },
460
  "appos":{
461
- "p":0.6785714286,
462
- "r":0.686746988,
463
- "f":0.6826347305
464
  },
465
  "nsubj:pass":{
466
- "p":0.9879518072,
467
- "r":0.9647058824,
468
- "f":0.9761904762
469
  },
470
  "aux:pass":{
471
- "p":0.982300885,
472
  "r":0.9910714286,
473
- "f":0.9866666667
474
  },
475
  "acl:relcl":{
476
- "p":0.7954545455,
477
  "r":0.8139534884,
478
- "f":0.8045977011
479
  },
480
  "advcl":{
481
- "p":0.7142857143,
482
- "r":0.7692307692,
483
- "f":0.7407407407
484
  },
485
  "fixed":{
486
- "p":0.9294117647,
487
- "r":0.79,
488
- "f":0.8540540541
489
  },
490
  "dep":{
491
- "p":0.2711864407,
492
  "r":0.5517241379,
493
- "f":0.3636363636
494
  },
495
  "expl:subj":{
496
- "p":0.8181818182,
497
- "r":0.84375,
498
- "f":0.8307692308
499
  },
500
  "expl:comp":{
501
- "p":0.7435897436,
502
- "r":0.9666666667,
503
- "f":0.8405797101
504
  },
505
  "expl:pass":{
506
- "p":0.75,
507
  "r":0.4285714286,
508
- "f":0.5454545455
509
  },
510
  "obl:agent":{
511
- "p":0.9285714286,
512
- "r":0.9285714286,
513
- "f":0.9285714286
514
  },
515
  "ccomp":{
516
- "p":0.96,
517
  "r":0.9411764706,
518
- "f":0.9504950495
519
  },
520
  "parataxis":{
521
- "p":0.6923076923,
522
  "r":0.6428571429,
523
- "f":0.6666666667
524
  },
525
  "iobj":{
526
- "p":0.8235294118,
527
- "r":0.56,
528
- "f":0.6666666667
529
  },
530
  "nsubj:caus":{
531
  "p":0.0,
@@ -558,9 +558,9 @@
558
  "f":0.0
559
  },
560
  "flat:foreign":{
561
- "p":0.5,
562
- "r":0.1428571429,
563
- "f":0.2222222222
564
  },
565
  "orphan":{
566
  "p":0.0,
@@ -578,9 +578,9 @@
578
  "f":0.0
579
  }
580
  },
581
- "tag_acc":0.9577726218,
582
- "lemma_acc":0.9122482532,
583
- "speed":3069.1330090473
584
  },
585
  "sources":[
586
  {
@@ -603,8 +603,8 @@
603
  }
604
  ],
605
  "requirements":[
606
- "spacy-transformers>=1.1.2,<1.2.0",
607
  "sentencepiece>=0.1.91,!=0.1.92",
608
- "protobuf"
609
  ]
610
  }
1
  {
2
  "lang":"fr",
3
  "name":"dep_news_trf",
4
+ "version":"3.5.0",
5
  "description":"French transformer pipeline (camembert-base). Components: transformer, morphologizer, parser, attribute_ruler, lemmatizer.",
6
  "author":"Explosion",
7
  "email":"contact@explosion.ai",
8
  "url":"https://explosion.ai",
9
  "license":"LGPL-LR",
10
+ "spacy_version":">=3.5.0,<3.6.0",
11
+ "spacy_git_version":"9e0322de1",
12
  "vectors":{
13
  "width":0,
14
  "vectors":0,
280
 
281
  ],
282
  "performance":{
283
+ "token_acc":0.997952498,
284
  "token_p":0.9844389844,
285
  "token_r":0.9896058454,
286
  "token_f":0.9870156531,
287
+ "pos_acc":0.9870585202,
288
+ "morph_acc":0.9784491648,
289
+ "morph_micro_p":0.9936410884,
290
+ "morph_micro_r":0.9900694529,
291
+ "morph_micro_f":0.9918520553,
292
  "morph_per_feat":{
293
  "Definite":{
294
+ "p":0.9992673993,
295
  "r":0.995620438,
296
+ "f":0.997440585
297
  },
298
  "Number":{
299
+ "p":0.9957517547,
300
+ "r":0.9924521355,
301
+ "f":0.9940992071
302
  },
303
  "PronType":{
304
+ "p":0.999356085,
305
+ "r":0.9929622521,
306
+ "f":0.9961489089
307
  },
308
  "Gender":{
309
+ "p":0.9876859928,
310
+ "r":0.9838998211,
311
+ "f":0.9857892715
312
  },
313
  "Mood":{
314
+ "p":0.9982206406,
315
+ "r":0.9964476021,
316
+ "f":0.9973333333
317
  },
318
  "Person":{
319
+ "p":0.9962121212,
320
+ "r":0.9924528302,
321
+ "f":0.9943289225
322
  },
323
  "Tense":{
324
+ "p":0.9878296146,
325
+ "r":0.9948927477,
326
+ "f":0.9913486005
327
  },
328
  "VerbForm":{
329
+ "p":0.9917491749,
330
+ "r":0.9950331126,
331
+ "f":0.9933884298
332
  },
333
  "NumType":{
334
+ "p":0.9963235294,
335
+ "r":0.9249146758,
336
+ "f":0.9592920354
337
  },
338
  "Reflex":{
339
  "p":1.0,
341
  "f":1.0
342
  },
343
  "Voice":{
344
+ "p":0.9652173913,
345
  "r":0.9910714286,
346
+ "f":0.9779735683
347
  },
348
  "Poss":{
349
  "p":1.0,
356
  "f":1.0
357
  }
358
  },
359
+ "sents_p":0.9331742243,
360
+ "sents_r":0.9490291262,
361
+ "sents_f":0.9410348977,
362
+ "dep_uas":0.9441518606,
363
+ "dep_las":0.9235307728,
364
  "dep_las_per_type":{
365
  "det":{
366
+ "p":0.9879324216,
367
  "r":0.9911218725,
368
+ "f":0.989524577
369
  },
370
  "nsubj":{
371
+ "p":0.9427207637,
372
+ "r":0.9518072289,
373
+ "f":0.9472422062
374
  },
375
  "aux:tense":{
376
  "p":0.9609375,
378
  "f":0.9723320158
379
  },
380
  "root":{
381
+ "p":0.9429928741,
382
+ "r":0.963592233,
383
+ "f":0.9531812725
384
  },
385
  "obj":{
386
+ "p":0.9537037037,
387
+ "r":0.9169139466,
388
+ "f":0.9349470499
389
  },
390
  "cc":{
391
+ "p":0.9539170507,
392
+ "r":0.9539170507,
393
+ "f":0.9539170507
394
  },
395
  "case":{
396
+ "p":0.9863852961,
397
+ "r":0.9870572207,
398
+ "f":0.986721144
399
  },
400
  "obl:mod":{
401
+ "p":0.8126888218,
402
+ "r":0.8029850746,
403
+ "f":0.8078078078
404
  },
405
  "nmod":{
406
+ "p":0.8984924623,
407
+ "r":0.8931068931,
408
+ "f":0.8957915832
409
  },
410
  "conj":{
411
+ "p":0.7707509881,
412
+ "r":0.7677165354,
413
+ "f":0.7692307692
414
  },
415
  "nummod":{
416
+ "p":0.921686747,
417
+ "r":0.9053254438,
418
+ "f":0.9134328358
419
  },
420
  "amod":{
421
+ "p":0.9611829945,
422
+ "r":0.9471766849,
423
+ "f":0.9541284404
424
  },
425
  "acl":{
426
+ "p":0.8222222222,
427
+ "r":0.8554913295,
428
+ "f":0.8385269122
429
  },
430
  "mark":{
431
+ "p":0.9733333333,
432
+ "r":0.9647577093,
433
+ "f":0.9690265487
434
  },
435
  "xcomp":{
436
+ "p":0.898089172,
437
+ "r":0.9337748344,
438
+ "f":0.9155844156
439
  },
440
  "flat:name":{
441
+ "p":0.9363636364,
442
+ "r":0.980952381,
443
+ "f":0.9581395349
444
  },
445
  "cop":{
446
+ "p":0.9555555556,
447
+ "r":0.9555555556,
448
+ "f":0.9555555556
449
  },
450
  "advmod":{
451
+ "p":0.9483870968,
452
+ "r":0.921630094,
453
+ "f":0.9348171701
454
  },
455
  "obl:arg":{
456
+ "p":0.8818181818,
457
+ "r":0.8818181818,
458
+ "f":0.8818181818
459
  },
460
  "appos":{
461
+ "p":0.6666666667,
462
+ "r":0.6987951807,
463
+ "f":0.6823529412
464
  },
465
  "nsubj:pass":{
466
+ "p":0.987804878,
467
+ "r":0.9529411765,
468
+ "f":0.9700598802
469
  },
470
  "aux:pass":{
471
+ "p":0.9910714286,
472
  "r":0.9910714286,
473
+ "f":0.9910714286
474
  },
475
  "acl:relcl":{
476
+ "p":0.8235294118,
477
  "r":0.8139534884,
478
+ "f":0.8187134503
479
  },
480
  "advcl":{
481
+ "p":0.7,
482
+ "r":0.7179487179,
483
+ "f":0.7088607595
484
  },
485
  "fixed":{
486
+ "p":0.9090909091,
487
+ "r":0.8,
488
+ "f":0.8510638298
489
  },
490
  "dep":{
491
+ "p":0.253968254,
492
  "r":0.5517241379,
493
+ "f":0.347826087
494
  },
495
  "expl:subj":{
496
+ "p":0.875,
497
+ "r":0.875,
498
+ "f":0.875
499
  },
500
  "expl:comp":{
501
+ "p":0.7368421053,
502
+ "r":0.9333333333,
503
+ "f":0.8235294118
504
  },
505
  "expl:pass":{
506
+ "p":0.5,
507
  "r":0.4285714286,
508
+ "f":0.4615384615
509
  },
510
  "obl:agent":{
511
+ "p":0.95,
512
+ "r":0.9047619048,
513
+ "f":0.9268292683
514
  },
515
  "ccomp":{
516
+ "p":0.9411764706,
517
  "r":0.9411764706,
518
+ "f":0.9411764706
519
  },
520
  "parataxis":{
521
+ "p":0.6428571429,
522
  "r":0.6428571429,
523
+ "f":0.6428571429
524
  },
525
  "iobj":{
526
+ "p":0.7894736842,
527
+ "r":0.6,
528
+ "f":0.6818181818
529
  },
530
  "nsubj:caus":{
531
  "p":0.0,
558
  "f":0.0
559
  },
560
  "flat:foreign":{
561
+ "p":0.6666666667,
562
+ "r":0.5714285714,
563
+ "f":0.6153846154
564
  },
565
  "orphan":{
566
  "p":0.0,
578
  "f":0.0
579
  }
580
  },
581
+ "tag_acc":0.9579788605,
582
+ "lemma_acc":0.9167694205,
583
+ "speed":2617.175124839
584
  },
585
  "sources":[
586
  {
603
  }
604
  ],
605
  "requirements":[
606
+ "spacy-transformers>=1.2.0.dev0,<1.3.0",
607
  "sentencepiece>=0.1.91,!=0.1.92",
608
+ "protobuf<3.21.0"
609
  ]
610
  }
morphologizer/model CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a5196efecf684a7bcf2ea33010a07de29ea6b1a2a7b1620d300b3f91c1d39e74
3
  size 603544
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ed7096edfd48947095556ff5540c26a2d9a98e76cfb2fcd15f59ead2228a1d8f
3
  size 603544
parser/model CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b208fbd7836e561d18162e4d4a5cb2dd9dbe05e9e6c7d96b2ebeb67c34181e1b
3
  size 397805
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b0b9a7efa99e378f1cab2940dca689328fee2c976b813793974325ecb0a1d6cf
3
  size 397805
tokenizer CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6d399a4e4c03d3ff8f9f14701678b318876e8f6799c64e01f4d342fa86cf6ac3
3
- size 1515364
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0c5994780fdf69912547eff13b24e61764efefae670274e56112354430afe0f4
3
+ size 1515440
transformer/model CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:fdf39ad8465f49e13e7206bccc5887a65abe5bc514bc3243743af20783c9dfbe
3
- size 445799779
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8b735ea3057ad39dd636e4cea687feb786064d84b6475c6a4aec142d8d4ccfe4
3
+ size 445799975
vocab/strings.json CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2c592ac50c40dd04f00896e96ed0eed7b552ad94ea71476f54c0714da60ee293
3
- size 228600
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:97ef211af70fba595843574fdd67f48f9683a67804bceca3df092c3d907fe6c3
3
+ size 228640