adrianeboyd committed on
Commit
c0f7334
1 Parent(s): 07168d0

Update spaCy pipeline

Browse files
Files changed (5) hide show
  1. README.md +7 -7
  2. accuracy.json +64 -64
  3. en_core_web_sm-any-py3-none-any.whl +2 -2
  4. meta.json +66 -66
  5. ner/model +1 -1
README.md CHANGED
@@ -14,13 +14,13 @@ model-index:
14
  metrics:
15
  - name: NER Precision
16
  type: precision
17
- value: 0.8565043157
18
  - name: NER Recall
19
  type: recall
20
- value: 0.8348858173
21
  - name: NER F Score
22
  type: f_score
23
- value: 0.8455569081
24
  - task:
25
  name: TAG
26
  type: token-classification
@@ -57,7 +57,7 @@ English pipeline optimized for CPU. Components: tok2vec, tagger, parser, senter,
57
  | Feature | Description |
58
  | --- | --- |
59
  | **Name** | `en_core_web_sm` |
60
- | **Version** | `3.4.0` |
61
  | **spaCy** | `>=3.4.0,<3.5.0` |
62
  | **Default Pipeline** | `tok2vec`, `tagger`, `parser`, `attribute_ruler`, `lemmatizer`, `ner` |
63
  | **Components** | `tok2vec`, `tagger`, `parser`, `senter`, `attribute_ruler`, `lemmatizer`, `ner` |
@@ -94,6 +94,6 @@ English pipeline optimized for CPU. Components: tok2vec, tagger, parser, senter,
94
  | `SENTS_F` | 90.39 |
95
  | `DEP_UAS` | 91.66 |
96
  | `DEP_LAS` | 89.78 |
97
- | `ENTS_P` | 85.65 |
98
- | `ENTS_R` | 83.49 |
99
- | `ENTS_F` | 84.56 |
 
14
  metrics:
15
  - name: NER Precision
16
  type: precision
17
+ value: 0.8410860451
18
  - name: NER Recall
19
  type: recall
20
+ value: 0.8439503205
21
  - name: NER F Score
22
  type: f_score
23
+ value: 0.8425157484
24
  - task:
25
  name: TAG
26
  type: token-classification
 
57
  | Feature | Description |
58
  | --- | --- |
59
  | **Name** | `en_core_web_sm` |
60
+ | **Version** | `3.4.1` |
61
  | **spaCy** | `>=3.4.0,<3.5.0` |
62
  | **Default Pipeline** | `tok2vec`, `tagger`, `parser`, `attribute_ruler`, `lemmatizer`, `ner` |
63
  | **Components** | `tok2vec`, `tagger`, `parser`, `senter`, `attribute_ruler`, `lemmatizer`, `ner` |
 
94
  | `SENTS_F` | 90.39 |
95
  | `DEP_UAS` | 91.66 |
96
  | `DEP_LAS` | 89.78 |
97
+ | `ENTS_P` | 84.11 |
98
+ | `ENTS_R` | 84.40 |
99
+ | `ENTS_F` | 84.25 |
accuracy.json CHANGED
@@ -231,100 +231,100 @@
231
  "f": 0.5714285714
232
  }
233
  },
234
- "ents_p": 0.8565043157,
235
- "ents_r": 0.8348858173,
236
- "ents_f": 0.8455569081,
237
  "ents_per_type": {
238
  "DATE": {
239
- "p": 0.8804768041,
240
- "r": 0.8676190476,
241
- "f": 0.8740006396
242
  },
243
  "GPE": {
244
- "p": 0.9239884393,
245
- "r": 0.8917712692,
246
- "f": 0.9075940383
247
  },
248
  "ORDINAL": {
249
- "p": 0.7910447761,
250
- "r": 0.8229813665,
251
- "f": 0.8066971081
252
  },
253
  "ORG": {
254
- "p": 0.8107606679,
255
- "r": 0.8109756098,
256
- "f": 0.8108681246
257
- },
258
- "FAC": {
259
- "p": 0.3902439024,
260
- "r": 0.3692307692,
261
- "f": 0.3794466403
262
  },
263
  "CARDINAL": {
264
- "p": 0.8266978923,
265
- "r": 0.8394768133,
266
- "f": 0.8330383481
 
 
 
 
 
267
  },
268
  "PERSON": {
269
- "p": 0.8648820905,
270
- "r": 0.885770235,
271
- "f": 0.8752015479
272
  },
273
  "NORP": {
274
- "p": 0.9130787977,
275
- "r": 0.8992,
276
- "f": 0.9060862555
277
  },
278
- "TIME": {
279
- "p": 0.7492163009,
280
- "r": 0.6988304094,
281
- "f": 0.7231467474
282
  },
283
- "LOC": {
284
- "p": 0.7158273381,
285
- "r": 0.6337579618,
286
- "f": 0.6722972973
287
  },
288
- "QUANTITY": {
289
- "p": 0.7971014493,
290
- "r": 0.6043956044,
291
- "f": 0.6875
292
  },
293
  "EVENT": {
294
- "p": 0.6373626374,
295
- "r": 0.3333333333,
296
- "f": 0.4377358491
297
  },
298
  "WORK_OF_ART": {
299
- "p": 0.5230769231,
300
- "r": 0.3505154639,
301
- "f": 0.4197530864
302
  },
303
  "LAW": {
304
- "p": 0.6304347826,
305
- "r": 0.453125,
306
- "f": 0.5272727273
307
  },
308
  "MONEY": {
309
- "p": 0.9179548157,
310
- "r": 0.9114521842,
311
- "f": 0.9146919431
312
- },
313
- "PERCENT": {
314
- "p": 0.9171974522,
315
- "r": 0.8820826953,
316
- "f": 0.8992974239
317
  },
318
  "PRODUCT": {
319
- "p": 0.5,
320
  "r": 0.2274881517,
321
- "f": 0.3127035831
 
 
 
 
 
322
  },
323
  "LANGUAGE": {
324
- "p": 0.8,
325
- "r": 0.625,
326
- "f": 0.701754386
327
  }
328
  },
329
- "speed": 9012.0225085527
330
  }
 
231
  "f": 0.5714285714
232
  }
233
  },
234
+ "ents_p": 0.8410860451,
235
+ "ents_r": 0.8439503205,
236
+ "ents_f": 0.8425157484,
237
  "ents_per_type": {
238
  "DATE": {
239
+ "p": 0.8602484472,
240
+ "r": 0.8793650794,
241
+ "f": 0.8697017268
242
  },
243
  "GPE": {
244
+ "p": 0.9056603774,
245
+ "r": 0.8970711297,
246
+ "f": 0.9013452915
247
  },
248
  "ORDINAL": {
249
+ "p": 0.7703081232,
250
+ "r": 0.8540372671,
251
+ "f": 0.8100147275
252
  },
253
  "ORG": {
254
+ "p": 0.7932975185,
255
+ "r": 0.8221102863,
256
+ "f": 0.807446947
 
 
 
 
 
257
  },
258
  "CARDINAL": {
259
+ "p": 0.8078409718,
260
+ "r": 0.8697978597,
261
+ "f": 0.8376753507
262
+ },
263
+ "LOC": {
264
+ "p": 0.7148148148,
265
+ "r": 0.6146496815,
266
+ "f": 0.6609589041
267
  },
268
  "PERSON": {
269
+ "p": 0.8480543545,
270
+ "r": 0.8962140992,
271
+ "f": 0.8714693748
272
  },
273
  "NORP": {
274
+ "p": 0.91230893,
275
+ "r": 0.9072,
276
+ "f": 0.9097472924
277
  },
278
+ "QUANTITY": {
279
+ "p": 0.7954545455,
280
+ "r": 0.5769230769,
281
+ "f": 0.6687898089
282
  },
283
+ "FAC": {
284
+ "p": 0.3773584906,
285
+ "r": 0.3076923077,
286
+ "f": 0.3389830508
287
  },
288
+ "TIME": {
289
+ "p": 0.7477744807,
290
+ "r": 0.7368421053,
291
+ "f": 0.7422680412
292
  },
293
  "EVENT": {
294
+ "p": 0.585106383,
295
+ "r": 0.316091954,
296
+ "f": 0.4104477612
297
  },
298
  "WORK_OF_ART": {
299
+ "p": 0.5,
300
+ "r": 0.3608247423,
301
+ "f": 0.4191616766
302
  },
303
  "LAW": {
304
+ "p": 0.435483871,
305
+ "r": 0.421875,
306
+ "f": 0.4285714286
307
  },
308
  "MONEY": {
309
+ "p": 0.9240048251,
310
+ "r": 0.9043683589,
311
+ "f": 0.9140811456
 
 
 
 
 
312
  },
313
  "PRODUCT": {
314
+ "p": 0.5333333333,
315
  "r": 0.2274881517,
316
+ "f": 0.3189368771
317
+ },
318
+ "PERCENT": {
319
+ "p": 0.9154704944,
320
+ "r": 0.8790199081,
321
+ "f": 0.896875
322
  },
323
  "LANGUAGE": {
324
+ "p": 0.85,
325
+ "r": 0.53125,
326
+ "f": 0.6538461538
327
  }
328
  },
329
+ "speed": 9602.8922159566
330
  }
en_core_web_sm-any-py3-none-any.whl CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:35365d49d389ecb19ba33119dca9ab9ff80b36fbeb063fa5d44008197fead8fa
3
- size 12803016
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:83872781dc64893d45d9dbe940e05f80df7e7196e169ea29e2e9742fed079549
3
+ size 12803038
meta.json CHANGED
@@ -1,14 +1,14 @@
1
  {
2
  "lang":"en",
3
  "name":"core_web_sm",
4
- "version":"3.4.0",
5
  "description":"English pipeline optimized for CPU. Components: tok2vec, tagger, parser, senter, ner, attribute_ruler, lemmatizer.",
6
  "author":"Explosion",
7
  "email":"contact@explosion.ai",
8
  "url":"https://explosion.ai",
9
  "license":"MIT",
10
  "spacy_version":">=3.4.0,<3.5.0",
11
- "spacy_git_version":"dd038b536",
12
  "vectors":{
13
  "width":0,
14
  "vectors":0,
@@ -398,102 +398,102 @@
398
  "f":0.5714285714
399
  }
400
  },
401
- "ents_p":0.8565043157,
402
- "ents_r":0.8348858173,
403
- "ents_f":0.8455569081,
404
  "ents_per_type":{
405
  "DATE":{
406
- "p":0.8804768041,
407
- "r":0.8676190476,
408
- "f":0.8740006396
409
  },
410
  "GPE":{
411
- "p":0.9239884393,
412
- "r":0.8917712692,
413
- "f":0.9075940383
414
  },
415
  "ORDINAL":{
416
- "p":0.7910447761,
417
- "r":0.8229813665,
418
- "f":0.8066971081
419
  },
420
  "ORG":{
421
- "p":0.8107606679,
422
- "r":0.8109756098,
423
- "f":0.8108681246
424
- },
425
- "FAC":{
426
- "p":0.3902439024,
427
- "r":0.3692307692,
428
- "f":0.3794466403
429
  },
430
  "CARDINAL":{
431
- "p":0.8266978923,
432
- "r":0.8394768133,
433
- "f":0.8330383481
 
 
 
 
 
434
  },
435
  "PERSON":{
436
- "p":0.8648820905,
437
- "r":0.885770235,
438
- "f":0.8752015479
439
  },
440
  "NORP":{
441
- "p":0.9130787977,
442
- "r":0.8992,
443
- "f":0.9060862555
444
  },
445
- "TIME":{
446
- "p":0.7492163009,
447
- "r":0.6988304094,
448
- "f":0.7231467474
449
  },
450
- "LOC":{
451
- "p":0.7158273381,
452
- "r":0.6337579618,
453
- "f":0.6722972973
454
  },
455
- "QUANTITY":{
456
- "p":0.7971014493,
457
- "r":0.6043956044,
458
- "f":0.6875
459
  },
460
  "EVENT":{
461
- "p":0.6373626374,
462
- "r":0.3333333333,
463
- "f":0.4377358491
464
  },
465
  "WORK_OF_ART":{
466
- "p":0.5230769231,
467
- "r":0.3505154639,
468
- "f":0.4197530864
469
  },
470
  "LAW":{
471
- "p":0.6304347826,
472
- "r":0.453125,
473
- "f":0.5272727273
474
  },
475
  "MONEY":{
476
- "p":0.9179548157,
477
- "r":0.9114521842,
478
- "f":0.9146919431
479
- },
480
- "PERCENT":{
481
- "p":0.9171974522,
482
- "r":0.8820826953,
483
- "f":0.8992974239
484
  },
485
  "PRODUCT":{
486
- "p":0.5,
487
  "r":0.2274881517,
488
- "f":0.3127035831
 
 
 
 
 
489
  },
490
  "LANGUAGE":{
491
- "p":0.8,
492
- "r":0.625,
493
- "f":0.701754386
494
  }
495
  },
496
- "speed":9012.0225085527
497
  },
498
  "sources":[
499
  {
 
1
  {
2
  "lang":"en",
3
  "name":"core_web_sm",
4
+ "version":"3.4.1",
5
  "description":"English pipeline optimized for CPU. Components: tok2vec, tagger, parser, senter, ner, attribute_ruler, lemmatizer.",
6
  "author":"Explosion",
7
  "email":"contact@explosion.ai",
8
  "url":"https://explosion.ai",
9
  "license":"MIT",
10
  "spacy_version":">=3.4.0,<3.5.0",
11
+ "spacy_git_version":"2b5f955c2",
12
  "vectors":{
13
  "width":0,
14
  "vectors":0,
 
398
  "f":0.5714285714
399
  }
400
  },
401
+ "ents_p":0.8410860451,
402
+ "ents_r":0.8439503205,
403
+ "ents_f":0.8425157484,
404
  "ents_per_type":{
405
  "DATE":{
406
+ "p":0.8602484472,
407
+ "r":0.8793650794,
408
+ "f":0.8697017268
409
  },
410
  "GPE":{
411
+ "p":0.9056603774,
412
+ "r":0.8970711297,
413
+ "f":0.9013452915
414
  },
415
  "ORDINAL":{
416
+ "p":0.7703081232,
417
+ "r":0.8540372671,
418
+ "f":0.8100147275
419
  },
420
  "ORG":{
421
+ "p":0.7932975185,
422
+ "r":0.8221102863,
423
+ "f":0.807446947
 
 
 
 
 
424
  },
425
  "CARDINAL":{
426
+ "p":0.8078409718,
427
+ "r":0.8697978597,
428
+ "f":0.8376753507
429
+ },
430
+ "LOC":{
431
+ "p":0.7148148148,
432
+ "r":0.6146496815,
433
+ "f":0.6609589041
434
  },
435
  "PERSON":{
436
+ "p":0.8480543545,
437
+ "r":0.8962140992,
438
+ "f":0.8714693748
439
  },
440
  "NORP":{
441
+ "p":0.91230893,
442
+ "r":0.9072,
443
+ "f":0.9097472924
444
  },
445
+ "QUANTITY":{
446
+ "p":0.7954545455,
447
+ "r":0.5769230769,
448
+ "f":0.6687898089
449
  },
450
+ "FAC":{
451
+ "p":0.3773584906,
452
+ "r":0.3076923077,
453
+ "f":0.3389830508
454
  },
455
+ "TIME":{
456
+ "p":0.7477744807,
457
+ "r":0.7368421053,
458
+ "f":0.7422680412
459
  },
460
  "EVENT":{
461
+ "p":0.585106383,
462
+ "r":0.316091954,
463
+ "f":0.4104477612
464
  },
465
  "WORK_OF_ART":{
466
+ "p":0.5,
467
+ "r":0.3608247423,
468
+ "f":0.4191616766
469
  },
470
  "LAW":{
471
+ "p":0.435483871,
472
+ "r":0.421875,
473
+ "f":0.4285714286
474
  },
475
  "MONEY":{
476
+ "p":0.9240048251,
477
+ "r":0.9043683589,
478
+ "f":0.9140811456
 
 
 
 
 
479
  },
480
  "PRODUCT":{
481
+ "p":0.5333333333,
482
  "r":0.2274881517,
483
+ "f":0.3189368771
484
+ },
485
+ "PERCENT":{
486
+ "p":0.9154704944,
487
+ "r":0.8790199081,
488
+ "f":0.896875
489
  },
490
  "LANGUAGE":{
491
+ "p":0.85,
492
+ "r":0.53125,
493
+ "f":0.6538461538
494
  }
495
  },
496
+ "speed":9602.8922159566
497
  },
498
  "sources":[
499
  {
ner/model CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9501662e93036b834cac45ad7014f9376ee2709606d82d79aa29e4243cdaca42
3
  size 6284763
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f4fb108369f6a3a7739e485793203f1feeb3316434bbc9a9c07f2687be80ad65
3
  size 6284763