marekk committed on
Commit
e472f7f
1 Parent(s): c8a432b

Update spaCy pipeline

Browse files
README.md CHANGED
@@ -13,13 +13,13 @@ model-index:
13
  metrics:
14
  - name: NER Precision
15
  type: precision
16
- value: 0.8315789474
17
  - name: NER Recall
18
  type: recall
19
- value: 0.9076447194
20
  - name: NER F Score
21
  type: f_score
22
- value: 0.8679484471
23
  ---
24
  | Feature | Description |
25
  | --- | --- |
@@ -49,8 +49,8 @@ model-index:
49
 
50
  | Type | Score |
51
  | --- | --- |
52
- | `ENTS_F` | 86.79 |
53
- | `ENTS_P` | 83.16 |
54
- | `ENTS_R` | 90.76 |
55
- | `TRANSFORMER_LOSS` | 32794.24 |
56
- | `NER_LOSS` | 212387.08 |
 
13
  metrics:
14
  - name: NER Precision
15
  type: precision
16
+ value: 0.8621646623
17
  - name: NER Recall
18
  type: recall
19
+ value: 0.8825757576
20
  - name: NER F Score
21
  type: f_score
22
+ value: 0.8722508189
23
  ---
24
  | Feature | Description |
25
  | --- | --- |
 
49
 
50
  | Type | Score |
51
  | --- | --- |
52
+ | `ENTS_F` | 87.23 |
53
+ | `ENTS_P` | 86.22 |
54
+ | `ENTS_R` | 88.26 |
55
+ | `TRANSFORMER_LOSS` | 137449.06 |
56
+ | `NER_LOSS` | 323071.16 |
meta.json CHANGED
@@ -38,33 +38,33 @@
38
 
39
  ],
40
  "performance":{
41
- "ents_f":0.8679484471,
42
- "ents_p":0.8315789474,
43
- "ents_r":0.9076447194,
44
  "ents_per_type":{
45
- "PLAYER":{
46
- "p":0.774566474,
47
- "r":0.8993288591,
48
- "f":0.8322981366
49
- },
50
  "TOURNAMENT":{
51
- "p":0.8476190476,
52
- "r":0.9319371728,
53
- "f":0.8877805486
54
  },
55
  "TEAM":{
56
- "p":0.8985221675,
57
- "r":0.9258883249,
58
- "f":0.912
 
 
 
 
 
59
  },
60
  "ALIAS_TEAM":{
61
- "p":0.7647058824,
62
- "r":0.5909090909,
63
- "f":0.6666666667
64
  }
65
  },
66
- "transformer_loss":327.9424025911,
67
- "ner_loss":2123.8707888085
68
  },
69
  "requirements":[
70
  "spacy-transformers>=1.1.9,<1.2.0"
 
38
 
39
  ],
40
  "performance":{
41
+ "ents_f":0.8722508189,
42
+ "ents_p":0.8621646623,
43
+ "ents_r":0.8825757576,
44
  "ents_per_type":{
 
 
 
 
 
45
  "TOURNAMENT":{
46
+ "p":0.8691983122,
47
+ "r":0.8765957447,
48
+ "f":0.8728813559
49
  },
50
  "TEAM":{
51
+ "p":0.8995680346,
52
+ "r":0.8966630786,
53
+ "f":0.8981132075
54
+ },
55
+ "PLAYER":{
56
+ "p":0.8345398139,
57
+ "r":0.8838992333,
58
+ "f":0.8585106383
59
  },
60
  "ALIAS_TEAM":{
61
+ "p":0.5625,
62
+ "r":0.5142857143,
63
+ "f":0.5373134328
64
  }
65
  },
66
+ "transformer_loss":1374.4906167755,
67
+ "ner_loss":3230.7115738995
68
  },
69
  "requirements":[
70
  "spacy-transformers>=1.1.9,<1.2.0"
ner/model CHANGED
Binary files a/ner/model and b/ner/model differ
 
ner/moves CHANGED
@@ -1 +1 @@
1
- ��moves� {"0":{},"1":{"PLAYER":5606,"TEAM":4463,"TOURNAMENT":1790,"ALIAS_TEAM":93},"2":{"PLAYER":5606,"TEAM":4463,"TOURNAMENT":1790,"ALIAS_TEAM":93},"3":{"PLAYER":5606,"TEAM":4463,"TOURNAMENT":1790,"ALIAS_TEAM":93},"4":{"PLAYER":5606,"TEAM":4463,"TOURNAMENT":1790,"ALIAS_TEAM":93,"":1},"5":{"":1}}�cfg��neg_key�
 
1
+ ��moves�${"0":{},"1":{"PLAYER":5847,"TEAM":4522,"TOURNAMENT":1678,"ALIAS_TEAM":105},"2":{"PLAYER":5847,"TEAM":4522,"TOURNAMENT":1678,"ALIAS_TEAM":105},"3":{"PLAYER":5847,"TEAM":4522,"TOURNAMENT":1678,"ALIAS_TEAM":105},"4":{"PLAYER":5847,"TEAM":4522,"TOURNAMENT":1678,"ALIAS_TEAM":105,"":1},"5":{"":1}}�cfg��neg_key�
transformer/model CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8e45bd72109efeaea3ba2e903b7b7e9d1167fc6aa9bda3b350573372b2e140f8
3
  size 672945750
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1c13db7e693e38eede67fec56cda81604f168449a3ef3faef53733df83edface
3
  size 672945750
vocab/strings.json CHANGED
@@ -91,6 +91,7 @@
91
  "-p",
92
  "-x",
93
  "-|",
 
94
  ".",
95
  "..",
96
  "...",
@@ -706,6 +707,8 @@
706
  "997",
707
  "998",
708
  "999",
 
 
709
  "9th",
710
  ":",
711
  ":'(",
@@ -2848,7 +2851,7 @@
2848
  "Golovin",
2849
  "Gomese",
2850
  "Gones",
2851
- "Gonzalez",
2852
  "Gonz\u00e1lezovi",
2853
  "Good",
2854
  "Goodison",
@@ -3747,7 +3750,7 @@
3747
  "Kempn\u00fd",
3748
  "Kenin",
3749
  "Kent",
3750
- "Kenya",
3751
  "Kepa",
3752
  "Kepovi",
3753
  "Kern",
@@ -4938,6 +4941,7 @@
4938
  "Next",
4939
  "NextGen",
4940
  "Neymar",
 
4941
  "Neymarovi",
4942
  "Nezapomenu",
4943
  "Nezapom\u00ednejme",
@@ -5302,6 +5306,7 @@
5302
  "PR",
5303
  "PROFILE",
5304
  "PSG",
 
5305
  "PSL",
5306
  "PSV",
5307
  "Pace",
@@ -5974,7 +5979,7 @@
5974
  "Rishi",
5975
  "Rising",
5976
  "Rittich",
5977
- "Rivera",
5978
  "Riviera",
5979
  "Riyad",
5980
  "Riyadh",
@@ -7579,6 +7584,7 @@
7579
  "XI",
7580
  "XX",
7581
  "XXX",
 
7582
  "XXXX",
7583
  "XXXX-dd",
7584
  "XXXX_XXXX",
@@ -7609,6 +7615,7 @@
7609
  "XxxxXxx",
7610
  "Xxxxd",
7611
  "Xxxxx",
 
7612
  "Xxxxx'Xxxxx",
7613
  "Xxxxx+Xxxxx",
7614
  "Xxxxx-dd",
@@ -11147,6 +11154,7 @@
11147
  "dom\u00e1c\u00edmu",
11148
  "dom\u016f",
11149
  "don",
 
11150
  "don't",
11151
  "donati",
11152
  "donating",
@@ -12952,7 +12960,7 @@
12952
  "gone",
12953
  "gones",
12954
  "gong",
12955
- "gonzalez",
12956
  "gonz\u00e1lezovi",
12957
  "good",
12958
  "goodison",
@@ -14957,7 +14965,7 @@
14957
  "ken",
14958
  "kenin",
14959
  "kent",
14960
- "kenya",
14961
  "kepa",
14962
  "kepovi",
14963
  "kept",
@@ -15877,7 +15885,6 @@
15877
  "lex",
15878
  "ley",
15879
  "leylah",
15880
- "lez",
15881
  "le\u010d",
15882
  "le\u0161",
15883
  "le\u017e\u00ed",
@@ -18271,6 +18278,7 @@
18271
  "nextgen",
18272
  "ney",
18273
  "neymar",
 
18274
  "neymarovi",
18275
  "nez",
18276
  "nezabalil",
@@ -18644,7 +18652,6 @@
18644
  "nuts",
18645
  "nu\u0161",
18646
  "ny",
18647
- "nya",
18648
  "nyi",
18649
  "nylander",
18650
  "nym",
@@ -21387,6 +21394,7 @@
21387
  "pr\u016f\u017eek",
21388
  "pse",
21389
  "psg",
 
21390
  "psi",
21391
  "psl",
21392
  "psota",
@@ -22535,7 +22543,7 @@
22535
  "rivals",
22536
  "rivaly",
22537
  "rival\u016f",
22538
- "rivera",
22539
  "riviera",
22540
  "rix",
22541
  "riyad",
@@ -27684,6 +27692,7 @@
27684
  "worst",
27685
  "worth",
27686
  "would",
 
27687
  "wouldn\u2019t",
27688
  "wozniacki",
27689
  "wrap",
@@ -27751,10 +27760,12 @@
27751
  "xxd",
27752
  "xxdd",
27753
  "xxx",
 
27754
  "xxx'x",
27755
  "xxx'xx",
27756
  "xxxx",
27757
  "xxxx\"-",
 
27758
  "xxxx'",
27759
  "xxxx'x",
27760
  "xxxx'xx",
@@ -30178,7 +30189,6 @@
30178
  "\u0ca0",
30179
  "\u0ca0_\u0ca0",
30180
  "\u0ca0\ufe35\u0ca0",
30181
- "\u2013",
30182
  "\u2014",
30183
  "\u2018",
30184
  "\u2019",
@@ -30197,7 +30207,6 @@
30197
  "\u202075",
30198
  "\u2020dd",
30199
  "\u2026",
30200
- "\u2060",
30201
  "\u20ac",
30202
  "\u2122",
30203
  "\u2501",
 
91
  "-p",
92
  "-x",
93
  "-|",
94
+ "-\u2060",
95
  ".",
96
  "..",
97
  "...",
 
707
  "997",
708
  "998",
709
  "999",
710
+ "9;s",
711
+ "9;t",
712
  "9th",
713
  ":",
714
  ":'(",
 
2851
  "Golovin",
2852
  "Gomese",
2853
  "Gones",
2854
+ "Gonzalez&#039;s",
2855
  "Gonz\u00e1lezovi",
2856
  "Good",
2857
  "Goodison",
 
3750
  "Kempn\u00fd",
3751
  "Kenin",
3752
  "Kent",
3753
+ "Kenya&#039;s",
3754
  "Kepa",
3755
  "Kepovi",
3756
  "Kern",
 
4941
  "Next",
4942
  "NextGen",
4943
  "Neymar",
4944
+ "Neymar&#039;s",
4945
  "Neymarovi",
4946
  "Nezapomenu",
4947
  "Nezapom\u00ednejme",
 
5306
  "PR",
5307
  "PROFILE",
5308
  "PSG",
5309
+ "PSG&#039;s",
5310
  "PSL",
5311
  "PSV",
5312
  "Pace",
 
5979
  "Rishi",
5980
  "Rising",
5981
  "Rittich",
5982
+ "Rivera&#039;s",
5983
  "Riviera",
5984
  "Riyad",
5985
  "Riyadh",
 
7584
  "XI",
7585
  "XX",
7586
  "XXX",
7587
+ "XXX&#ddd;x",
7588
  "XXXX",
7589
  "XXXX-dd",
7590
  "XXXX_XXXX",
 
7615
  "XxxxXxx",
7616
  "Xxxxd",
7617
  "Xxxxx",
7618
+ "Xxxxx&#ddd;x",
7619
  "Xxxxx'Xxxxx",
7620
  "Xxxxx+Xxxxx",
7621
  "Xxxxx-dd",
 
11154
  "dom\u00e1c\u00edmu",
11155
  "dom\u016f",
11156
  "don",
11157
+ "don&#039;t",
11158
  "don't",
11159
  "donati",
11160
  "donating",
 
12960
  "gone",
12961
  "gones",
12962
  "gong",
12963
+ "gonzalez&#039;s",
12964
  "gonz\u00e1lezovi",
12965
  "good",
12966
  "goodison",
 
14965
  "ken",
14966
  "kenin",
14967
  "kent",
14968
+ "kenya&#039;s",
14969
  "kepa",
14970
  "kepovi",
14971
  "kept",
 
15885
  "lex",
15886
  "ley",
15887
  "leylah",
 
15888
  "le\u010d",
15889
  "le\u0161",
15890
  "le\u017e\u00ed",
 
18278
  "nextgen",
18279
  "ney",
18280
  "neymar",
18281
+ "neymar&#039;s",
18282
  "neymarovi",
18283
  "nez",
18284
  "nezabalil",
 
18652
  "nuts",
18653
  "nu\u0161",
18654
  "ny",
 
18655
  "nyi",
18656
  "nylander",
18657
  "nym",
 
21394
  "pr\u016f\u017eek",
21395
  "pse",
21396
  "psg",
21397
+ "psg&#039;s",
21398
  "psi",
21399
  "psl",
21400
  "psota",
 
22543
  "rivals",
22544
  "rivaly",
22545
  "rival\u016f",
22546
+ "rivera&#039;s",
22547
  "riviera",
22548
  "rix",
22549
  "riyad",
 
27692
  "worst",
27693
  "worth",
27694
  "would",
27695
+ "wouldn&#039;t",
27696
  "wouldn\u2019t",
27697
  "wozniacki",
27698
  "wrap",
 
27760
  "xxd",
27761
  "xxdd",
27762
  "xxx",
27763
+ "xxx&#ddd;x",
27764
  "xxx'x",
27765
  "xxx'xx",
27766
  "xxxx",
27767
  "xxxx\"-",
27768
+ "xxxx&#ddd;x",
27769
  "xxxx'",
27770
  "xxxx'x",
27771
  "xxxx'xx",
 
30189
  "\u0ca0",
30190
  "\u0ca0_\u0ca0",
30191
  "\u0ca0\ufe35\u0ca0",
 
30192
  "\u2014",
30193
  "\u2018",
30194
  "\u2019",
 
30207
  "\u202075",
30208
  "\u2020dd",
30209
  "\u2026",
 
30210
  "\u20ac",
30211
  "\u2122",
30212
  "\u2501",
xx_ner_sport_entities_uncased-any-py3-none-any.whl CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b65ce1dc3ec9d1d4d0e1dc58d21dc7879f8b1d14a2634bf300b7ca9c7b7f65d9
3
- size 622787729
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7dbad133202d1a63918219317a3146c137921fbb89f068e266395f2c7219ac24
3
+ size 622789555