cbruinsm committed on
Commit
9500de3
1 Parent(s): 12ec1bb

Update spaCy pipeline

Browse files
Files changed (8) hide show
  1. README.md +12 -11
  2. config.cfg +2 -2
  3. en_Coff_Ev1-any-py3-none-any.whl +2 -2
  4. meta.json +47 -47
  5. ner/model +0 -0
  6. ner/moves +1 -1
  7. tok2vec/model +1 -1
  8. vocab/strings.json +23 -0
README.md CHANGED
@@ -4,6 +4,7 @@ tags:
4
  - token-classification
5
  language:
6
  - en
 
7
  model-index:
8
  - name: en_Coff_Ev1
9
  results:
@@ -13,26 +14,26 @@ model-index:
13
  metrics:
14
  - name: NER Precision
15
  type: precision
16
- value: 0.9920977011
17
  - name: NER Recall
18
  type: recall
19
- value: 0.9913854989
20
  - name: NER F Score
21
  type: f_score
22
- value: 0.9917414722
23
  ---
24
- A natural language processor API for coffee drinks in all forms built from nearly 500+ different coffee drinks for Starbucks and Beyond
25
 
26
  | Feature | Description |
27
  | --- | --- |
28
  | **Name** | `en_Coff_Ev1` |
29
- | **Version** | `1.1.1` |
30
  | **spaCy** | `>=3.4.3,<3.5.0` |
31
  | **Default Pipeline** | `tok2vec`, `ner` |
32
  | **Components** | `tok2vec`, `ner` |
33
  | **Vectors** | 0 keys, 0 unique vectors (0 dimensions) |
34
  | **Sources** | n/a |
35
- | **License** | n/a |
36
  | **Author** | [Chris Bruinsma,Iris Chi,Jack Felciano,Jeffrey Li,Dustin Paden]() |
37
 
38
  ### Label Scheme
@@ -51,8 +52,8 @@ A natural language processor API for coffee drinks in all forms built from nearl
51
 
52
  | Type | Score |
53
  | --- | --- |
54
- | `ENTS_F` | 99.17 |
55
- | `ENTS_P` | 99.21 |
56
- | `ENTS_R` | 99.14 |
57
- | `TOK2VEC_LOSS` | 19296.40 |
58
- | `NER_LOSS` | 157988.43 |
 
4
  - token-classification
5
  language:
6
  - en
7
+ license: mit
8
  model-index:
9
  - name: en_Coff_Ev1
10
  results:
 
14
  metrics:
15
  - name: NER Precision
16
  type: precision
17
+ value: 0.9928104575
18
  - name: NER Recall
19
  type: recall
20
+ value: 0.9921619856
21
  - name: NER F Score
22
  type: f_score
23
+ value: 0.9924861156
24
  ---
25
+ A natural language processor API for coffee drinks in all forms built from nearly 500 different coffee drinks for Starbucks and your local coffee shop
26
 
27
  | Feature | Description |
28
  | --- | --- |
29
  | **Name** | `en_Coff_Ev1` |
30
+ | **Version** | `1.1.2` |
31
  | **spaCy** | `>=3.4.3,<3.5.0` |
32
  | **Default Pipeline** | `tok2vec`, `ner` |
33
  | **Components** | `tok2vec`, `ner` |
34
  | **Vectors** | 0 keys, 0 unique vectors (0 dimensions) |
35
  | **Sources** | n/a |
36
+ | **License** | `MIT` |
37
  | **Author** | [Chris Bruinsma,Iris Chi,Jack Felciano,Jeffrey Li,Dustin Paden]() |
38
 
39
  ### Label Scheme
 
52
 
53
  | Type | Score |
54
  | --- | --- |
55
+ | `ENTS_F` | 99.25 |
56
+ | `ENTS_P` | 99.28 |
57
+ | `ENTS_R` | 99.22 |
58
+ | `TOK2VEC_LOSS` | 79694.90 |
59
+ | `NER_LOSS` | 189668.04 |
config.cfg CHANGED
@@ -11,7 +11,7 @@ seed = 0
11
  [nlp]
12
  lang = "en"
13
  pipeline = ["tok2vec","ner"]
14
- batch_size = 1000
15
  disabled = []
16
  before_creation = null
17
  after_creation = null
@@ -120,7 +120,7 @@ L2 = 0.01
120
  grad_clip = 1.0
121
  use_averages = false
122
  eps = 0.00000001
123
- learn_rate = 0.001
124
 
125
  [training.score_weights]
126
  ents_f = 1.0
 
11
  [nlp]
12
  lang = "en"
13
  pipeline = ["tok2vec","ner"]
14
+ batch_size = 50
15
  disabled = []
16
  before_creation = null
17
  after_creation = null
 
120
  grad_clip = 1.0
121
  use_averages = false
122
  eps = 0.00000001
123
+ learn_rate = 0.0001
124
 
125
  [training.score_weights]
126
  ents_f = 1.0
en_Coff_Ev1-any-py3-none-any.whl CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:315972a987b782003aa34763a116a114ecf458dd3e9fc93c4d20bdff4ac6ba35
3
- size 5683919
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cbad8e5131e5d8b00eec847a453d1b20730c4d2cbe8cdab89716dfd2a36b6d47
3
+ size 5673787
meta.json CHANGED
@@ -1,12 +1,12 @@
1
  {
2
  "lang":"en",
3
  "name":"Coff_Ev1",
4
- "version":"1.1.1",
5
- "description":"A natural language processor API for coffee drinks in all forms built from 400+ different coffee drinks for Starbucks and Beyond",
6
  "author":"Chris Bruinsma,Iris Chi,Jack Felciano,Jeffrey Li,Dustin Paden",
7
- "email":"",
8
  "url":"",
9
- "license":"",
10
  "spacy_version":">=3.4.3,<3.5.0",
11
  "spacy_git_version":"63673a792",
12
  "vectors":{
@@ -48,36 +48,51 @@
48
 
49
  ],
50
  "performance":{
51
- "ents_f":0.9917414722,
52
- "ents_p":0.9920977011,
53
- "ents_r":0.9913854989,
54
  "ents_per_type":{
55
- "size":{
56
- "p":0.9968152866,
57
- "r":0.9968152866,
58
- "f":0.9968152866
59
- },
60
  "toppings":{
61
- "p":1.0,
62
- "r":0.9838709677,
63
- "f":0.9918699187
 
 
 
 
 
64
  },
65
  "drink":{
66
- "p":0.9913043478,
67
- "r":0.9934640523,
68
- "f":0.992383025
 
 
 
 
 
69
  },
70
  "Anti":{
71
  "p":1.0,
72
  "r":1.0,
73
  "f":1.0
74
  },
75
- "syrup":{
76
- "p":0.9953703704,
77
- "r":0.9953703704,
78
- "f":0.9953703704
79
  },
80
- "upside-down":{
 
 
 
 
 
 
 
 
 
 
81
  "p":1.0,
82
  "r":1.0,
83
  "f":1.0
@@ -87,44 +102,29 @@
87
  "r":1.0,
88
  "f":1.0
89
  },
90
- "pump quantity":{
91
- "p":1.0,
92
- "r":0.9285714286,
93
- "f":0.962962963
94
  },
95
- "milk":{
96
  "p":1.0,
97
  "r":1.0,
98
  "f":1.0
99
  },
100
  "milk texture":{
101
- "p":0.8888888889,
102
- "r":1.0,
103
- "f":0.9411764706
104
- },
105
- "temperature":{
106
  "p":1.0,
107
- "r":0.990990991,
108
- "f":0.9954751131
109
  },
110
  "roast":{
111
  "p":1.0,
112
  "r":0.9523809524,
113
  "f":0.9756097561
114
- },
115
- "shot quality":{
116
- "p":0.9375,
117
- "r":0.9375,
118
- "f":0.9375
119
- },
120
- "shot quantity":{
121
- "p":0.8421052632,
122
- "r":0.9411764706,
123
- "f":0.8888888889
124
  }
125
  },
126
- "tok2vec_loss":192.9639828272,
127
- "ner_loss":1579.8842665188
128
  },
129
  "requirements":[
130
 
 
1
  {
2
  "lang":"en",
3
  "name":"Coff_Ev1",
4
+ "version":"1.1.2",
5
+ "description":"A natural language processor API for coffee drinks in all forms built from nearly 500 different coffee drinks for Starbucks and your local coffee shop",
6
  "author":"Chris Bruinsma,Iris Chi,Jack Felciano,Jeffrey Li,Dustin Paden",
7
+ "email":"christopher.j.bruinsm@outlook.com",
8
  "url":"",
9
+ "license":"MIT",
10
  "spacy_version":">=3.4.3,<3.5.0",
11
  "spacy_git_version":"63673a792",
12
  "vectors":{
 
48
 
49
  ],
50
  "performance":{
51
+ "ents_f":0.9924861156,
52
+ "ents_p":0.9928104575,
53
+ "ents_r":0.9921619856,
54
  "ents_per_type":{
 
 
 
 
 
55
  "toppings":{
56
+ "p":0.9855072464,
57
+ "r":1.0,
58
+ "f":0.9927007299
59
+ },
60
+ "syrup":{
61
+ "p":0.9957627119,
62
+ "r":0.9957627119,
63
+ "f":0.9957627119
64
  },
65
  "drink":{
66
+ "p":0.9920634921,
67
+ "r":0.9940357853,
68
+ "f":0.9930486594
69
+ },
70
+ "size":{
71
+ "p":0.9970845481,
72
+ "r":0.9970845481,
73
+ "f":0.9970845481
74
  },
75
  "Anti":{
76
  "p":1.0,
77
  "r":1.0,
78
  "f":1.0
79
  },
80
+ "temperature":{
81
+ "p":1.0,
82
+ "r":0.9914529915,
83
+ "f":0.9957081545
84
  },
85
+ "pump quantity":{
86
+ "p":0.9375,
87
+ "r":1.0,
88
+ "f":0.9677419355
89
+ },
90
+ "shot quality":{
91
+ "p":1.0,
92
+ "r":0.9130434783,
93
+ "f":0.9545454545
94
+ },
95
+ "milk":{
96
  "p":1.0,
97
  "r":1.0,
98
  "f":1.0
 
102
  "r":1.0,
103
  "f":1.0
104
  },
105
+ "shot quantity":{
106
+ "p":0.9259259259,
107
+ "r":0.9259259259,
108
+ "f":0.9259259259
109
  },
110
+ "upside-down":{
111
  "p":1.0,
112
  "r":1.0,
113
  "f":1.0
114
  },
115
  "milk texture":{
 
 
 
 
 
116
  "p":1.0,
117
+ "r":0.875,
118
+ "f":0.9333333333
119
  },
120
  "roast":{
121
  "p":1.0,
122
  "r":0.9523809524,
123
  "f":0.9756097561
 
 
 
 
 
 
 
 
 
 
124
  }
125
  },
126
+ "tok2vec_loss":796.9489580916,
127
+ "ner_loss":1896.6804416175
128
  },
129
  "requirements":[
130
 
ner/model CHANGED
Binary files a/ner/model and b/ner/model differ
 
ner/moves CHANGED
@@ -1 +1 @@
1
- ��moves�T{"0":{},"1":{"drink":811,"syrup":336,"size":318,"milk":167,"toppings":149,"temperature":123,"pump quantity":54,"Anti":53,"shot quantity":24,"roast":24,"shot quality":22,"extra":15,"upside-down":12,"milk texture":9},"2":{"drink":811,"syrup":336,"size":318,"milk":167,"toppings":149,"temperature":123,"pump quantity":54,"Anti":53,"shot quantity":24,"roast":24,"shot quality":22,"extra":15,"upside-down":12,"milk texture":9},"3":{"drink":811,"syrup":336,"size":318,"milk":167,"toppings":149,"temperature":123,"pump quantity":54,"Anti":53,"shot quantity":24,"roast":24,"shot quality":22,"extra":15,"upside-down":12,"milk texture":9},"4":{"drink":811,"syrup":336,"size":318,"milk":167,"toppings":149,"temperature":123,"pump quantity":54,"Anti":53,"shot quantity":24,"roast":24,"shot quality":22,"extra":15,"upside-down":12,"milk texture":9,"":1},"5":{"":1}}�cfg��neg_key�
 
1
+ ��moves�T{"0":{},"1":{"drink":880,"syrup":367,"size":347,"milk":187,"toppings":160,"temperature":129,"Anti":59,"pump quantity":58,"shot quality":35,"shot quantity":34,"roast":24,"extra":17,"upside-down":12,"milk texture":9},"2":{"drink":880,"syrup":367,"size":347,"milk":187,"toppings":160,"temperature":129,"Anti":59,"pump quantity":58,"shot quality":35,"shot quantity":34,"roast":24,"extra":17,"upside-down":12,"milk texture":9},"3":{"drink":880,"syrup":367,"size":347,"milk":187,"toppings":160,"temperature":129,"Anti":59,"pump quantity":58,"shot quality":35,"shot quantity":34,"roast":24,"extra":17,"upside-down":12,"milk texture":9},"4":{"drink":880,"syrup":367,"size":347,"milk":187,"toppings":160,"temperature":129,"Anti":59,"pump quantity":58,"shot quality":35,"shot quantity":34,"roast":24,"extra":17,"upside-down":12,"milk texture":9,"":1},"5":{"":1}}�cfg��neg_key�
tok2vec/model CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b7486fa28a815ae9a31bae531c2440aabb59ca684f63e9a378987383d552a747
3
  size 6009091
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dd132f7fca40616523d8c55bc18dcbb8ff56c835fdcb86d2a82f93c8f4aac355
3
  size 6009091
vocab/strings.json CHANGED
@@ -346,6 +346,7 @@
346
  "Colo",
347
  "Colo.",
348
  "Colorado",
 
349
  "Conn",
350
  "Conn.",
351
  "Connecticut",
@@ -398,9 +399,11 @@
398
  "Florida",
399
  "Foamy",
400
  "Fog",
 
401
  "Frappe",
402
  "Frappeccino",
403
  "Frappuccino",
 
404
  "Fresher",
405
  "G",
406
  "Ga",
@@ -432,6 +435,7 @@
432
  "He's",
433
  "He\u2019s",
434
  "Hi",
 
435
  "Hot",
436
  "How",
437
  "How's",
@@ -505,6 +509,7 @@
505
  "Ltd.",
506
  "M",
507
  "Ma'am",
 
508
  "Mango",
509
  "Mar",
510
  "Mar.",
@@ -608,6 +613,7 @@
608
  "P",
609
  "Pa",
610
  "Pa.",
 
611
  "Paradise",
612
  "Passion",
613
  "Peach",
@@ -623,6 +629,7 @@
623
  "Praline",
624
  "Prof",
625
  "Prof.",
 
626
  "Pumpkin",
627
  "R",
628
  "ROOT",
@@ -633,8 +640,10 @@
633
  "Rep.",
634
  "Rev",
635
  "Rev.",
 
636
  "Room",
637
  "S",
 
638
  "S.C.",
639
  "Sen",
640
  "Sen.",
@@ -650,12 +659,14 @@
650
  "She\u2019s",
651
  "Short",
652
  "Should",
 
653
  "Small",
654
  "Somethin",
655
  "Somethin'",
656
  "Somethin\u2019",
657
  "South Carolina",
658
  "Soy",
 
659
  "Spiced",
660
  "St",
661
  "St.",
@@ -813,6 +824,7 @@
813
  "ado",
814
  "afe",
815
  "aff",
 
816
  "ai",
817
  "ak",
818
  "ak.",
@@ -860,6 +872,7 @@
860
  "a\u00e7a\u00ed",
861
  "b",
862
  "b.",
 
863
  "base",
864
  "bean",
865
  "because",
@@ -898,6 +911,7 @@
898
  "calif",
899
  "calif.",
900
  "can",
 
901
  "cappuccino",
902
  "cappuchino",
903
  "caramel",
@@ -948,6 +962,7 @@
948
  "crumble",
949
  "crunch",
950
  "ct.",
 
951
  "customized",
952
  "cuz",
953
  "c\u2019m",
@@ -1050,10 +1065,12 @@
1050
  "foam",
1051
  "foamy",
1052
  "fog",
 
1053
  "frappe",
1054
  "frappeccino",
1055
  "frappuccino",
1056
  "frappuchino",
 
1057
  "free",
1058
  "french",
1059
  "fresher",
@@ -1220,6 +1237,7 @@
1220
  "let\u2019s",
1221
  "lif",
1222
  "light",
 
1223
  "ll",
1224
  "ll.",
1225
  "lla",
@@ -1252,6 +1270,7 @@
1252
  "md",
1253
  "md.",
1254
  "med",
 
1255
  "medium",
1256
  "mega",
1257
  "mel",
@@ -1437,6 +1456,7 @@
1437
  "pump quantity",
1438
  "pumpkin",
1439
  "pumps",
 
1440
  "q",
1441
  "q.",
1442
  "quad",
@@ -1452,6 +1472,7 @@
1452
  "refreshers",
1453
  "rep",
1454
  "rep.",
 
1455
  "rev",
1456
  "rev.",
1457
  "rew",
@@ -1474,6 +1495,7 @@
1474
  "rup",
1475
  "rus",
1476
  "s",
 
1477
  "s's",
1478
  "s.",
1479
  "s.c.",
@@ -1567,6 +1589,7 @@
1567
  "this\u2019s",
1568
  "those",
1569
  "three",
 
1570
  "to",
1571
  "toasted",
1572
  "toffee",
 
346
  "Colo",
347
  "Colo.",
348
  "Colorado",
349
+ "Con",
350
  "Conn",
351
  "Conn.",
352
  "Connecticut",
 
399
  "Florida",
400
  "Foamy",
401
  "Fog",
402
+ "Four",
403
  "Frappe",
404
  "Frappeccino",
405
  "Frappuccino",
406
+ "Frappucino",
407
  "Fresher",
408
  "G",
409
  "Ga",
 
435
  "He's",
436
  "He\u2019s",
437
  "Hi",
438
+ "Honey",
439
  "Hot",
440
  "How",
441
  "How's",
 
509
  "Ltd.",
510
  "M",
511
  "Ma'am",
512
+ "Macchiato",
513
  "Mango",
514
  "Mar",
515
  "Mar.",
 
613
  "P",
614
  "Pa",
615
  "Pa.",
616
+ "Panna",
617
  "Paradise",
618
  "Passion",
619
  "Peach",
 
629
  "Praline",
630
  "Prof",
631
  "Prof.",
632
+ "Pump",
633
  "Pumpkin",
634
  "R",
635
  "ROOT",
 
640
  "Rep.",
641
  "Rev",
642
  "Rev.",
643
+ "Ristretto",
644
  "Room",
645
  "S",
646
+ "S'mores",
647
  "S.C.",
648
  "Sen",
649
  "Sen.",
 
659
  "She\u2019s",
660
  "Short",
661
  "Should",
662
+ "Skinny",
663
  "Small",
664
  "Somethin",
665
  "Somethin'",
666
  "Somethin\u2019",
667
  "South Carolina",
668
  "Soy",
669
+ "Spice",
670
  "Spiced",
671
  "St",
672
  "St.",
 
824
  "ado",
825
  "afe",
826
  "aff",
827
+ "affagato",
828
  "ai",
829
  "ak",
830
  "ak.",
 
872
  "a\u00e7a\u00ed",
873
  "b",
874
  "b.",
875
+ "ball",
876
  "base",
877
  "bean",
878
  "because",
 
911
  "calif",
912
  "calif.",
913
  "can",
914
+ "cap",
915
  "cappuccino",
916
  "cappuchino",
917
  "caramel",
 
962
  "crumble",
963
  "crunch",
964
  "ct.",
965
+ "cup",
966
  "customized",
967
  "cuz",
968
  "c\u2019m",
 
1065
  "foam",
1066
  "foamy",
1067
  "fog",
1068
+ "four",
1069
  "frappe",
1070
  "frappeccino",
1071
  "frappuccino",
1072
  "frappuchino",
1073
+ "frappucino",
1074
  "free",
1075
  "french",
1076
  "fresher",
 
1237
  "let\u2019s",
1238
  "lif",
1239
  "light",
1240
+ "lightly",
1241
  "ll",
1242
  "ll.",
1243
  "lla",
 
1270
  "md",
1271
  "md.",
1272
  "med",
1273
+ "medicine",
1274
  "medium",
1275
  "mega",
1276
  "mel",
 
1456
  "pump quantity",
1457
  "pumpkin",
1458
  "pumps",
1459
+ "pup",
1460
  "q",
1461
  "q.",
1462
  "quad",
 
1472
  "refreshers",
1473
  "rep",
1474
  "rep.",
1475
+ "res",
1476
  "rev",
1477
  "rev.",
1478
  "rew",
 
1495
  "rup",
1496
  "rus",
1497
  "s",
1498
+ "s'mores",
1499
  "s's",
1500
  "s.",
1501
  "s.c.",
 
1589
  "this\u2019s",
1590
  "those",
1591
  "three",
1592
+ "tly",
1593
  "to",
1594
  "toasted",
1595
  "toffee",