Ybhav14 committed on
Commit
f44250d
1 Parent(s): ff1bf07

Update spaCy pipeline

Browse files
README.md CHANGED
@@ -13,22 +13,22 @@ model-index:
13
  metrics:
14
  - name: NER Precision
15
  type: precision
16
- value: 0.9918793503
17
  - name: NER Recall
18
  type: recall
19
- value: 0.9965034965
20
  - name: NER F Score
21
  type: f_score
22
- value: 0.9941860465
23
  ---
24
  | Feature | Description |
25
  | --- | --- |
26
  | **Name** | `en_Spacy_Custom_ner2` |
27
  | **Version** | `0.0.0` |
28
- | **spaCy** | `>=3.5.3,<3.6.0` |
29
  | **Default Pipeline** | `tok2vec`, `ner` |
30
  | **Components** | `tok2vec`, `ner` |
31
- | **Vectors** | 514157 keys, 514157 unique vectors (300 dimensions) |
32
  | **Sources** | n/a |
33
  | **License** | n/a |
34
  | **Author** | [n/a]() |
@@ -37,11 +37,11 @@ model-index:
37
 
38
  <details>
39
 
40
- <summary>View label scheme (16 labels for 1 components)</summary>
41
 
42
  | Component | Labels |
43
  | --- | --- |
44
- | **`ner`** | `AGENT_FALLBACK`, `BOOK`, `COMODITY`, `CONTAINER COUNT`, `CONTAINER SIZE`, `CONTAINER SIZE-COUNT`, `DESTINATION`, `ENQUIRY`, `HELP`, `INCOTERM`, `KYC`, `ORIGIN`, `SEARCH RATES`, `SHIP`, `SHIPMENT TYPE`, `WELCOME_MSG` |
45
 
46
  </details>
47
 
@@ -49,8 +49,8 @@ model-index:
49
 
50
  | Type | Score |
51
  | --- | --- |
52
- | `ENTS_F` | 99.42 |
53
- | `ENTS_P` | 99.19 |
54
- | `ENTS_R` | 99.65 |
55
- | `TOK2VEC_LOSS` | 1794.25 |
56
- | `NER_LOSS` | 53209.43 |
 
13
  metrics:
14
  - name: NER Precision
15
  type: precision
16
+ value: 0.9907894737
17
  - name: NER Recall
18
  type: recall
19
+ value: 0.996031746
20
  - name: NER F Score
21
  type: f_score
22
+ value: 0.9934036939
23
  ---
24
  | Feature | Description |
25
  | --- | --- |
26
  | **Name** | `en_Spacy_Custom_ner2` |
27
  | **Version** | `0.0.0` |
28
+ | **spaCy** | `>=3.7.2,<3.8.0` |
29
  | **Default Pipeline** | `tok2vec`, `ner` |
30
  | **Components** | `tok2vec`, `ner` |
31
+ | **Vectors** | 0 keys, 0 unique vectors (0 dimensions) |
32
  | **Sources** | n/a |
33
  | **License** | n/a |
34
  | **Author** | [n/a]() |
 
37
 
38
  <details>
39
 
40
+ <summary>View label scheme (14 labels for 1 components)</summary>
41
 
42
  | Component | Labels |
43
  | --- | --- |
44
+ | **`ner`** | `BOOK`, `COMODITY`, `CONTAINER COUNT`, `CONTAINER SIZE`, `CONTAINER SIZE-COUNT`, `DESTINATION`, `ENQUIRY`, `HELP`, `INCOTERM`, `KYC`, `ORIGIN`, `SEARCH RATES`, `SHIP`, `SHIPMENT TYPE` |
45
 
46
  </details>
47
 
 
49
 
50
  | Type | Score |
51
  | --- | --- |
52
+ | `ENTS_F` | 99.34 |
53
+ | `ENTS_P` | 99.08 |
54
+ | `ENTS_R` | 99.60 |
55
+ | `TOK2VEC_LOSS` | 7290.77 |
56
+ | `NER_LOSS` | 70900.21 |
config.cfg CHANGED
@@ -1,7 +1,7 @@
1
  [paths]
2
  train = "./training_data.spacy"
3
  dev = "./training_data.spacy"
4
- vectors = "en_core_web_lg"
5
  init_tok2vec = null
6
 
7
  [system]
@@ -11,12 +11,13 @@ seed = 0
11
  [nlp]
12
  lang = "en"
13
  pipeline = ["tok2vec","ner"]
14
- batch_size = 100
15
  disabled = []
16
  before_creation = null
17
  after_creation = null
18
  after_pipeline_creation = null
19
  tokenizer = {"@tokenizers":"spacy.Tokenizer.v1"}
 
20
 
21
  [components]
22
 
@@ -52,12 +53,12 @@ factory = "tok2vec"
52
  width = ${components.tok2vec.model.encode.width}
53
  attrs = ["NORM","PREFIX","SUFFIX","SHAPE"]
54
  rows = [5000,1000,2500,2500]
55
- include_static_vectors = true
56
 
57
  [components.tok2vec.model.encode]
58
  @architectures = "spacy.MaxoutWindowEncoder.v2"
59
- width = 256
60
- depth = 8
61
  window_size = 1
62
  maxout_pieces = 3
63
 
 
1
  [paths]
2
  train = "./training_data.spacy"
3
  dev = "./training_data.spacy"
4
+ vectors = null
5
  init_tok2vec = null
6
 
7
  [system]
 
11
  [nlp]
12
  lang = "en"
13
  pipeline = ["tok2vec","ner"]
14
+ batch_size = 1000
15
  disabled = []
16
  before_creation = null
17
  after_creation = null
18
  after_pipeline_creation = null
19
  tokenizer = {"@tokenizers":"spacy.Tokenizer.v1"}
20
+ vectors = {"@vectors":"spacy.Vectors.v1"}
21
 
22
  [components]
23
 
 
53
  width = ${components.tok2vec.model.encode.width}
54
  attrs = ["NORM","PREFIX","SUFFIX","SHAPE"]
55
  rows = [5000,1000,2500,2500]
56
+ include_static_vectors = false
57
 
58
  [components.tok2vec.model.encode]
59
  @architectures = "spacy.MaxoutWindowEncoder.v2"
60
+ width = 96
61
+ depth = 4
62
  window_size = 1
63
  maxout_pieces = 3
64
 
en_Spacy_Custom_ner2-any-py3-none-any.whl CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f8302181463c63c9c2a84b1a5857d8cbd80d5bed66594f0961b8c62fa5802db9
3
- size 606745646
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:55064fcd52899715cf7a340a538072dad8f74dcf882ce630db03851860b2bc73
3
+ size 5688225
meta.json CHANGED
@@ -7,20 +7,19 @@
7
  "email":"",
8
  "url":"",
9
  "license":"",
10
- "spacy_version":">=3.5.3,<3.6.0",
11
- "spacy_git_version":"Unknown",
12
  "vectors":{
13
- "width":300,
14
- "vectors":514157,
15
- "keys":514157,
16
- "name":"en_vectors"
17
  },
18
  "labels":{
19
  "tok2vec":[
20
 
21
  ],
22
  "ner":[
23
- "AGENT_FALLBACK",
24
  "BOOK",
25
  "COMODITY",
26
  "CONTAINER COUNT",
@@ -34,8 +33,7 @@
34
  "ORIGIN",
35
  "SEARCH RATES",
36
  "SHIP",
37
- "SHIPMENT TYPE",
38
- "WELCOME_MSG"
39
  ]
40
  },
41
  "pipeline":[
@@ -50,24 +48,29 @@
50
 
51
  ],
52
  "performance":{
53
- "ents_f":0.9941860465,
54
- "ents_p":0.9918793503,
55
- "ents_r":0.9965034965,
56
  "ents_per_type":{
57
- "SEARCH RATES":{
58
  "p":1.0,
59
  "r":1.0,
60
  "f":1.0
61
  },
62
- "ORIGIN":{
 
 
 
 
 
63
  "p":1.0,
64
  "r":1.0,
65
  "f":1.0
66
  },
67
- "DESTINATION":{
68
- "p":0.9903846154,
69
  "r":1.0,
70
- "f":0.9951690821
71
  },
72
  "BOOK":{
73
  "p":1.0,
@@ -75,24 +78,19 @@
75
  "f":1.0
76
  },
77
  "SHIP":{
78
- "p":0.987804878,
79
  "r":1.0,
80
- "f":0.9938650307
81
  },
82
  "CONTAINER SIZE":{
83
- "p":0.9905660377,
84
- "r":0.9905660377,
85
- "f":0.9905660377
86
- },
87
- "SHIPMENT TYPE":{
88
  "p":1.0,
89
- "r":1.0,
90
- "f":1.0
91
  },
92
  "ENQUIRY":{
93
- "p":0.8823529412,
94
  "r":1.0,
95
- "f":0.9375
96
  },
97
  "HELP":{
98
  "p":1.0,
@@ -110,9 +108,9 @@
110
  "f":1.0
111
  },
112
  "COMODITY":{
113
- "p":0.9523809524,
114
- "r":0.9523809524,
115
- "f":0.9523809524
116
  },
117
  "CONTAINER COUNT":{
118
  "p":1.0,
@@ -120,23 +118,13 @@
120
  "f":1.0
121
  },
122
  "CONTAINER SIZE-COUNT":{
123
- "p":1.0,
124
- "r":0.9615384615,
125
- "f":0.9803921569
126
- },
127
- "AGENT_FALLBACK":{
128
- "p":1.0,
129
  "r":1.0,
130
- "f":1.0
131
- },
132
- "WELCOME_MSG":{
133
- "p":1.0,
134
- "r":1.0,
135
- "f":1.0
136
  }
137
  },
138
- "tok2vec_loss":17.9424619099,
139
- "ner_loss":532.0943451776
140
  },
141
  "requirements":[
142
 
 
7
  "email":"",
8
  "url":"",
9
  "license":"",
10
+ "spacy_version":">=3.7.2,<3.8.0",
11
+ "spacy_git_version":"a89eae928",
12
  "vectors":{
13
+ "width":0,
14
+ "vectors":0,
15
+ "keys":0,
16
+ "name":null
17
  },
18
  "labels":{
19
  "tok2vec":[
20
 
21
  ],
22
  "ner":[
 
23
  "BOOK",
24
  "COMODITY",
25
  "CONTAINER COUNT",
 
33
  "ORIGIN",
34
  "SEARCH RATES",
35
  "SHIP",
36
+ "SHIPMENT TYPE"
 
37
  ]
38
  },
39
  "pipeline":[
 
48
 
49
  ],
50
  "performance":{
51
+ "ents_f":0.9934036939,
52
+ "ents_p":0.9907894737,
53
+ "ents_r":0.996031746,
54
  "ents_per_type":{
55
+ "ORIGIN":{
56
  "p":1.0,
57
  "r":1.0,
58
  "f":1.0
59
  },
60
+ "DESTINATION":{
61
+ "p":0.995,
62
+ "r":0.995,
63
+ "f":0.995
64
+ },
65
+ "SHIPMENT TYPE":{
66
  "p":1.0,
67
  "r":1.0,
68
  "f":1.0
69
  },
70
+ "SEARCH RATES":{
71
+ "p":1.0,
72
  "r":1.0,
73
+ "f":1.0
74
  },
75
  "BOOK":{
76
  "p":1.0,
 
78
  "f":1.0
79
  },
80
  "SHIP":{
81
+ "p":0.987654321,
82
  "r":1.0,
83
+ "f":0.9937888199
84
  },
85
  "CONTAINER SIZE":{
 
 
 
 
 
86
  "p":1.0,
87
+ "r":0.9795918367,
88
+ "f":0.9896907216
89
  },
90
  "ENQUIRY":{
91
+ "p":0.875,
92
  "r":1.0,
93
+ "f":0.9333333333
94
  },
95
  "HELP":{
96
  "p":1.0,
 
108
  "f":1.0
109
  },
110
  "COMODITY":{
111
+ "p":0.9130434783,
112
+ "r":1.0,
113
+ "f":0.9545454545
114
  },
115
  "CONTAINER COUNT":{
116
  "p":1.0,
 
118
  "f":1.0
119
  },
120
  "CONTAINER SIZE-COUNT":{
121
+ "p":0.962962963,
 
 
 
 
 
122
  "r":1.0,
123
+ "f":0.9811320755
 
 
 
 
 
124
  }
125
  },
126
+ "tok2vec_loss":72.9077196514,
127
+ "ner_loss":709.0020859699
128
  },
129
  "requirements":[
130
 
ner/model CHANGED
Binary files a/ner/model and b/ner/model differ
 
ner/moves CHANGED
@@ -1 +1 @@
1
- ��moves�{"0":{},"1":{"DESTINATION":321,"ORIGIN":303,"CONTAINER SIZE":188,"WELCOME_MSG":178,"SHIP":81,"AGENT_FALLBACK":79,"SHIPMENT TYPE":58,"CONTAINER SIZE-COUNT":39,"COMODITY":31,"BOOK":28,"ENQUIRY":18,"SEARCH RATES":14,"CONTAINER COUNT":10,"INCOTERM":9,"HELP":8,"KYC":2},"2":{"DESTINATION":321,"ORIGIN":303,"CONTAINER SIZE":188,"WELCOME_MSG":178,"SHIP":81,"AGENT_FALLBACK":79,"SHIPMENT TYPE":58,"CONTAINER SIZE-COUNT":39,"COMODITY":31,"BOOK":28,"ENQUIRY":18,"SEARCH RATES":14,"CONTAINER COUNT":10,"INCOTERM":9,"HELP":8,"KYC":2},"3":{"DESTINATION":321,"ORIGIN":303,"CONTAINER SIZE":188,"WELCOME_MSG":178,"SHIP":81,"AGENT_FALLBACK":79,"SHIPMENT TYPE":58,"CONTAINER SIZE-COUNT":39,"COMODITY":31,"BOOK":28,"ENQUIRY":18,"SEARCH RATES":14,"CONTAINER COUNT":10,"INCOTERM":9,"HELP":8,"KYC":2},"4":{"DESTINATION":321,"ORIGIN":303,"CONTAINER SIZE":188,"WELCOME_MSG":178,"SHIP":81,"AGENT_FALLBACK":79,"SHIPMENT TYPE":58,"CONTAINER SIZE-COUNT":39,"COMODITY":31,"BOOK":28,"ENQUIRY":18,"SEARCH RATES":14,"CONTAINER COUNT":10,"INCOTERM":9,"HELP":8,"KYC":2,"":1},"5":{"":1}}�cfg��neg_key�
 
1
+ ��moves�|{"0":{},"1":{"DESTINATION":313,"ORIGIN":295,"CONTAINER SIZE":174,"SHIP":80,"SHIPMENT TYPE":60,"CONTAINER SIZE-COUNT":39,"COMODITY":31,"BOOK":28,"ENQUIRY":17,"INCOTERM":9,"HELP":8,"CONTAINER COUNT":8,"SEARCH RATES":7,"KYC":2},"2":{"DESTINATION":313,"ORIGIN":295,"CONTAINER SIZE":174,"SHIP":80,"SHIPMENT TYPE":60,"CONTAINER SIZE-COUNT":39,"COMODITY":31,"BOOK":28,"ENQUIRY":17,"INCOTERM":9,"HELP":8,"CONTAINER COUNT":8,"SEARCH RATES":7,"KYC":2},"3":{"DESTINATION":313,"ORIGIN":295,"CONTAINER SIZE":174,"SHIP":80,"SHIPMENT TYPE":60,"CONTAINER SIZE-COUNT":39,"COMODITY":31,"BOOK":28,"ENQUIRY":17,"INCOTERM":9,"HELP":8,"CONTAINER COUNT":8,"SEARCH RATES":7,"KYC":2},"4":{"DESTINATION":313,"ORIGIN":295,"CONTAINER SIZE":174,"SHIP":80,"SHIPMENT TYPE":60,"CONTAINER SIZE-COUNT":39,"COMODITY":31,"BOOK":28,"ENQUIRY":17,"INCOTERM":9,"HELP":8,"CONTAINER COUNT":8,"SEARCH RATES":7,"KYC":2,"":1},"5":{"":1}}�cfg��neg_key�
tok2vec/model CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4e2f3e2fab9f568a5c3e23cbe9aa9f9e7e51da3c44d61ed32c617696964b45eb
3
- size 34434008
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:242b2c12c6efec38ede80c052b45333201ddec15e45ce1ff6f486fc9888e6c8f
3
+ size 6009091
vocab/key2row CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:31566ae010da3d399eb1d930ae142757afd2601034a4be3bdb00d18881c8c06a
3
- size 7066303
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:76be8b528d0075f7aae98d6fa57a6d3c83ae480a8469e668d7b0af968995ac71
3
+ size 1
vocab/strings.json CHANGED
The diff for this file is too large to render. See raw diff
 
vocab/vectors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:234dcf234bfdf01775ae6182715d55eaacfcde8555b189f25440b56d3c39fd5d
3
- size 616988528
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:14772b683e726436d5948ad3fff2b43d036ef2ebbe3458aafed6004e05a40706
3
+ size 128