adrianeboyd committed on
Commit
e993b45
1 Parent(s): 4fa16d3

Update spaCy pipeline

Browse files
README.md CHANGED
@@ -71,8 +71,8 @@ Korean pipeline optimized for CPU. Components: tok2vec, tagger, morphologizer, p
71
  | Feature | Description |
72
  | --- | --- |
73
  | **Name** | `ko_core_news_sm` |
74
- | **Version** | `3.5.0` |
75
- | **spaCy** | `>=3.5.0,<3.6.0` |
76
  | **Default Pipeline** | `tok2vec`, `tagger`, `morphologizer`, `parser`, `lemmatizer`, `attribute_ruler`, `ner` |
77
  | **Components** | `tok2vec`, `tagger`, `morphologizer`, `parser`, `lemmatizer`, `senter`, `attribute_ruler`, `ner` |
78
  | **Vectors** | 0 keys, 0 unique vectors (0 dimensions) |
 
71
  | Feature | Description |
72
  | --- | --- |
73
  | **Name** | `ko_core_news_sm` |
74
+ | **Version** | `3.6.0` |
75
+ | **spaCy** | `>=3.6.0,<3.7.0` |
76
  | **Default Pipeline** | `tok2vec`, `tagger`, `morphologizer`, `parser`, `lemmatizer`, `attribute_ruler`, `ner` |
77
  | **Components** | `tok2vec`, `tagger`, `morphologizer`, `parser`, `lemmatizer`, `senter`, `attribute_ruler`, `ner` |
78
  | **Vectors** | 0 keys, 0 unique vectors (0 dimensions) |
accuracy.json CHANGED
@@ -158,7 +158,7 @@
158
  }
159
  },
160
  "lemma_acc": 0.8356969086,
161
- "speed": 11675.4379543036,
162
  "ents_p": 0.7704418068,
163
  "ents_r": 0.6603320381,
164
  "ents_f": 0.7111499981,
 
158
  }
159
  },
160
  "lemma_acc": 0.8356969086,
161
+ "speed": 12541.6084143237,
162
  "ents_p": 0.7704418068,
163
  "ents_r": 0.6603320381,
164
  "ents_f": 0.7111499981,
config.cfg CHANGED
@@ -46,6 +46,7 @@ upstream = "tok2vec"
46
  [components.morphologizer]
47
  factory = "morphologizer"
48
  extend = false
 
49
  overwrite = true
50
  scorer = {"@scorers":"spacy.morphologizer_scorer.v1"}
51
 
@@ -143,6 +144,7 @@ maxout_pieces = 2
143
 
144
  [components.tagger]
145
  factory = "tagger"
 
146
  neg_prefix = "!"
147
  overwrite = false
148
  scorer = {"@scorers":"spacy.tagger_scorer.v1"}
 
46
  [components.morphologizer]
47
  factory = "morphologizer"
48
  extend = false
49
+ label_smoothing = 0.0
50
  overwrite = true
51
  scorer = {"@scorers":"spacy.morphologizer_scorer.v1"}
52
 
 
144
 
145
  [components.tagger]
146
  factory = "tagger"
147
+ label_smoothing = 0.0
148
  neg_prefix = "!"
149
  overwrite = false
150
  scorer = {"@scorers":"spacy.tagger_scorer.v1"}
ko_core_news_sm-any-py3-none-any.whl CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:383ce09dc37ee707d8db0e9321e9b081749000ab4250369738f62cbb79265b63
3
- size 14700533
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d30c7b10fdb310787f9e09f633aa1239e0e46cbe120b635f2a572c09ea635e57
3
+ size 14700581
meta.json CHANGED
@@ -1,14 +1,14 @@
1
  {
2
  "lang":"ko",
3
  "name":"core_news_sm",
4
- "version":"3.5.0",
5
  "description":"Korean pipeline optimized for CPU. Components: tok2vec, tagger, morphologizer, parser, lemmatizer (trainable_lemmatizer), senter, ner.",
6
  "author":"Explosion",
7
  "email":"contact@explosion.ai",
8
  "url":"https://explosion.ai",
9
  "license":"CC BY-SA 4.0",
10
- "spacy_version":">=3.5.0,<3.6.0",
11
- "spacy_git_version":"9e0322de1",
12
  "vectors":{
13
  "width":0,
14
  "vectors":0,
@@ -2241,7 +2241,7 @@
2241
  }
2242
  },
2243
  "lemma_acc":0.8356969086,
2244
- "speed":11675.4379543036,
2245
  "ents_p":0.7704418068,
2246
  "ents_r":0.6603320381,
2247
  "ents_f":0.7111499981,
 
1
  {
2
  "lang":"ko",
3
  "name":"core_news_sm",
4
+ "version":"3.6.0",
5
  "description":"Korean pipeline optimized for CPU. Components: tok2vec, tagger, morphologizer, parser, lemmatizer (trainable_lemmatizer), senter, ner.",
6
  "author":"Explosion",
7
  "email":"contact@explosion.ai",
8
  "url":"https://explosion.ai",
9
  "license":"CC BY-SA 4.0",
10
+ "spacy_version":">=3.6.0,<3.7.0",
11
+ "spacy_git_version":"cb4fdc83e",
12
  "vectors":{
13
  "width":0,
14
  "vectors":0,
 
2241
  }
2242
  },
2243
  "lemma_acc":0.8356969086,
2244
+ "speed":12541.6084143237,
2245
  "ents_p":0.7704418068,
2246
  "ents_r":0.6603320381,
2247
  "ents_f":0.7111499981,
morphologizer/cfg CHANGED
@@ -1,5 +1,6 @@
1
  {
2
  "extend":false,
 
3
  "labels_morph":{
4
  "POS=CCONJ":"",
5
  "POS=ADV":"",
 
1
  {
2
  "extend":false,
3
+ "label_smoothing":0.0,
4
  "labels_morph":{
5
  "POS=CCONJ":"",
6
  "POS=ADV":"",
tagger/cfg CHANGED
@@ -1,4 +1,5 @@
1
  {
 
2
  "labels":[
3
  "_SP",
4
  "ecs",
 
1
  {
2
+ "label_smoothing":0.0,
3
  "labels":[
4
  "_SP",
5
  "ecs",