adrianeboyd committed on
Commit
00dfd7d
1 Parent(s): 50add8c

Update spaCy pipeline

Browse files
README.md CHANGED
@@ -71,8 +71,8 @@ Korean pipeline optimized for CPU. Components: tok2vec, tagger, morphologizer, p
71
  | Feature | Description |
72
  | --- | --- |
73
  | **Name** | `ko_core_news_md` |
74
- | **Version** | `3.6.0` |
75
- | **spaCy** | `>=3.6.0,<3.7.0` |
76
  | **Default Pipeline** | `tok2vec`, `tagger`, `morphologizer`, `parser`, `lemmatizer`, `attribute_ruler`, `ner` |
77
  | **Components** | `tok2vec`, `tagger`, `morphologizer`, `parser`, `lemmatizer`, `senter`, `attribute_ruler`, `ner` |
78
  | **Vectors** | floret (50000, 300) |
 
71
  | Feature | Description |
72
  | --- | --- |
73
  | **Name** | `ko_core_news_md` |
74
+ | **Version** | `3.7.0` |
75
+ | **spaCy** | `>=3.7.0,<3.8.0` |
76
  | **Default Pipeline** | `tok2vec`, `tagger`, `morphologizer`, `parser`, `lemmatizer`, `attribute_ruler`, `ner` |
77
  | **Components** | `tok2vec`, `tagger`, `morphologizer`, `parser`, `lemmatizer`, `senter`, `attribute_ruler`, `ner` |
78
  | **Vectors** | floret (50000, 300) |
accuracy.json CHANGED
@@ -158,7 +158,7 @@
158
  }
159
  },
160
  "lemma_acc": 0.8994244348,
161
- "speed": 7769.6433830297,
162
  "ents_p": 0.8497178497,
163
  "ents_r": 0.8084775698,
164
  "ents_f": 0.8285848749,
 
158
  }
159
  },
160
  "lemma_acc": 0.8994244348,
161
+ "speed": 7383.8635768128,
162
  "ents_p": 0.8497178497,
163
  "ents_r": 0.8084775698,
164
  "ents_f": 0.8285848749,
config.cfg CHANGED
@@ -17,6 +17,7 @@ after_creation = null
17
  after_pipeline_creation = null
18
  batch_size = 256
19
  tokenizer = {"@tokenizers":"spacy.Tokenizer.v1"}
 
20
 
21
  [components]
22
 
 
17
  after_pipeline_creation = null
18
  batch_size = 256
19
  tokenizer = {"@tokenizers":"spacy.Tokenizer.v1"}
20
+ vectors = {"@vectors":"spacy.Vectors.v1"}
21
 
22
  [components]
23
 
ko_core_news_md-any-py3-none-any.whl CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5ed68cf208e6999d8e0e781c72a03aad996462ff21ffc7b853da5e2680a9f067
3
- size 69046245
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:97565293b1916eb20a47ec9bc96ee58aa8c334787d7a30b0efbea63ba6205165
3
+ size 69046261
meta.json CHANGED
@@ -1,14 +1,14 @@
1
  {
2
  "lang":"ko",
3
  "name":"core_news_md",
4
- "version":"3.6.0",
5
  "description":"Korean pipeline optimized for CPU. Components: tok2vec, tagger, morphologizer, parser, lemmatizer (trainable_lemmatizer), senter, ner.",
6
  "author":"Explosion",
7
  "email":"contact@explosion.ai",
8
  "url":"https://explosion.ai",
9
  "license":"CC BY-SA 4.0",
10
- "spacy_version":">=3.6.0,<3.7.0",
11
- "spacy_git_version":"cb4fdc83e",
12
  "vectors":{
13
  "width":300,
14
  "vectors":50000,
@@ -2241,7 +2241,7 @@
2241
  }
2242
  },
2243
  "lemma_acc":0.8994244348,
2244
- "speed":7769.6433830297,
2245
  "ents_p":0.8497178497,
2246
  "ents_r":0.8084775698,
2247
  "ents_f":0.8285848749,
 
1
  {
2
  "lang":"ko",
3
  "name":"core_news_md",
4
+ "version":"3.7.0",
5
  "description":"Korean pipeline optimized for CPU. Components: tok2vec, tagger, morphologizer, parser, lemmatizer (trainable_lemmatizer), senter, ner.",
6
  "author":"Explosion",
7
  "email":"contact@explosion.ai",
8
  "url":"https://explosion.ai",
9
  "license":"CC BY-SA 4.0",
10
+ "spacy_version":">=3.7.0,<3.8.0",
11
+ "spacy_git_version":"6b4f77441",
12
  "vectors":{
13
  "width":300,
14
  "vectors":50000,
 
2241
  }
2242
  },
2243
  "lemma_acc":0.8994244348,
2244
+ "speed":7383.8635768128,
2245
  "ents_p":0.8497178497,
2246
  "ents_r":0.8084775698,
2247
  "ents_f":0.8285848749,
vocab/vectors.cfg CHANGED
@@ -5,5 +5,6 @@
5
  "hash_count":2,
6
  "hash_seed":2166136261,
7
  "bow":"<",
8
- "eow":">"
 
9
  }
 
5
  "hash_count":2,
6
  "hash_seed":2166136261,
7
  "bow":"<",
8
+ "eow":">",
9
+ "attr":65
10
  }