Commit
•
ff9acd3
1
Parent(s):
500cb7d
Update spaCy pipeline
Browse files
- README.md +2 -2
- accuracy.json +9 -9
- config.cfg +1 -0
- fi_core_news_lg-any-py3-none-any.whl +2 -2
- meta.json +12 -12
- vocab/vectors.cfg +2 -1
README.md
CHANGED
@@ -78,8 +78,8 @@ Finnish pipeline optimized for CPU. Components: tok2vec, tagger, morphologizer,
|
|
78 |
| Feature | Description |
|
79 |
| --- | --- |
|
80 |
| **Name** | `fi_core_news_lg` |
|
81 |
-
| **Version** | `3.
|
82 |
-
| **spaCy** | `>=3.
|
83 |
| **Default Pipeline** | `tok2vec`, `tagger`, `morphologizer`, `parser`, `lemmatizer`, `attribute_ruler`, `ner` |
|
84 |
| **Components** | `tok2vec`, `tagger`, `morphologizer`, `parser`, `lemmatizer`, `senter`, `attribute_ruler`, `ner` |
|
85 |
| **Vectors** | floret (200000, 300) |
|
|
|
78 |
| Feature | Description |
|
79 |
| --- | --- |
|
80 |
| **Name** | `fi_core_news_lg` |
|
81 |
+
| **Version** | `3.7.0` |
|
82 |
+
| **spaCy** | `>=3.7.0,<3.8.0` |
|
83 |
| **Default Pipeline** | `tok2vec`, `tagger`, `morphologizer`, `parser`, `lemmatizer`, `attribute_ruler`, `ner` |
|
84 |
| **Components** | `tok2vec`, `tagger`, `morphologizer`, `parser`, `lemmatizer`, `senter`, `attribute_ruler`, `ner` |
|
85 |
| **Vectors** | floret (200000, 300) |
|
accuracy.json
CHANGED
@@ -378,20 +378,20 @@
|
|
378 |
"r": 0.8258196721,
|
379 |
"f": 0.83436853
|
380 |
},
|
381 |
-
"
|
382 |
-
"p": 0.
|
383 |
-
"r": 0.
|
384 |
-
"f": 0.
|
385 |
},
|
386 |
"ORG": {
|
387 |
"p": 0.7785388128,
|
388 |
"r": 0.7875288684,
|
389 |
"f": 0.7830080367
|
390 |
},
|
391 |
-
"
|
392 |
-
"p": 0.
|
393 |
-
"r": 0.
|
394 |
-
"f": 0.
|
395 |
},
|
396 |
"PRODUCT": {
|
397 |
"p": 0.7095435685,
|
@@ -454,5 +454,5 @@
|
|
454 |
"f": 0.8275862069
|
455 |
}
|
456 |
},
|
457 |
-
"speed":
|
458 |
}
|
|
|
378 |
"r": 0.8258196721,
|
379 |
"f": 0.83436853
|
380 |
},
|
381 |
+
"WORK_OF_ART": {
|
382 |
+
"p": 0.6363636364,
|
383 |
+
"r": 0.375,
|
384 |
+
"f": 0.4719101124
|
385 |
},
|
386 |
"ORG": {
|
387 |
"p": 0.7785388128,
|
388 |
"r": 0.7875288684,
|
389 |
"f": 0.7830080367
|
390 |
},
|
391 |
+
"CARDINAL": {
|
392 |
+
"p": 0.9365079365,
|
393 |
+
"r": 0.9407744875,
|
394 |
+
"f": 0.9386363636
|
395 |
},
|
396 |
"PRODUCT": {
|
397 |
"p": 0.7095435685,
|
|
|
454 |
"f": 0.8275862069
|
455 |
}
|
456 |
},
|
457 |
+
"speed": 5922.5471697188
|
458 |
}
|
config.cfg
CHANGED
@@ -17,6 +17,7 @@ after_creation = null
|
|
17 |
after_pipeline_creation = null
|
18 |
batch_size = 256
|
19 |
tokenizer = {"@tokenizers":"spacy.Tokenizer.v1"}
|
|
|
20 |
|
21 |
[components]
|
22 |
|
|
|
17 |
after_pipeline_creation = null
|
18 |
batch_size = 256
|
19 |
tokenizer = {"@tokenizers":"spacy.Tokenizer.v1"}
|
20 |
+
vectors = {"@vectors":"spacy.Vectors.v1"}
|
21 |
|
22 |
[components]
|
23 |
|
fi_core_news_lg-any-py3-none-any.whl
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6827aab0edbafec720b8dfe358e11c32409d3e2b4f827faf45dbf9267f6bb345
|
3 |
+
size 230768276
|
meta.json
CHANGED
@@ -1,14 +1,14 @@
|
|
1 |
{
|
2 |
"lang":"fi",
|
3 |
"name":"core_news_lg",
|
4 |
-
"version":"3.
|
5 |
"description":"Finnish pipeline optimized for CPU. Components: tok2vec, tagger, morphologizer, parser, lemmatizer (trainable_lemmatizer), senter, ner.",
|
6 |
"author":"Explosion",
|
7 |
"email":"contact@explosion.ai",
|
8 |
"url":"https://explosion.ai",
|
9 |
"license":"CC BY-SA 4.0",
|
10 |
-
"spacy_version":">=3.
|
11 |
-
"spacy_git_version":"
|
12 |
"vectors":{
|
13 |
"width":300,
|
14 |
"vectors":200000,
|
@@ -2578,20 +2578,20 @@
|
|
2578 |
"r":0.8258196721,
|
2579 |
"f":0.83436853
|
2580 |
},
|
2581 |
-
"
|
2582 |
-
"p":0.
|
2583 |
-
"r":0.
|
2584 |
-
"f":0.
|
2585 |
},
|
2586 |
"ORG":{
|
2587 |
"p":0.7785388128,
|
2588 |
"r":0.7875288684,
|
2589 |
"f":0.7830080367
|
2590 |
},
|
2591 |
-
"
|
2592 |
-
"p":0.
|
2593 |
-
"r":0.
|
2594 |
-
"f":0.
|
2595 |
},
|
2596 |
"PRODUCT":{
|
2597 |
"p":0.7095435685,
|
@@ -2654,7 +2654,7 @@
|
|
2654 |
"f":0.8275862069
|
2655 |
}
|
2656 |
},
|
2657 |
-
"speed":
|
2658 |
},
|
2659 |
"sources":[
|
2660 |
{
|
|
|
1 |
{
|
2 |
"lang":"fi",
|
3 |
"name":"core_news_lg",
|
4 |
+
"version":"3.7.0",
|
5 |
"description":"Finnish pipeline optimized for CPU. Components: tok2vec, tagger, morphologizer, parser, lemmatizer (trainable_lemmatizer), senter, ner.",
|
6 |
"author":"Explosion",
|
7 |
"email":"contact@explosion.ai",
|
8 |
"url":"https://explosion.ai",
|
9 |
"license":"CC BY-SA 4.0",
|
10 |
+
"spacy_version":">=3.7.0,<3.8.0",
|
11 |
+
"spacy_git_version":"6b4f77441",
|
12 |
"vectors":{
|
13 |
"width":300,
|
14 |
"vectors":200000,
|
|
|
2578 |
"r":0.8258196721,
|
2579 |
"f":0.83436853
|
2580 |
},
|
2581 |
+
"WORK_OF_ART":{
|
2582 |
+
"p":0.6363636364,
|
2583 |
+
"r":0.375,
|
2584 |
+
"f":0.4719101124
|
2585 |
},
|
2586 |
"ORG":{
|
2587 |
"p":0.7785388128,
|
2588 |
"r":0.7875288684,
|
2589 |
"f":0.7830080367
|
2590 |
},
|
2591 |
+
"CARDINAL":{
|
2592 |
+
"p":0.9365079365,
|
2593 |
+
"r":0.9407744875,
|
2594 |
+
"f":0.9386363636
|
2595 |
},
|
2596 |
"PRODUCT":{
|
2597 |
"p":0.7095435685,
|
|
|
2654 |
"f":0.8275862069
|
2655 |
}
|
2656 |
},
|
2657 |
+
"speed":5922.5471697188
|
2658 |
},
|
2659 |
"sources":[
|
2660 |
{
|
vocab/vectors.cfg
CHANGED
@@ -5,5 +5,6 @@
|
|
5 |
"hash_count":2,
|
6 |
"hash_seed":2166136261,
|
7 |
"bow":"<",
|
8 |
-
"eow":">"
|
|
|
9 |
}
|
|
|
5 |
"hash_count":2,
|
6 |
"hash_seed":2166136261,
|
7 |
"bow":"<",
|
8 |
+
"eow":">",
|
9 |
+
"attr":65
|
10 |
}
|