ljvmiranda921 committed on
Commit
e34b9b9
1 Parent(s): c2f58f2

xx_isl_sigtyp_trf-0.1.0: Update SIGTYP pipeline

Browse files
.gitattributes CHANGED
@@ -38,3 +38,4 @@ tagger/model filter=lfs diff=lfs merge=lfs -text
38
  trainable_lemmatizer/model filter=lfs diff=lfs merge=lfs -text
39
  transformer/model filter=lfs diff=lfs merge=lfs -text
40
  xx_isl_sigtyp_trf-any-py3-none-any.whl filter=lfs diff=lfs merge=lfs -text
 
 
38
  trainable_lemmatizer/model filter=lfs diff=lfs merge=lfs -text
39
  transformer/model filter=lfs diff=lfs merge=lfs -text
40
  xx_isl_sigtyp_trf-any-py3-none-any.whl filter=lfs diff=lfs merge=lfs -text
41
+ morphologizer/model filter=lfs diff=lfs merge=lfs -text
README.md CHANGED
The diff for this file is too large to render. See raw diff
 
config.cfg CHANGED
@@ -10,7 +10,7 @@ seed = 42
10
 
11
  [nlp]
12
  lang = "xx"
13
- pipeline = ["transformer","parser","trainable_lemmatizer","tagger"]
14
  batch_size = 128
15
  disabled = []
16
  before_creation = null
@@ -20,6 +20,24 @@ tokenizer = {"@tokenizers":"spacy.Tokenizer.v1"}
20
 
21
  [components]
22
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
23
  [components.parser]
24
  factory = "parser"
25
  learn_tokens = false
@@ -166,14 +184,17 @@ total_steps = 20000
166
  initial_rate = 0.00005
167
 
168
  [training.score_weights]
169
- dep_uas = 0.17
170
- dep_las = 0.17
171
  dep_las_per_type = null
172
  sents_p = null
173
  sents_r = null
174
  sents_f = 0.0
175
- lemma_acc = 0.33
176
- tag_acc = 0.33
 
 
 
177
 
178
  [pretraining]
179
 
 
10
 
11
  [nlp]
12
  lang = "xx"
13
+ pipeline = ["transformer","parser","trainable_lemmatizer","tagger","morphologizer"]
14
  batch_size = 128
15
  disabled = []
16
  before_creation = null
 
20
 
21
  [components]
22
 
23
+ [components.morphologizer]
24
+ factory = "morphologizer"
25
+ extend = false
26
+ label_smoothing = 0.0
27
+ overwrite = true
28
+ scorer = {"@scorers":"spacy.morphologizer_scorer.v1"}
29
+
30
+ [components.morphologizer.model]
31
+ @architectures = "spacy.Tagger.v2"
32
+ nO = null
33
+ normalize = false
34
+
35
+ [components.morphologizer.model.tok2vec]
36
+ @architectures = "spacy-transformers.TransformerListener.v1"
37
+ grad_factor = 1.0
38
+ pooling = {"@layers":"reduce_mean.v1"}
39
+ upstream = "*"
40
+
41
  [components.parser]
42
  factory = "parser"
43
  learn_tokens = false
 
184
  initial_rate = 0.00005
185
 
186
  [training.score_weights]
187
+ dep_uas = 0.09
188
+ dep_las = 0.09
189
  dep_las_per_type = null
190
  sents_p = null
191
  sents_r = null
192
  sents_f = 0.0
193
+ lemma_acc = 0.17
194
+ tag_acc = 0.17
195
+ pos_acc = 0.25
196
+ morph_acc = 0.25
197
+ morph_per_feat = null
198
 
199
  [pretraining]
200
 
meta.json CHANGED
The diff for this file is too large to render. See raw diff
 
morphologizer/cfg ADDED
The diff for this file is too large to render. See raw diff
 
morphologizer/model ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:453994e50d6484f39261f82b6376808c100990b5fc8d328618f2fac111df88d5
3
+ size 5974245
parser/model CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:69c30acd70be3434bc3ce5382afdb854fd1e8ec29b332cf4da3df81b32c6eb20
3
  size 1175559
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:70eb85ad39e07714702e6fead64df823820ba9667a356e754a4659ab9ac54ef8
3
  size 1175559
tagger/model CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:fe4bf05b750133bb11e2c9e16104b40558df40c334d86c43dd65a29564f40466
3
  size 15826673
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:88c47e0973dc30f6629e22c0f805bb31ebc1e265b60cb876a46b669d8c0ac8db
3
  size 15826673
trainable_lemmatizer/model CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ffe2fa5e33ba0c005fe4af5c8616ddf4dd7f7e9a37a6ffd947c86410c7bfc516
3
  size 7952113
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:185230d3e6972749a373bd191beb01be7981f1adade2e872c9ef5a1e5e94830d
3
  size 7952113
transformer/model CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d4b360d29f4c09cff9fa7e22cff4704e04f11c0953048e72197b8a87f495b20f
3
  size 509231398
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:70e50291f7bf15b3e46763a6f4ffc4b0b2cd338573d94069770cf85863ef91cd
3
  size 509231398
vocab/strings.json CHANGED
The diff for this file is too large to render. See raw diff
 
xx_isl_sigtyp_trf-any-py3-none-any.whl CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7b1b9f1d7c92968dd6bb61ffdc809a48b47d82941ccb19033f6fe1f732e423b9
3
- size 489611257
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ffaf69231647aeb0ca1845e0f95b868f5460a6735d8a9b909e81bfaf947145a6
3
+ size 495232504