ljvmiranda921 committed on
Commit
0271b42
1 Parent(s): edbfd20

xx_orv_sigtyp_trf-0.1.0: Update SIGTYP pipeline

Browse files
.gitattributes CHANGED
@@ -39,3 +39,4 @@ trainable_lemmatizer/model filter=lfs diff=lfs merge=lfs -text
39
  trainable_lemmatizer/trees filter=lfs diff=lfs merge=lfs -text
40
  transformer/model filter=lfs diff=lfs merge=lfs -text
41
  xx_orv_sigtyp_trf-any-py3-none-any.whl filter=lfs diff=lfs merge=lfs -text
 
 
39
  trainable_lemmatizer/trees filter=lfs diff=lfs merge=lfs -text
40
  transformer/model filter=lfs diff=lfs merge=lfs -text
41
  xx_orv_sigtyp_trf-any-py3-none-any.whl filter=lfs diff=lfs merge=lfs -text
42
+ morphologizer/model filter=lfs diff=lfs merge=lfs -text
README.md CHANGED
The diff for this file is too large to render. See raw diff
 
config.cfg CHANGED
@@ -10,7 +10,7 @@ seed = 42
10
 
11
  [nlp]
12
  lang = "xx"
13
- pipeline = ["transformer","parser","trainable_lemmatizer","tagger"]
14
  batch_size = 128
15
  disabled = []
16
  before_creation = null
@@ -20,6 +20,24 @@ tokenizer = {"@tokenizers":"spacy.Tokenizer.v1"}
20
 
21
  [components]
22
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
23
  [components.parser]
24
  factory = "parser"
25
  learn_tokens = false
@@ -166,14 +184,17 @@ total_steps = 20000
166
  initial_rate = 0.00005
167
 
168
  [training.score_weights]
169
- dep_uas = 0.17
170
- dep_las = 0.17
171
  dep_las_per_type = null
172
  sents_p = null
173
  sents_r = null
174
  sents_f = 0.0
175
- lemma_acc = 0.33
176
- tag_acc = 0.33
 
 
 
177
 
178
  [pretraining]
179
 
 
10
 
11
  [nlp]
12
  lang = "xx"
13
+ pipeline = ["transformer","parser","trainable_lemmatizer","tagger","morphologizer"]
14
  batch_size = 128
15
  disabled = []
16
  before_creation = null
 
20
 
21
  [components]
22
 
23
+ [components.morphologizer]
24
+ factory = "morphologizer"
25
+ extend = false
26
+ label_smoothing = 0.0
27
+ overwrite = true
28
+ scorer = {"@scorers":"spacy.morphologizer_scorer.v1"}
29
+
30
+ [components.morphologizer.model]
31
+ @architectures = "spacy.Tagger.v2"
32
+ nO = null
33
+ normalize = false
34
+
35
+ [components.morphologizer.model.tok2vec]
36
+ @architectures = "spacy-transformers.TransformerListener.v1"
37
+ grad_factor = 1.0
38
+ pooling = {"@layers":"reduce_mean.v1"}
39
+ upstream = "*"
40
+
41
  [components.parser]
42
  factory = "parser"
43
  learn_tokens = false
 
184
  initial_rate = 0.00005
185
 
186
  [training.score_weights]
187
+ dep_uas = 0.09
188
+ dep_las = 0.09
189
  dep_las_per_type = null
190
  sents_p = null
191
  sents_r = null
192
  sents_f = 0.0
193
+ lemma_acc = 0.17
194
+ tag_acc = 0.17
195
+ pos_acc = 0.25
196
+ morph_acc = 0.25
197
+ morph_per_feat = null
198
 
199
  [pretraining]
200
 
meta.json CHANGED
The diff for this file is too large to render. See raw diff
 
morphologizer/cfg ADDED
The diff for this file is too large to render. See raw diff
 
morphologizer/model ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bb773a5a59260b1ab93c94b92ea01891a385523a9a448224ca83b04a59d4ee0b
3
+ size 7370749
parser/model CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e7f1a6800277cb2e6b287e106bc78a94f32104e732a88427f4ff8c4de4ffc03c
3
  size 1832547
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2cf7e52432ff66b1d3e54faec21af92a2d2ed6de196e9f13387bbc8c739b6377
3
  size 1832547
tagger/model CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7b61a86cdba64044fb121fa4f72b883cc00b2c542ef269f283aabb8a8b9af6c2
3
  size 8767253
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4f07fba30f9ff1756339a8079674cefe0d4ab289d0e31c3cfef1174515283130
3
  size 8767253
trainable_lemmatizer/model CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:84f29b4ee82bb5c5818e9a57d6cf43d379d685876556e43db7d12788c6ab8e78
3
  size 19262565
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c88bb8d2de5720091d03c8b55f923d5d62f3c9a5955e3aae451f4971c99478bf
3
  size 19262565
transformer/model CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7e0d76d528ff62a1f69608d1c2f801d7e389dc61a6a111dd7cf5d8bd38ca56a8
3
  size 509231398
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8ef171cd8618d934df2e4793afb5446d99029f939b2ceaa75e759383e7a8b1c5
3
  size 509231398
vocab/strings.json CHANGED
The diff for this file is too large to render. See raw diff
 
xx_orv_sigtyp_trf-any-py3-none-any.whl CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:cbf8848c22350053ff0ede89d9fef47dc13434475020d73f32d20ca2fa8e1e91
3
- size 494760653
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:955a19951381def93e98f32c3ea5292eeaba9c5162b9adba70b60697125cc52f
3
+ size 501696219