crodri committed on
Commit
8fe03f2
1 Parent(s): c930a7e

new lemmas test

Browse files
.gitattributes CHANGED
@@ -32,3 +32,8 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
32
  *.zip filter=lfs diff=lfs merge=lfs -text
33
  *.zst filter=lfs diff=lfs merge=lfs -text
34
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
 
 
 
32
  *.zip filter=lfs diff=lfs merge=lfs -text
33
  *.zst filter=lfs diff=lfs merge=lfs -text
34
  *tfevents* filter=lfs diff=lfs merge=lfs -text
35
+ ca_bsc_core_trf-any-py3-none-any.whl filter=lfs diff=lfs merge=lfs -text
36
+ transformer/model filter=lfs diff=lfs merge=lfs -text
37
+ parser/model filter=lfs diff=lfs merge=lfs -text
38
+ tagger/model filter=lfs diff=lfs merge=lfs -text
39
+ morphologizer/model filter=lfs diff=lfs merge=lfs -text
README.md ADDED
@@ -0,0 +1,123 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ tags:
3
+ - spacy
4
+ - token-classification
5
+ language:
6
+ - ca
7
+ license: mit
8
+ model-index:
9
+ - name: ca_bsc_core_trf
10
+ results:
11
+ - task:
12
+ name: NER
13
+ type: token-classification
14
+ metrics:
15
+ - name: NER Precision
16
+ type: precision
17
+ value: 0.8993650794
18
+ - name: NER Recall
19
+ type: recall
20
+ value: 0.8959519292
21
+ - name: NER F Score
22
+ type: f_score
23
+ value: 0.8976552598
24
+ - task:
25
+ name: TAG
26
+ type: token-classification
27
+ metrics:
28
+ - name: TAG (XPOS) Accuracy
29
+ type: accuracy
30
+ value: 0.9751561894
31
+ - task:
32
+ name: POS
33
+ type: token-classification
34
+ metrics:
35
+ - name: POS (UPOS) Accuracy
36
+ type: accuracy
37
+ value: 0.9923557547
38
+ - task:
39
+ name: MORPH
40
+ type: token-classification
41
+ metrics:
42
+ - name: Morph (UFeats) Accuracy
43
+ type: accuracy
44
+ value: 0.9896239098
45
+ - task:
46
+ name: LEMMA
47
+ type: token-classification
48
+ metrics:
49
+ - name: Lemma Accuracy
50
+ type: accuracy
51
+ value: 0.9648130959
52
+ - task:
53
+ name: UNLABELED_DEPENDENCIES
54
+ type: token-classification
55
+ metrics:
56
+ - name: Unlabeled Attachment Score (UAS)
57
+ type: f_score
58
+ value: 0.9525272994
59
+ - task:
60
+ name: LABELED_DEPENDENCIES
61
+ type: token-classification
62
+ metrics:
63
+ - name: Labeled Attachment Score (LAS)
64
+ type: f_score
65
+ value: 0.934621442
66
+ - task:
67
+ name: SENTS
68
+ type: token-classification
69
+ metrics:
70
+ - name: Sentences F-Score
71
+ type: f_score
72
+ value: 0.9973676514
73
+ ---
74
+ testing new lemma dictionaries
75
+
76
+ | Feature | Description |
77
+ | --- | --- |
78
+ | **Name** | `ca_bsc_core_trf` |
79
+ | **Version** | `3.4.5` |
80
+ | **spaCy** | `>=3.4.1,<3.5.0` |
81
+ | **Default Pipeline** | `transformer`, `tagger`, `morphologizer`, `lemmatizer`, `parser`, `ner` |
82
+ | **Components** | `transformer`, `tagger`, `morphologizer`, `lemmatizer`, `parser`, `ner` |
83
+ | **Vectors** | 0 keys, 0 unique vectors (0 dimensions) |
84
+ | **Sources** | n/a |
85
+ | **License** | `mit` |
86
+ | **Author** | n/a |
87
+
88
+ ### Label Scheme
89
+
90
+ <details>
91
+
92
+ <summary>View label scheme (600 labels for 4 components)</summary>
93
+
94
+ | Component | Labels |
95
+ | --- | --- |
96
+ | **`tagger`** | `ADJ`, `ADP`, `ADV`, `AUX`, `CCONJ`, `DET`, `INTJ`, `NOUN`, `NUM`, `PART`, `PRON`, `PROPN`, `PUNCT`, `SCONJ`, `SYM`, `VERB`, `ao0cs0`, `ao0fp0`, `ao0fs0`, `ao0mp0`, `ao0ms0`, `aq0cn0`, `aq0cp0`, `aq0cp00`, `aq0cs0`, `aq0fp0`, `aq0fpp`, `aq0fs0`, `aq0fsp`, `aq0mp0`, `aq0mpp`, `aq0ms0`, `aq0msp`, `cc`, `cs`, `da0cs0`, `da0fp0`, `da0fs0`, `da0mp0`, `da0ms0`, `dd0cp0`, `dd0cs0`, `dd0fp0`, `dd0fs0`, `dd0mp0`, `dd0ms0`, `de0cn0`, `di0cn0`, `di0cp0`, `di0cs0`, `di0fp0`, `di0fs0`, `di0mp0`, `di0ms0`, `dn0cp0`, `dn0cs0`, `dn0fp0`, `dn0fs0`, `dn0mp0`, `dn0ms0`, `dp1cpp`, `dp1fpp`, `dp1fps`, `dp1fsp`, `dp1fss`, `dp1mpp`, `dp1mps`, `dp1msp`, `dp1mss`, `dp2fss`, `dp2mps`, `dp2mss`, `dp3fp0`, `dp3fs0`, `dp3mp0`, `dp3ms0`, `dr0cs0`, `dt0fp0`, `dt0fs0`, `dt0mp0`, `dt0ms0`, `faa`, `fat`, `fc`, `fca`, `fct`, `fd`, `fe`, `fg`, `fh`, `fia`, `fit`, `fp`, `fpa`, `fpt`, `fs`, `fx`, `fz`, `nc00000`, `nccn000`, `nccp000`, `nccs000`, `ncfn000`, `ncfp000`, `ncfs000`, `ncmn000`, `ncmp000`, `ncms000`, `np00000`, `np0000a`, `np0000d`, `np0000l`, `np0000o`, `np0000p`, `p0000000`, `p010p000`, `p010s000`, `p020p000`, `p020s000`, `p0300000`, `pd0cp000`, `pd0cs000`, `pd0fp000`, `pd0fs000`, `pd0mp000`, `pd0ms000`, `pd0ns000`, `pi0cn000`, `pi0cp000`, `pi0cs000`, `pi0fp000`, `pi0fs000`, `pi0mp0`, `pi0mp000`, `pi0ms000`, `pn0cp000`, `pn0cs000`, `pn0fp000`, `pn0fs000`, `pn0mp000`, `pn0ms000`, `pp1cp000`, `pp1cs000`, `pp1csn00`, `pp1cso00`, `pp2cp000`, `pp2cp00p`, `pp2cs000`, `pp2cs00p`, `pp3cn000`, `pp3cno00`, `pp3cp000`, `pp3csa00`, `pp3csd00`, `pp3fp000`, `pp3fpa00`, `pp3fs000`, `pp3fsa00`, `pp3mp000`, `pp3mpa00`, `pp3ms000`, `pp3msa00`, `pp3nn000`, `pr000000`, `pr0cn000`, `pr0cp000`, `pr0cs0`, `pr0cs000`, `pr0ms000`, `pt000000`, `pt0cs000`, `pt0fp000`, `pt0fs000`, `pt0mp000`, `pt0ms000`, `px1fp0p0`, `px1fs0p0`, `px1ms0p0`, `px3cp0p0`, `px3cs0p0`, `px3fp0s0`, `px3fs000`, `px3fs0s0`, `px3mp000`, `px3ms000`, `rg`, `rn`, `spcmp`, `spcms`, `sps00`, `vag0000`, `vaic1p0`, `vaic3p0`, 
`vaic3s0`, `vaif1p0`, `vaif1s0`, `vaif2p0`, `vaif3p0`, `vaif3s0`, `vaii1p0`, `vaii1s0`, `vaii3p0`, `vaii3s0`, `vaip1p0`, `vaip1s0`, `vaip2p0`, `vaip2s0`, `vaip3p0`, `vaip3s0`, `van0000`, `vap00sm`, `vasi100`, `vasi1p0`, `vasi3p0`, `vasi3s0`, `vasp1p0`, `vasp3p0`, `vasp3s0`, `vm00000`, `vmg0000`, `vmic1p0`, `vmic1s0`, `vmic3p0`, `vmic3s0`, `vmif1p0`, `vmif1s0`, `vmif2p0`, `vmif3p0`, `vmif3s0`, `vmii1p0`, `vmii1s0`, `vmii3p0`, `vmii3s0`, `vmip1p0`, `vmip1s0`, `vmip2p0`, `vmip2s0`, `vmip3p0`, `vmip3s0`, `vmis3p0`, `vmis3s0`, `vmm01p0`, `vmm02s0`, `vmm03p0`, `vmm03s0`, `vmn0000`, `vmp0000`, `vmp00fs`, `vmp00mp`, `vmp00ms`, `vmp00pf`, `vmp00pm`, `vmp00sf`, `vmp00sm`, `vmsi1p0`, `vmsi1s0`, `vmsi3p0`, `vmsi3s0`, `vmsp1p0`, `vmsp1s0`, `vmsp2p0`, `vmsp2s0`, `vmsp3p0`, `vmsp3s0`, `vsg0000`, `vsic3p0`, `vsic3s0`, `vsif3p0`, `vsif3s0`, `vsii1p0`, `vsii1s0`, `vsii3p0`, `vsii3s0`, `vsip1p0`, `vsip1s0`, `vsip2s0`, `vsip3p0`, `vsip3s0`, `vsis3p0`, `vsis3s0`, `vsm03p0`, `vsm03s0`, `vsn0000`, `vsp00sm`, `vssi3p0`, `vssi3s0`, `vssp1p0`, `vssp3p0`, `vssp3s0`, `zm`, `zp` |
97
+ | **`morphologizer`** | `Definite=Def\|Gender=Masc\|Number=Sing\|POS=DET\|PronType=Art`, `POS=PROPN`, `POS=PUNCT\|PunctSide=Ini\|PunctType=Brck`, `POS=PUNCT\|PunctSide=Fin\|PunctType=Brck`, `Mood=Ind\|Number=Sing\|POS=AUX\|Person=3\|Tense=Pres\|VerbForm=Fin`, `Gender=Masc\|Number=Sing\|POS=VERB\|Tense=Past\|VerbForm=Part`, `Definite=Def\|Gender=Fem\|Number=Sing\|POS=DET\|PronType=Art`, `Gender=Fem\|Number=Sing\|POS=NOUN`, `POS=ADP`, `NumType=Card\|Number=Plur\|POS=NUM`, `Gender=Masc\|Number=Plur\|POS=NOUN`, `Number=Sing\|POS=ADJ`, `POS=CCONJ`, `Gender=Fem\|Number=Sing\|POS=DET\|PronType=Ind`, `NumForm=Digit\|NumType=Card\|POS=NUM`, `NumForm=Digit\|POS=NOUN`, `Gender=Masc\|Number=Plur\|POS=ADJ`, `POS=PUNCT\|PunctType=Comm`, `POS=AUX\|VerbForm=Inf`, `Case=Acc,Dat\|POS=PRON\|Person=3\|PrepCase=Npr\|PronType=Prs\|Reflex=Yes`, `Definite=Def\|Gender=Masc\|Number=Plur\|POS=DET\|PronType=Art`, `POS=PRON\|PronType=Rel`, `Mood=Ind\|Number=Plur\|POS=VERB\|Person=3\|Tense=Imp\|VerbForm=Fin`, `Gender=Fem\|Number=Sing\|POS=DET\|PronType=Art`, `Gender=Fem\|Number=Sing\|POS=DET\|Person=3\|Poss=Yes\|PronType=Prs`, `Definite=Def\|Gender=Fem\|Number=Plur\|POS=DET\|PronType=Art`, `Gender=Fem\|Number=Plur\|POS=NOUN`, `Gender=Fem\|Number=Plur\|POS=ADJ`, `POS=VERB\|VerbForm=Inf`, `Case=Acc,Dat\|Number=Plur\|POS=PRON\|Person=3\|PronType=Prs`, `Number=Plur\|POS=ADJ`, `POS=PUNCT\|PunctType=Peri`, `Number=Sing\|POS=PRON\|PronType=Rel`, `Gender=Masc\|Number=Sing\|POS=NOUN`, `Mood=Imp\|Number=Sing\|POS=VERB\|Person=2\|VerbForm=Fin`, `Gender=Masc\|Number=Plur\|POS=ADJ\|VerbForm=Part`, `POS=SCONJ`, `Mood=Ind\|Number=Plur\|POS=AUX\|Person=3\|Tense=Pres\|VerbForm=Fin`, `Gender=Masc\|Number=Plur\|POS=VERB\|Tense=Past\|VerbForm=Part`, `Definite=Def\|Number=Sing\|POS=DET\|PronType=Art`, `Gender=Masc\|Number=Sing\|POS=DET\|PronType=Ind`, `Gender=Fem\|Number=Plur\|POS=ADJ\|VerbForm=Part`, `Gender=Masc\|Number=Sing\|POS=DET\|PronType=Dem`, `POS=VERB\|VerbForm=Ger`, `POS=NOUN`, 
`Gender=Fem\|NumType=Card\|Number=Sing\|POS=NUM`, `Gender=Fem\|Number=Sing\|POS=ADJ\|VerbForm=Part`, `Gender=Fem\|NumType=Ord\|Number=Plur\|POS=ADJ`, `POS=PUNCT\|PunctType=Quot`, `Gender=Masc\|Number=Sing\|POS=ADJ`, `Gender=Masc\|Number=Sing\|POS=ADJ\|VerbForm=Part`, `Mood=Ind\|Number=Sing\|POS=VERB\|Person=3\|Tense=Pres\|VerbForm=Fin`, `Gender=Fem\|Number=Sing\|POS=DET\|PronType=Dem`, `POS=ADV\|Polarity=Neg`, `POS=ADV`, `Number=Sing\|POS=PRON\|PronType=Dem`, `Number=Sing\|POS=NOUN`, `Mood=Ind\|Number=Plur\|POS=VERB\|Person=3\|Tense=Pres\|VerbForm=Fin`, `Number=Plur\|POS=NOUN`, `Mood=Sub\|Number=Plur\|POS=VERB\|Person=3\|Tense=Imp\|VerbForm=Fin`, `Gender=Fem\|Number=Sing\|POS=ADJ`, `Mood=Sub\|Number=Sing\|POS=VERB\|Person=1\|Tense=Pres\|VerbForm=Fin`, `Gender=Masc\|Number=Sing\|POS=PRON\|PronType=Tot`, `Case=Loc\|POS=PRON\|Person=3\|PronType=Prs`, `Gender=Fem\|NumType=Ord\|Number=Sing\|POS=ADJ`, `Degree=Cmp\|POS=ADV`, `Gender=Fem\|Number=Plur\|POS=DET\|PronType=Art`, `Gender=Fem\|Number=Plur\|POS=DET\|Person=3\|Poss=Yes\|PronType=Prs`, `Mood=Ind\|Number=Sing\|POS=VERB\|Person=3\|Tense=Fut\|VerbForm=Fin`, `Gender=Masc\|NumType=Ord\|Number=Sing\|POS=ADJ`, `Mood=Ind\|Number=Sing\|POS=AUX\|Person=3\|Tense=Fut\|VerbForm=Fin`, `NumType=Card\|POS=NUM`, `Mood=Ind\|Number=Plur\|POS=VERB\|Person=3\|Tense=Fut\|VerbForm=Fin`, `Number=Sing\|POS=PRON\|PronType=Ind`, `Gender=Masc\|Number=Sing\|POS=DET\|PronType=Art`, `Number=Plur\|POS=DET\|PronType=Ind`, `Mood=Sub\|Number=Plur\|POS=VERB\|Person=3\|Tense=Pres\|VerbForm=Fin`, `Gender=Masc\|Number=Plur\|POS=DET\|PronType=Dem`, `Mood=Ind\|Number=Plur\|POS=AUX\|Person=3\|Tense=Fut\|VerbForm=Fin`, `Gender=Masc\|NumType=Card\|Number=Sing\|POS=NUM`, `Mood=Sub\|Number=Plur\|POS=AUX\|Person=3\|Tense=Pres\|VerbForm=Fin`, `Case=Acc\|Gender=Fem\|Number=Sing\|POS=PRON\|Person=3\|PronType=Prs`, `Number=Sing\|POS=DET\|PronType=Ind`, `POS=PUNCT`, `Number=Sing\|POS=DET\|PronType=Rel`, `Case=Gen\|POS=PRON\|Person=3\|PronType=Prs`, 
`Gender=Fem\|NumType=Card\|Number=Plur\|POS=NUM`, `Mood=Ind\|Number=Plur\|POS=VERB\|Person=1\|Tense=Pres\|VerbForm=Fin`, `POS=DET\|PronType=Ind`, `Case=Acc\|Gender=Neut\|Number=Sing\|POS=PRON\|Person=3\|PronType=Prs`, `Case=Acc,Dat\|Number=Plur\|POS=PRON\|Person=1\|PronType=Prs`, `Degree=Cmp\|Number=Sing\|POS=ADJ`, `Gender=Masc\|Number=Plur\|POS=PRON\|PronType=Ind`, `Gender=Fem\|Number=Plur\|POS=DET\|PronType=Dem`, `Gender=Masc\|Number=Plur\|POS=DET\|PronType=Art`, `Gender=Masc\|Number=Plur\|POS=DET\|Person=3\|Poss=Yes\|PronType=Prs`, `Case=Acc\|Gender=Fem,Masc\|Number=Sing\|POS=PRON\|Person=3\|PronType=Prs`, `Gender=Fem\|Number=Sing\|POS=VERB\|Tense=Past\|VerbForm=Part`, `Gender=Masc\|Number=Sing\|POS=PRON\|PronType=Ind`, `Gender=Fem\|Number=Plur\|POS=PRON\|PronType=Ind`, `Mood=Sub\|Number=Sing\|POS=VERB\|Person=3\|Tense=Pres\|VerbForm=Fin`, `Number=Plur\|POS=PRON\|PronType=Rel`, `Gender=Masc\|Number=Plur\|POS=DET\|PronType=Int`, `Mood=Ind\|Number=Plur\|POS=AUX\|Person=3\|Tense=Imp\|VerbForm=Fin`, `AdvType=Tim\|POS=NOUN`, `Gender=Masc\|Number=Plur\|POS=DET\|PronType=Ind`, `Gender=Fem\|Number=Plur\|POS=DET\|PronType=Ind`, `Gender=Masc\|Number=Sing\|POS=DET\|PronType=Int`, `Mood=Cnd\|Number=Sing\|POS=AUX\|Person=3\|VerbForm=Fin`, `Mood=Ind\|Number=Sing\|POS=VERB\|Person=3\|Tense=Imp\|VerbForm=Fin`, `Number=Sing\|POS=DET\|PronType=Art`, `Gender=Masc\|Number=Sing\|POS=DET\|Person=3\|Poss=Yes\|PronType=Prs`, `Case=Acc\|Gender=Masc\|Number=Sing\|POS=PRON\|Person=3\|PronType=Prs`, `Gender=Masc\|Number=Sing\|POS=PRON\|PronType=Int`, `POS=PUNCT\|PunctType=Semi`, `Mood=Cnd\|Number=Plur\|POS=AUX\|Person=3\|VerbForm=Fin`, `Case=Dat\|Number=Sing\|POS=PRON\|Person=3\|PronType=Prs`, `Gender=Masc\|NumType=Card\|Number=Plur\|POS=NUM`, `Mood=Ind\|Number=Sing\|POS=AUX\|Person=3\|Tense=Imp\|VerbForm=Fin`, `Gender=Fem\|Number=Sing\|POS=PRON\|PronType=Ind`, `Mood=Sub\|Number=Sing\|POS=AUX\|Person=3\|Tense=Imp\|VerbForm=Fin`, `NumForm=Digit\|POS=SYM`, 
`Gender=Masc\|Number=Sing\|POS=AUX\|Tense=Past\|VerbForm=Part`, `Gender=Fem\|Number=Sing\|POS=PRON\|PronType=Int`, `Gender=Fem\|Number=Sing\|POS=DET\|PronType=Int`, `POS=PRON\|PronType=Int`, `Gender=Fem\|Number=Plur\|POS=DET\|PronType=Int`, `Mood=Cnd\|Number=Sing\|POS=VERB\|Person=3\|VerbForm=Fin`, `Mood=Cnd\|Number=Plur\|POS=VERB\|Person=3\|VerbForm=Fin`, `POS=PART`, `Gender=Fem\|Number=Sing\|POS=PRON\|PronType=Dem`, `Gender=Masc\|Number=Sing\|POS=DET\|PronType=Tot`, `Gender=Masc\|Number=Plur\|POS=PRON\|PronType=Dem`, `POS=ADJ`, `Gender=Masc\|Number=Plur\|POS=PRON\|Person=3\|PronType=Prs`, `Degree=Cmp\|Number=Plur\|POS=ADJ`, `POS=PUNCT\|PunctType=Dash`, `Mood=Sub\|Number=Sing\|POS=AUX\|Person=3\|Tense=Pres\|VerbForm=Fin`, `Case=Acc\|Gender=Fem\|Number=Plur\|POS=PRON\|Person=3\|PronType=Prs`, `Mood=Sub\|Number=Sing\|POS=VERB\|Person=3\|Tense=Imp\|VerbForm=Fin`, `Gender=Fem\|Number=Plur\|POS=VERB\|Tense=Past\|VerbForm=Part`, `Gender=Fem\|Number=Sing\|POS=PRON\|Person=3\|PronType=Prs`, `Gender=Masc\|POS=NOUN`, `Mood=Ind\|Number=Sing\|POS=VERB\|Person=3\|Tense=Past\|VerbForm=Fin`, `Gender=Fem\|Number=Plur\|POS=PRON\|PronType=Int`, `Gender=Masc\|NumType=Ord\|Number=Plur\|POS=ADJ`, `Mood=Ind\|Number=Plur\|POS=VERB\|Person=1\|Tense=Fut\|VerbForm=Fin`, `POS=PUNCT\|PunctType=Colo`, `Gender=Masc\|NumType=Card\|POS=NUM`, `Gender=Masc\|Number=Sing\|POS=PRON\|Person=3\|PronType=Prs`, `Number=Sing\|POS=PRON\|PronType=Int`, `Mood=Ind\|Number=Plur\|POS=AUX\|Person=1\|Tense=Fut\|VerbForm=Fin`, `Mood=Imp\|Number=Sing\|POS=VERB\|Person=3\|VerbForm=Fin`, `Gender=Fem\|Number=Sing\|Number[psor]=Plur\|POS=DET\|Person=1\|Poss=Yes\|PronType=Prs`, `Gender=Masc\|Number=Sing\|Number[psor]=Plur\|POS=DET\|Person=1\|Poss=Yes\|PronType=Prs`, `POS=AUX\|VerbForm=Ger`, `Gender=Fem\|Number=Plur\|POS=PRON\|Person=3\|PronType=Prs`, `Mood=Imp\|Number=Sing\|POS=AUX\|Person=3\|VerbForm=Fin`, `Number=Plur\|POS=PRON\|PronType=Ind`, `Gender=Masc\|Number=Sing\|POS=PRON\|PronType=Dem`, 
`Case=Acc,Dat\|Number=Sing\|POS=PRON\|Person=2\|Polite=Infm\|PrepCase=Npr\|PronType=Prs`, `Gender=Masc\|Number=Plur\|POS=PRON\|PronType=Int`, `Mood=Ind\|Number=Plur\|POS=AUX\|Person=1\|Tense=Pres\|VerbForm=Fin`, `NumForm=Digit\|NumType=Frac\|POS=NUM`, `Gender=Fem\|Number=Plur\|POS=PRON\|PronType=Dem`, `Gender=Fem\|POS=NOUN`, `Case=Acc,Dat\|Number=Sing\|POS=PRON\|Person=1\|PrepCase=Npr\|PronType=Prs`, `Mood=Sub\|Number=Plur\|POS=VERB\|Person=2\|Tense=Pres\|VerbForm=Fin`, `Mood=Ind\|Number=Plur\|POS=AUX\|Person=2\|Tense=Fut\|VerbForm=Fin`, `Mood=Sub\|Number=Plur\|POS=AUX\|Person=1\|Tense=Pres\|VerbForm=Fin`, `Mood=Sub\|Number=Plur\|POS=AUX\|Person=3\|Tense=Imp\|VerbForm=Fin`, `Number=Plur\|POS=PRON\|Person=1\|PronType=Prs`, `Mood=Ind\|Number=Sing\|POS=VERB\|Person=1\|Tense=Pres\|VerbForm=Fin`, `Case=Nom\|Number=Sing\|POS=PRON\|Person=2\|Polite=Infm\|PronType=Prs`, `POS=X`, `Mood=Cnd\|Number=Plur\|POS=AUX\|Person=1\|VerbForm=Fin`, `Number=Sing\|POS=DET\|PronType=Dem`, `Mood=Ind\|Number=Sing\|POS=VERB\|Person=1\|Tense=Fut\|VerbForm=Fin`, `Mood=Ind\|Number=Sing\|POS=AUX\|Person=1\|Tense=Pres\|VerbForm=Fin`, `POS=DET\|PronType=Art`, `Gender=Masc\|Number=Sing\|POS=PRON\|Person=3\|Poss=Yes\|PronType=Prs`, `NumType=Ord\|Number=Sing\|POS=ADJ`, `Number=Plur\|Number[psor]=Plur\|POS=DET\|Person=1\|Poss=Yes\|PronType=Prs`, `Number=Plur\|POS=PRON\|PronType=Dem`, `Mood=Imp\|Number=Plur\|POS=VERB\|Person=1\|VerbForm=Fin`, `POS=PRON\|PronType=Ind`, `POS=SYM`, `Mood=Ind\|Number=Sing\|POS=VERB\|Person=2\|Tense=Pres\|VerbForm=Fin`, `Mood=Imp\|Number=Plur\|POS=VERB\|Person=3\|VerbForm=Fin`, `POS=VERB\|VerbForm=Fin`, `Case=Nom\|Number=Sing\|POS=PRON\|Person=1\|PronType=Prs`, `Case=Acc\|Number=Sing\|POS=PRON\|Person=1\|PrepCase=Pre\|PronType=Prs`, `Mood=Ind\|Number=Sing\|POS=AUX\|Person=2\|Tense=Pres\|VerbForm=Fin`, `NumForm=Digit\|NumType=Frac\|POS=SYM`, `NumType=Card\|Number=Sing\|POS=NUM`, `POS=PUNCT\|PunctSide=Ini\|PunctType=Qest`, `POS=PUNCT\|PunctSide=Fin\|PunctType=Qest`, 
`NumForm=Digit\|NumType=Ord\|POS=ADJ`, `Foreign=Yes\|POS=PRON\|PronType=Int`, `Foreign=Yes\|Mood=Ind\|POS=VERB\|VerbForm=Fin`, `Foreign=Yes\|POS=ADP`, `Gender=Masc\|Number=Sing\|POS=PROPN`, `Case=Acc\|POS=PRON\|Person=3\|PrepCase=Pre\|PronType=Prs\|Reflex=Yes`, `Mood=Ind\|Number=Plur\|POS=VERB\|Person=2\|Tense=Pres\|VerbForm=Fin`, `POS=PUNCT\|PunctSide=Ini\|PunctType=Excl`, `POS=PUNCT\|PunctSide=Fin\|PunctType=Excl`, `Gender=Masc\|Number=Sing\|Number[psor]=Sing\|POS=DET\|Person=1\|Poss=Yes\|PronType=Prs`, `Mood=Cnd\|Number=Sing\|POS=VERB\|Person=1\|VerbForm=Fin`, `Mood=Ind\|Number=Sing\|POS=VERB\|Person=1\|Tense=Imp\|VerbForm=Fin`, `Gender=Masc\|Number=Plur\|POS=PRON\|Person=3\|Poss=Yes\|PronType=Prs`, `POS=NUM`, `Mood=Imp\|Number=Plur\|POS=AUX\|Person=3\|VerbForm=Fin`, `Case=Nom\|POS=PRON\|Person=3\|PronType=Prs`, `Mood=Cnd\|Number=Sing\|POS=AUX\|Person=1\|VerbForm=Fin`, `Number=Plur\|POS=PRON\|Person=2\|Polite=Form\|PronType=Prs`, `Mood=Sub\|POS=AUX\|Person=1\|Tense=Imp\|VerbForm=Fin`, `POS=PUNCT\|PunctSide=Ini\|PunctType=Comm`, `POS=PUNCT\|PunctSide=Fin\|PunctType=Comm`, `Number=Plur\|POS=PRON\|Person=2\|PronType=Prs`, `Mood=Ind\|Number=Plur\|POS=AUX\|Person=2\|Tense=Pres\|VerbForm=Fin`, `Case=Acc,Dat\|Number=Plur\|POS=PRON\|Person=2\|PronType=Prs`, `Mood=Cnd\|Number=Plur\|POS=VERB\|Person=1\|VerbForm=Fin`, `Mood=Ind\|Number=Plur\|POS=AUX\|Person=1\|Tense=Imp\|VerbForm=Fin`, `Gender=Masc\|Number=Plur\|Number[psor]=Sing\|POS=DET\|Person=1\|Poss=Yes\|PronType=Prs`, `Mood=Ind\|Number=Plur\|POS=VERB\|Person=1\|Tense=Imp\|VerbForm=Fin`, `Mood=Sub\|Number=Plur\|POS=VERB\|Person=1\|Tense=Pres\|VerbForm=Fin`, `Definite=Ind\|Gender=Masc\|Number=Sing\|POS=DET\|PronType=Art`, `Number=Sing\|POS=PRON\|Person=2\|Polite=Form\|PronType=Prs`, `Gender=Masc\|Number=Sing\|Number[psor]=Sing\|POS=DET\|Person=2\|Poss=Yes\|PronType=Prs`, `POS=VERB\|Tense=Past\|VerbForm=Part`, `Mood=Ind\|Number=Sing\|POS=AUX\|Person=3\|Tense=Past\|VerbForm=Fin`, `Foreign=Yes\|POS=NOUN`, 
`Definite=Def\|Foreign=Yes\|Gender=Masc\|Number=Sing\|POS=DET\|PronType=Art`, `Foreign=Yes\|POS=VERB`, `Foreign=Yes\|POS=ADJ`, `Foreign=Yes\|POS=DET`, `Foreign=Yes\|POS=ADV`, `Definite=Ind\|Gender=Fem\|Number=Plur\|POS=DET\|PronType=Art`, `POS=INTJ`, `Mood=Ind\|Number=Sing\|POS=AUX\|Person=1\|Tense=Imp\|VerbForm=Fin`, `Mood=Sub\|Number=Sing\|POS=VERB\|Person=2\|Tense=Pres\|VerbForm=Fin`, `Case=Acc\|POS=PRON\|Person=3\|PronType=Prs\|Reflex=Yes`, `AdvType=Tim\|POS=SYM`, `Gender=Fem\|Number=Sing\|POS=PRON\|Person=3\|Poss=Yes\|PronType=Prs`, `Definite=Ind\|Gender=Fem\|Number=Sing\|POS=DET\|PronType=Art`, `AdvType=Tim\|Degree=Cmp\|POS=ADV`, `Case=Acc\|Number=Sing\|POS=PRON\|Person=2\|Polite=Infm\|PrepCase=Pre\|PronType=Prs`, `Mood=Sub\|Number=Plur\|POS=VERB\|Person=1\|Tense=Imp\|VerbForm=Fin`, `Degree=Cmp\|POS=ADJ`, `POS=DET`, `Gender=Masc\|Number=Sing\|Number[psor]=Plur\|POS=PRON\|Person=1\|Poss=Yes\|PronType=Prs`, `Number=Plur\|Number[psor]=Plur\|POS=PRON\|Person=1\|Poss=Yes\|PronType=Prs`, `Mood=Ind\|Number=Plur\|POS=VERB\|Person=2\|Tense=Fut\|VerbForm=Fin`, `Mood=Sub\|Number=Sing\|POS=AUX\|Person=1\|Tense=Pres\|VerbForm=Fin`, `Gender=Masc\|POS=SYM`, `Mood=Ind\|Number=Plur\|POS=VERB\|Person=3\|Tense=Past\|VerbForm=Fin`, `Mood=Sub\|Number=Sing\|POS=VERB\|Person=1\|Tense=Imp\|VerbForm=Fin`, `POS=DET\|PronType=Rel`, `Gender=Fem\|NumType=Card\|POS=NUM`, `Mood=Ind\|Number=Plur\|POS=AUX\|Person=3\|Tense=Past\|VerbForm=Fin`, `Mood=Sub\|Number=Plur\|POS=AUX\|Person=1\|Tense=Imp\|VerbForm=Fin`, `POS=AUX\|Tense=Past\|VerbForm=Part`, `Foreign=Yes\|Mood=Ind\|Number=Sing\|POS=AUX\|Person=3\|Tense=Pres\|VerbForm=Fin`, `Foreign=Yes\|Gender=Masc\|Number=Sing\|POS=PRON\|Person=3\|PronType=Prs`, `Foreign=Yes\|POS=SCONJ`, `Foreign=Yes\|Gender=Fem\|Number=Sing\|POS=DET\|PronType=Art`, `Mood=Ind\|Number=Sing\|POS=AUX\|Person=1\|Tense=Fut\|VerbForm=Fin`, `Number=Sing\|POS=DET\|Person=3\|Poss=Yes\|PronType=Prs`, 
`Gender=Fem\|Number=Sing\|Number[psor]=Sing\|POS=DET\|Person=2\|Poss=Yes\|PronType=Prs`, `Gender=Fem\|Number=Sing\|Number[psor]=Sing\|POS=PRON\|Person=3\|Poss=Yes\|PronType=Prs`, `Gender=Masc\|Number=Plur\|Number[psor]=Sing\|POS=DET\|Person=2\|Poss=Yes\|PronType=Prs`, `Definite=Ind\|Number=Sing\|POS=DET\|PronType=Art`, `Gender=Fem\|Number=Plur\|POS=PRON\|Person=3\|Poss=Yes\|PronType=Prs`, `Gender=Fem\|Number=Sing\|POS=PROPN`, `Number=Plur\|POS=DET\|PronType=Dem`, `Gender=Masc\|Number=Sing\|POS=PRON\|PronType=Rel` |
98
+ | **`parser`** | `ROOT`, `acl`, `advcl`, `advmod`, `amod`, `appos`, `aux`, `case`, `cc`, `ccomp`, `compound`, `conj`, `cop`, `csubj`, `dep`, `det`, `expl:pass`, `fixed`, `flat`, `iobj`, `mark`, `nmod`, `nsubj`, `nummod`, `obj`, `obl`, `parataxis`, `punct`, `xcomp` |
99
+ | **`ner`** | `LOC`, `MISC`, `ORG`, `PER` |
100
+
101
+ </details>
102
+
103
+ ### Accuracy
104
+
105
+ | Type | Score |
106
+ | --- | --- |
107
+ | `TAG_ACC` | 97.52 |
108
+ | `POS_ACC` | 99.24 |
109
+ | `MORPH_ACC` | 98.96 |
110
+ | `LEMMA_ACC` | 96.48 |
111
+ | `DEP_UAS` | 95.25 |
112
+ | `DEP_LAS` | 93.46 |
113
+ | `SENTS_P` | 99.71 |
114
+ | `SENTS_R` | 99.77 |
115
+ | `SENTS_F` | 99.74 |
116
+ | `ENTS_F` | 89.77 |
117
+ | `ENTS_P` | 89.94 |
118
+ | `ENTS_R` | 89.60 |
119
+ | `TRANSFORMER_LOSS` | 13983585.54 |
120
+ | `TAGGER_LOSS` | 637551.95 |
121
+ | `MORPHOLOGIZER_LOSS` | 349270.61 |
122
+ | `PARSER_LOSS` | 3321140.98 |
123
+ | `NER_LOSS` | 89131.89 |
ca_bsc_core_trf-any-py3-none-any.whl ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7acad17dbc0010dad3bccc233f991432a927394f93639c26d44c89bc1af39a31
3
+ size 1312635263
config.cfg ADDED
@@ -0,0 +1,227 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ [paths]
2
+ train = "corpus/ANCORA_ca_UD11/train.spacy"
3
+ dev = "corpus/ANCORA_ca_UD11/dev.spacy"
4
+ vectors = null
5
+ init_tok2vec = null
6
+
7
+ [system]
8
+ gpu_allocator = "pytorch"
9
+ seed = 0
10
+
11
+ [nlp]
12
+ lang = "ca"
13
+ pipeline = ["transformer","tagger","morphologizer","lemmatizer","parser","ner"]
14
+ batch_size = 16
15
+ disabled = []
16
+ before_creation = null
17
+ after_creation = null
18
+ after_pipeline_creation = null
19
+ tokenizer = {"@tokenizers":"spacy.Tokenizer.v1"}
20
+
21
+ [components]
22
+
23
+ [components.lemmatizer]
24
+ factory = "lemmatizer"
25
+ mode = "rule"
26
+ model = null
27
+ overwrite = false
28
+ scorer = {"@scorers":"spacy.lemmatizer_scorer.v1"}
29
+
30
+ [components.morphologizer]
31
+ factory = "morphologizer"
32
+ extend = false
33
+ overwrite = true
34
+ scorer = {"@scorers":"spacy.morphologizer_scorer.v1"}
35
+
36
+ [components.morphologizer.model]
37
+ @architectures = "spacy.Tagger.v2"
38
+ nO = null
39
+ normalize = false
40
+
41
+ [components.morphologizer.model.tok2vec]
42
+ @architectures = "spacy-transformers.TransformerListener.v1"
43
+ grad_factor = 1.0
44
+ pooling = {"@layers":"reduce_mean.v1"}
45
+ upstream = "*"
46
+
47
+ [components.ner]
48
+ factory = "ner"
49
+ incorrect_spans_key = null
50
+ moves = null
51
+ scorer = {"@scorers":"spacy.ner_scorer.v1"}
52
+ update_with_oracle_cut_size = 100
53
+
54
+ [components.ner.model]
55
+ @architectures = "spacy.TransitionBasedParser.v2"
56
+ state_type = "ner"
57
+ extra_state_tokens = false
58
+ hidden_width = 64
59
+ maxout_pieces = 2
60
+ use_upper = false
61
+ nO = null
62
+
63
+ [components.ner.model.tok2vec]
64
+ @architectures = "spacy-transformers.TransformerListener.v1"
65
+ grad_factor = 1.0
66
+ pooling = {"@layers":"reduce_mean.v1"}
67
+ upstream = "*"
68
+
69
+ [components.parser]
70
+ factory = "parser"
71
+ learn_tokens = false
72
+ min_action_freq = 30
73
+ moves = null
74
+ scorer = {"@scorers":"spacy.parser_scorer.v1"}
75
+ update_with_oracle_cut_size = 100
76
+
77
+ [components.parser.model]
78
+ @architectures = "spacy.TransitionBasedParser.v2"
79
+ state_type = "parser"
80
+ extra_state_tokens = false
81
+ hidden_width = 128
82
+ maxout_pieces = 3
83
+ use_upper = false
84
+ nO = null
85
+
86
+ [components.parser.model.tok2vec]
87
+ @architectures = "spacy-transformers.TransformerListener.v1"
88
+ grad_factor = 1.0
89
+ pooling = {"@layers":"reduce_mean.v1"}
90
+ upstream = "*"
91
+
92
+ [components.tagger]
93
+ factory = "tagger"
94
+ neg_prefix = "!"
95
+ overwrite = false
96
+ scorer = {"@scorers":"spacy.tagger_scorer.v1"}
97
+
98
+ [components.tagger.model]
99
+ @architectures = "spacy.Tagger.v2"
100
+ nO = null
101
+ normalize = false
102
+
103
+ [components.tagger.model.tok2vec]
104
+ @architectures = "spacy-transformers.TransformerListener.v1"
105
+ grad_factor = 1.0
106
+ pooling = {"@layers":"reduce_mean.v1"}
107
+ upstream = "*"
108
+
109
+ [components.transformer]
110
+ factory = "transformer"
111
+ max_batch_items = 4096
112
+ set_extra_annotations = {"@annotation_setters":"spacy-transformers.null_annotation_setter.v1"}
113
+
114
+ [components.transformer.model]
115
+ @architectures = "spacy-transformers.TransformerModel.v3"
116
+ name = "./huggingfaces/roberta-large-ca-v2"
117
+ mixed_precision = false
118
+
119
+ [components.transformer.model.get_spans]
120
+ @span_getters = "spacy-transformers.strided_spans.v1"
121
+ window = 128
122
+ stride = 96
123
+
124
+ [components.transformer.model.grad_scaler_config]
125
+
126
+ [components.transformer.model.tokenizer_config]
127
+ use_fast = true
128
+
129
+ [components.transformer.model.transformer_config]
130
+
131
+ [corpora]
132
+
133
+ [corpora.dev]
134
+ @readers = "spacy.Corpus.v1"
135
+ path = ${paths.dev}
136
+ max_length = 0
137
+ gold_preproc = false
138
+ limit = 0
139
+ augmenter = null
140
+
141
+ [corpora.train]
142
+ @readers = "spacy.Corpus.v1"
143
+ path = ${paths.train}
144
+ max_length = 0
145
+ gold_preproc = false
146
+ limit = 0
147
+ augmenter = null
148
+
149
+ [training]
150
+ accumulate_gradient = 3
151
+ dev_corpus = "corpora.dev"
152
+ train_corpus = "corpora.train"
153
+ seed = ${system.seed}
154
+ gpu_allocator = ${system.gpu_allocator}
155
+ dropout = 0.1
156
+ patience = 1600
157
+ max_epochs = 0
158
+ max_steps = 35000
159
+ eval_frequency = 800
160
+ frozen_components = []
161
+ annotating_components = []
162
+ before_to_disk = null
163
+
164
+ [training.batcher]
165
+ @batchers = "spacy.batch_by_padded.v1"
166
+ discard_oversize = true
167
+ size = 1000
168
+ buffer = 512
169
+ get_length = null
170
+
171
+ [training.logger]
172
+ @loggers = "spacy.ConsoleLogger.v1"
173
+ progress_bar = false
174
+
175
+ [training.optimizer]
176
+ @optimizers = "Adam.v1"
177
+ beta1 = 0.9
178
+ beta2 = 0.999
179
+ L2_is_weight_decay = true
180
+ L2 = 0.01
181
+ grad_clip = 1.0
182
+ use_averages = false
183
+ eps = 0.00000001
184
+
185
+ [training.optimizer.learn_rate]
186
+ @schedules = "warmup_linear.v1"
187
+ warmup_steps = 250
188
+ total_steps = 20000
189
+ initial_rate = 0.00005
190
+
191
+ [training.score_weights]
192
+ tag_acc = 0.2
193
+ pos_acc = 0.1
194
+ morph_acc = 0.1
195
+ morph_per_feat = null
196
+ lemma_acc = 0.2
197
+ dep_uas = 0.1
198
+ dep_las = 0.1
199
+ dep_las_per_type = null
200
+ sents_p = null
201
+ sents_r = null
202
+ sents_f = 0.0
203
+ ents_f = 0.2
204
+ ents_p = 0.0
205
+ ents_r = 0.0
206
+ ents_per_type = null
207
+
208
+ [pretraining]
209
+
210
+ [initialize]
211
+ vectors = ${paths.vectors}
212
+ init_tok2vec = ${paths.init_tok2vec}
213
+ vocab_data = null
214
+ lookups = null
215
+ before_init = null
216
+ after_init = null
217
+
218
+ [initialize.components]
219
+
220
+ [initialize.components.lemmatizer]
221
+
222
+ [initialize.components.lemmatizer.lookups]
223
+ @misc = "spacy.LookupsDataLoader.v1"
224
+ lang = ${nlp.lang}
225
+ tables = ["lemma_exc","lemma_index","lemma_lookup","lemma_rules"]
226
+
227
+ [initialize.tokenizer]
lemmatizer/lookups/lookups.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1894dc367bcd14eb7cd791f3eb1ee2f4474736c6dd85907c039661ee952e89f4
3
+ size 25931659
meta.json ADDED
@@ -0,0 +1,961 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "lang":"ca",
3
+ "name":"bsc_core_trf",
4
+ "version":"3.4.5",
5
+ "description":"testing new lemma dictionaries",
6
+ "author":"",
7
+ "email":"",
8
+ "url":"",
9
+ "license":"mit",
10
+ "spacy_version":">=3.4.1,<3.5.0",
11
+ "spacy_git_version":"Unknown",
12
+ "vectors":{
13
+ "width":0,
14
+ "vectors":0,
15
+ "keys":0,
16
+ "name":null
17
+ },
18
+ "labels":{
19
+ "transformer":[
20
+
21
+ ],
22
+ "tagger":[
23
+ "ADJ",
24
+ "ADP",
25
+ "ADV",
26
+ "AUX",
27
+ "CCONJ",
28
+ "DET",
29
+ "INTJ",
30
+ "NOUN",
31
+ "NUM",
32
+ "PART",
33
+ "PRON",
34
+ "PROPN",
35
+ "PUNCT",
36
+ "SCONJ",
37
+ "SYM",
38
+ "VERB",
39
+ "ao0cs0",
40
+ "ao0fp0",
41
+ "ao0fs0",
42
+ "ao0mp0",
43
+ "ao0ms0",
44
+ "aq0cn0",
45
+ "aq0cp0",
46
+ "aq0cp00",
47
+ "aq0cs0",
48
+ "aq0fp0",
49
+ "aq0fpp",
50
+ "aq0fs0",
51
+ "aq0fsp",
52
+ "aq0mp0",
53
+ "aq0mpp",
54
+ "aq0ms0",
55
+ "aq0msp",
56
+ "cc",
57
+ "cs",
58
+ "da0cs0",
59
+ "da0fp0",
60
+ "da0fs0",
61
+ "da0mp0",
62
+ "da0ms0",
63
+ "dd0cp0",
64
+ "dd0cs0",
65
+ "dd0fp0",
66
+ "dd0fs0",
67
+ "dd0mp0",
68
+ "dd0ms0",
69
+ "de0cn0",
70
+ "di0cn0",
71
+ "di0cp0",
72
+ "di0cs0",
73
+ "di0fp0",
74
+ "di0fs0",
75
+ "di0mp0",
76
+ "di0ms0",
77
+ "dn0cp0",
78
+ "dn0cs0",
79
+ "dn0fp0",
80
+ "dn0fs0",
81
+ "dn0mp0",
82
+ "dn0ms0",
83
+ "dp1cpp",
84
+ "dp1fpp",
85
+ "dp1fps",
86
+ "dp1fsp",
87
+ "dp1fss",
88
+ "dp1mpp",
89
+ "dp1mps",
90
+ "dp1msp",
91
+ "dp1mss",
92
+ "dp2fss",
93
+ "dp2mps",
94
+ "dp2mss",
95
+ "dp3fp0",
96
+ "dp3fs0",
97
+ "dp3mp0",
98
+ "dp3ms0",
99
+ "dr0cs0",
100
+ "dt0fp0",
101
+ "dt0fs0",
102
+ "dt0mp0",
103
+ "dt0ms0",
104
+ "faa",
105
+ "fat",
106
+ "fc",
107
+ "fca",
108
+ "fct",
109
+ "fd",
110
+ "fe",
111
+ "fg",
112
+ "fh",
113
+ "fia",
114
+ "fit",
115
+ "fp",
116
+ "fpa",
117
+ "fpt",
118
+ "fs",
119
+ "fx",
120
+ "fz",
121
+ "nc00000",
122
+ "nccn000",
123
+ "nccp000",
124
+ "nccs000",
125
+ "ncfn000",
126
+ "ncfp000",
127
+ "ncfs000",
128
+ "ncmn000",
129
+ "ncmp000",
130
+ "ncms000",
131
+ "np00000",
132
+ "np0000a",
133
+ "np0000d",
134
+ "np0000l",
135
+ "np0000o",
136
+ "np0000p",
137
+ "p0000000",
138
+ "p010p000",
139
+ "p010s000",
140
+ "p020p000",
141
+ "p020s000",
142
+ "p0300000",
143
+ "pd0cp000",
144
+ "pd0cs000",
145
+ "pd0fp000",
146
+ "pd0fs000",
147
+ "pd0mp000",
148
+ "pd0ms000",
149
+ "pd0ns000",
150
+ "pi0cn000",
151
+ "pi0cp000",
152
+ "pi0cs000",
153
+ "pi0fp000",
154
+ "pi0fs000",
155
+ "pi0mp0",
156
+ "pi0mp000",
157
+ "pi0ms000",
158
+ "pn0cp000",
159
+ "pn0cs000",
160
+ "pn0fp000",
161
+ "pn0fs000",
162
+ "pn0mp000",
163
+ "pn0ms000",
164
+ "pp1cp000",
165
+ "pp1cs000",
166
+ "pp1csn00",
167
+ "pp1cso00",
168
+ "pp2cp000",
169
+ "pp2cp00p",
170
+ "pp2cs000",
171
+ "pp2cs00p",
172
+ "pp3cn000",
173
+ "pp3cno00",
174
+ "pp3cp000",
175
+ "pp3csa00",
176
+ "pp3csd00",
177
+ "pp3fp000",
178
+ "pp3fpa00",
179
+ "pp3fs000",
180
+ "pp3fsa00",
181
+ "pp3mp000",
182
+ "pp3mpa00",
183
+ "pp3ms000",
184
+ "pp3msa00",
185
+ "pp3nn000",
186
+ "pr000000",
187
+ "pr0cn000",
188
+ "pr0cp000",
189
+ "pr0cs0",
190
+ "pr0cs000",
191
+ "pr0ms000",
192
+ "pt000000",
193
+ "pt0cs000",
194
+ "pt0fp000",
195
+ "pt0fs000",
196
+ "pt0mp000",
197
+ "pt0ms000",
198
+ "px1fp0p0",
199
+ "px1fs0p0",
200
+ "px1ms0p0",
201
+ "px3cp0p0",
202
+ "px3cs0p0",
203
+ "px3fp0s0",
204
+ "px3fs000",
205
+ "px3fs0s0",
206
+ "px3mp000",
207
+ "px3ms000",
208
+ "rg",
209
+ "rn",
210
+ "spcmp",
211
+ "spcms",
212
+ "sps00",
213
+ "vag0000",
214
+ "vaic1p0",
215
+ "vaic3p0",
216
+ "vaic3s0",
217
+ "vaif1p0",
218
+ "vaif1s0",
219
+ "vaif2p0",
220
+ "vaif3p0",
221
+ "vaif3s0",
222
+ "vaii1p0",
223
+ "vaii1s0",
224
+ "vaii3p0",
225
+ "vaii3s0",
226
+ "vaip1p0",
227
+ "vaip1s0",
228
+ "vaip2p0",
229
+ "vaip2s0",
230
+ "vaip3p0",
231
+ "vaip3s0",
232
+ "van0000",
233
+ "vap00sm",
234
+ "vasi100",
235
+ "vasi1p0",
236
+ "vasi3p0",
237
+ "vasi3s0",
238
+ "vasp1p0",
239
+ "vasp3p0",
240
+ "vasp3s0",
241
+ "vm00000",
242
+ "vmg0000",
243
+ "vmic1p0",
244
+ "vmic1s0",
245
+ "vmic3p0",
246
+ "vmic3s0",
247
+ "vmif1p0",
248
+ "vmif1s0",
249
+ "vmif2p0",
250
+ "vmif3p0",
251
+ "vmif3s0",
252
+ "vmii1p0",
253
+ "vmii1s0",
254
+ "vmii3p0",
255
+ "vmii3s0",
256
+ "vmip1p0",
257
+ "vmip1s0",
258
+ "vmip2p0",
259
+ "vmip2s0",
260
+ "vmip3p0",
261
+ "vmip3s0",
262
+ "vmis3p0",
263
+ "vmis3s0",
264
+ "vmm01p0",
265
+ "vmm02s0",
266
+ "vmm03p0",
267
+ "vmm03s0",
268
+ "vmn0000",
269
+ "vmp0000",
270
+ "vmp00fs",
271
+ "vmp00mp",
272
+ "vmp00ms",
273
+ "vmp00pf",
274
+ "vmp00pm",
275
+ "vmp00sf",
276
+ "vmp00sm",
277
+ "vmsi1p0",
278
+ "vmsi1s0",
279
+ "vmsi3p0",
280
+ "vmsi3s0",
281
+ "vmsp1p0",
282
+ "vmsp1s0",
283
+ "vmsp2p0",
284
+ "vmsp2s0",
285
+ "vmsp3p0",
286
+ "vmsp3s0",
287
+ "vsg0000",
288
+ "vsic3p0",
289
+ "vsic3s0",
290
+ "vsif3p0",
291
+ "vsif3s0",
292
+ "vsii1p0",
293
+ "vsii1s0",
294
+ "vsii3p0",
295
+ "vsii3s0",
296
+ "vsip1p0",
297
+ "vsip1s0",
298
+ "vsip2s0",
299
+ "vsip3p0",
300
+ "vsip3s0",
301
+ "vsis3p0",
302
+ "vsis3s0",
303
+ "vsm03p0",
304
+ "vsm03s0",
305
+ "vsn0000",
306
+ "vsp00sm",
307
+ "vssi3p0",
308
+ "vssi3s0",
309
+ "vssp1p0",
310
+ "vssp3p0",
311
+ "vssp3s0",
312
+ "zm",
313
+ "zp"
314
+ ],
315
+ "morphologizer":[
316
+ "Definite=Def|Gender=Masc|Number=Sing|POS=DET|PronType=Art",
317
+ "POS=PROPN",
318
+ "POS=PUNCT|PunctSide=Ini|PunctType=Brck",
319
+ "POS=PUNCT|PunctSide=Fin|PunctType=Brck",
320
+ "Mood=Ind|Number=Sing|POS=AUX|Person=3|Tense=Pres|VerbForm=Fin",
321
+ "Gender=Masc|Number=Sing|POS=VERB|Tense=Past|VerbForm=Part",
322
+ "Definite=Def|Gender=Fem|Number=Sing|POS=DET|PronType=Art",
323
+ "Gender=Fem|Number=Sing|POS=NOUN",
324
+ "POS=ADP",
325
+ "NumType=Card|Number=Plur|POS=NUM",
326
+ "Gender=Masc|Number=Plur|POS=NOUN",
327
+ "Number=Sing|POS=ADJ",
328
+ "POS=CCONJ",
329
+ "Gender=Fem|Number=Sing|POS=DET|PronType=Ind",
330
+ "NumForm=Digit|NumType=Card|POS=NUM",
331
+ "NumForm=Digit|POS=NOUN",
332
+ "Gender=Masc|Number=Plur|POS=ADJ",
333
+ "POS=PUNCT|PunctType=Comm",
334
+ "POS=AUX|VerbForm=Inf",
335
+ "Case=Acc,Dat|POS=PRON|Person=3|PrepCase=Npr|PronType=Prs|Reflex=Yes",
336
+ "Definite=Def|Gender=Masc|Number=Plur|POS=DET|PronType=Art",
337
+ "POS=PRON|PronType=Rel",
338
+ "Mood=Ind|Number=Plur|POS=VERB|Person=3|Tense=Imp|VerbForm=Fin",
339
+ "Gender=Fem|Number=Sing|POS=DET|PronType=Art",
340
+ "Gender=Fem|Number=Sing|POS=DET|Person=3|Poss=Yes|PronType=Prs",
341
+ "Definite=Def|Gender=Fem|Number=Plur|POS=DET|PronType=Art",
342
+ "Gender=Fem|Number=Plur|POS=NOUN",
343
+ "Gender=Fem|Number=Plur|POS=ADJ",
344
+ "POS=VERB|VerbForm=Inf",
345
+ "Case=Acc,Dat|Number=Plur|POS=PRON|Person=3|PronType=Prs",
346
+ "Number=Plur|POS=ADJ",
347
+ "POS=PUNCT|PunctType=Peri",
348
+ "Number=Sing|POS=PRON|PronType=Rel",
349
+ "Gender=Masc|Number=Sing|POS=NOUN",
350
+ "Mood=Imp|Number=Sing|POS=VERB|Person=2|VerbForm=Fin",
351
+ "Gender=Masc|Number=Plur|POS=ADJ|VerbForm=Part",
352
+ "POS=SCONJ",
353
+ "Mood=Ind|Number=Plur|POS=AUX|Person=3|Tense=Pres|VerbForm=Fin",
354
+ "Gender=Masc|Number=Plur|POS=VERB|Tense=Past|VerbForm=Part",
355
+ "Definite=Def|Number=Sing|POS=DET|PronType=Art",
356
+ "Gender=Masc|Number=Sing|POS=DET|PronType=Ind",
357
+ "Gender=Fem|Number=Plur|POS=ADJ|VerbForm=Part",
358
+ "Gender=Masc|Number=Sing|POS=DET|PronType=Dem",
359
+ "POS=VERB|VerbForm=Ger",
360
+ "POS=NOUN",
361
+ "Gender=Fem|NumType=Card|Number=Sing|POS=NUM",
362
+ "Gender=Fem|Number=Sing|POS=ADJ|VerbForm=Part",
363
+ "Gender=Fem|NumType=Ord|Number=Plur|POS=ADJ",
364
+ "POS=PUNCT|PunctType=Quot",
365
+ "Gender=Masc|Number=Sing|POS=ADJ",
366
+ "Gender=Masc|Number=Sing|POS=ADJ|VerbForm=Part",
367
+ "Mood=Ind|Number=Sing|POS=VERB|Person=3|Tense=Pres|VerbForm=Fin",
368
+ "Gender=Fem|Number=Sing|POS=DET|PronType=Dem",
369
+ "POS=ADV|Polarity=Neg",
370
+ "POS=ADV",
371
+ "Number=Sing|POS=PRON|PronType=Dem",
372
+ "Number=Sing|POS=NOUN",
373
+ "Mood=Ind|Number=Plur|POS=VERB|Person=3|Tense=Pres|VerbForm=Fin",
374
+ "Number=Plur|POS=NOUN",
375
+ "Mood=Sub|Number=Plur|POS=VERB|Person=3|Tense=Imp|VerbForm=Fin",
376
+ "Gender=Fem|Number=Sing|POS=ADJ",
377
+ "Mood=Sub|Number=Sing|POS=VERB|Person=1|Tense=Pres|VerbForm=Fin",
378
+ "Gender=Masc|Number=Sing|POS=PRON|PronType=Tot",
379
+ "Case=Loc|POS=PRON|Person=3|PronType=Prs",
380
+ "Gender=Fem|NumType=Ord|Number=Sing|POS=ADJ",
381
+ "Degree=Cmp|POS=ADV",
382
+ "Gender=Fem|Number=Plur|POS=DET|PronType=Art",
383
+ "Gender=Fem|Number=Plur|POS=DET|Person=3|Poss=Yes|PronType=Prs",
384
+ "Mood=Ind|Number=Sing|POS=VERB|Person=3|Tense=Fut|VerbForm=Fin",
385
+ "Gender=Masc|NumType=Ord|Number=Sing|POS=ADJ",
386
+ "Mood=Ind|Number=Sing|POS=AUX|Person=3|Tense=Fut|VerbForm=Fin",
387
+ "NumType=Card|POS=NUM",
388
+ "Mood=Ind|Number=Plur|POS=VERB|Person=3|Tense=Fut|VerbForm=Fin",
389
+ "Number=Sing|POS=PRON|PronType=Ind",
390
+ "Gender=Masc|Number=Sing|POS=DET|PronType=Art",
391
+ "Number=Plur|POS=DET|PronType=Ind",
392
+ "Mood=Sub|Number=Plur|POS=VERB|Person=3|Tense=Pres|VerbForm=Fin",
393
+ "Gender=Masc|Number=Plur|POS=DET|PronType=Dem",
394
+ "Mood=Ind|Number=Plur|POS=AUX|Person=3|Tense=Fut|VerbForm=Fin",
395
+ "Gender=Masc|NumType=Card|Number=Sing|POS=NUM",
396
+ "Mood=Sub|Number=Plur|POS=AUX|Person=3|Tense=Pres|VerbForm=Fin",
397
+ "Case=Acc|Gender=Fem|Number=Sing|POS=PRON|Person=3|PronType=Prs",
398
+ "Number=Sing|POS=DET|PronType=Ind",
399
+ "POS=PUNCT",
400
+ "Number=Sing|POS=DET|PronType=Rel",
401
+ "Case=Gen|POS=PRON|Person=3|PronType=Prs",
402
+ "Gender=Fem|NumType=Card|Number=Plur|POS=NUM",
403
+ "Mood=Ind|Number=Plur|POS=VERB|Person=1|Tense=Pres|VerbForm=Fin",
404
+ "POS=DET|PronType=Ind",
405
+ "Case=Acc|Gender=Neut|Number=Sing|POS=PRON|Person=3|PronType=Prs",
406
+ "Case=Acc,Dat|Number=Plur|POS=PRON|Person=1|PronType=Prs",
407
+ "Degree=Cmp|Number=Sing|POS=ADJ",
408
+ "Gender=Masc|Number=Plur|POS=PRON|PronType=Ind",
409
+ "Gender=Fem|Number=Plur|POS=DET|PronType=Dem",
410
+ "Gender=Masc|Number=Plur|POS=DET|PronType=Art",
411
+ "Gender=Masc|Number=Plur|POS=DET|Person=3|Poss=Yes|PronType=Prs",
412
+ "Case=Acc|Gender=Fem,Masc|Number=Sing|POS=PRON|Person=3|PronType=Prs",
413
+ "Gender=Fem|Number=Sing|POS=VERB|Tense=Past|VerbForm=Part",
414
+ "Gender=Masc|Number=Sing|POS=PRON|PronType=Ind",
415
+ "Gender=Fem|Number=Plur|POS=PRON|PronType=Ind",
416
+ "Mood=Sub|Number=Sing|POS=VERB|Person=3|Tense=Pres|VerbForm=Fin",
417
+ "Number=Plur|POS=PRON|PronType=Rel",
418
+ "Gender=Masc|Number=Plur|POS=DET|PronType=Int",
419
+ "Mood=Ind|Number=Plur|POS=AUX|Person=3|Tense=Imp|VerbForm=Fin",
420
+ "AdvType=Tim|POS=NOUN",
421
+ "Gender=Masc|Number=Plur|POS=DET|PronType=Ind",
422
+ "Gender=Fem|Number=Plur|POS=DET|PronType=Ind",
423
+ "Gender=Masc|Number=Sing|POS=DET|PronType=Int",
424
+ "Mood=Cnd|Number=Sing|POS=AUX|Person=3|VerbForm=Fin",
425
+ "Mood=Ind|Number=Sing|POS=VERB|Person=3|Tense=Imp|VerbForm=Fin",
426
+ "Number=Sing|POS=DET|PronType=Art",
427
+ "Gender=Masc|Number=Sing|POS=DET|Person=3|Poss=Yes|PronType=Prs",
428
+ "Case=Acc|Gender=Masc|Number=Sing|POS=PRON|Person=3|PronType=Prs",
429
+ "Gender=Masc|Number=Sing|POS=PRON|PronType=Int",
430
+ "POS=PUNCT|PunctType=Semi",
431
+ "Mood=Cnd|Number=Plur|POS=AUX|Person=3|VerbForm=Fin",
432
+ "Case=Dat|Number=Sing|POS=PRON|Person=3|PronType=Prs",
433
+ "Gender=Masc|NumType=Card|Number=Plur|POS=NUM",
434
+ "Mood=Ind|Number=Sing|POS=AUX|Person=3|Tense=Imp|VerbForm=Fin",
435
+ "Gender=Fem|Number=Sing|POS=PRON|PronType=Ind",
436
+ "Mood=Sub|Number=Sing|POS=AUX|Person=3|Tense=Imp|VerbForm=Fin",
437
+ "NumForm=Digit|POS=SYM",
438
+ "Gender=Masc|Number=Sing|POS=AUX|Tense=Past|VerbForm=Part",
439
+ "Gender=Fem|Number=Sing|POS=PRON|PronType=Int",
440
+ "Gender=Fem|Number=Sing|POS=DET|PronType=Int",
441
+ "POS=PRON|PronType=Int",
442
+ "Gender=Fem|Number=Plur|POS=DET|PronType=Int",
443
+ "Mood=Cnd|Number=Sing|POS=VERB|Person=3|VerbForm=Fin",
444
+ "Mood=Cnd|Number=Plur|POS=VERB|Person=3|VerbForm=Fin",
445
+ "POS=PART",
446
+ "Gender=Fem|Number=Sing|POS=PRON|PronType=Dem",
447
+ "Gender=Masc|Number=Sing|POS=DET|PronType=Tot",
448
+ "Gender=Masc|Number=Plur|POS=PRON|PronType=Dem",
449
+ "POS=ADJ",
450
+ "Gender=Masc|Number=Plur|POS=PRON|Person=3|PronType=Prs",
451
+ "Degree=Cmp|Number=Plur|POS=ADJ",
452
+ "POS=PUNCT|PunctType=Dash",
453
+ "Mood=Sub|Number=Sing|POS=AUX|Person=3|Tense=Pres|VerbForm=Fin",
454
+ "Case=Acc|Gender=Fem|Number=Plur|POS=PRON|Person=3|PronType=Prs",
455
+ "Mood=Sub|Number=Sing|POS=VERB|Person=3|Tense=Imp|VerbForm=Fin",
456
+ "Gender=Fem|Number=Plur|POS=VERB|Tense=Past|VerbForm=Part",
457
+ "Gender=Fem|Number=Sing|POS=PRON|Person=3|PronType=Prs",
458
+ "Gender=Masc|POS=NOUN",
459
+ "Mood=Ind|Number=Sing|POS=VERB|Person=3|Tense=Past|VerbForm=Fin",
460
+ "Gender=Fem|Number=Plur|POS=PRON|PronType=Int",
461
+ "Gender=Masc|NumType=Ord|Number=Plur|POS=ADJ",
462
+ "Mood=Ind|Number=Plur|POS=VERB|Person=1|Tense=Fut|VerbForm=Fin",
463
+ "POS=PUNCT|PunctType=Colo",
464
+ "Gender=Masc|NumType=Card|POS=NUM",
465
+ "Gender=Masc|Number=Sing|POS=PRON|Person=3|PronType=Prs",
466
+ "Number=Sing|POS=PRON|PronType=Int",
467
+ "Mood=Ind|Number=Plur|POS=AUX|Person=1|Tense=Fut|VerbForm=Fin",
468
+ "Mood=Imp|Number=Sing|POS=VERB|Person=3|VerbForm=Fin",
469
+ "Gender=Fem|Number=Sing|Number[psor]=Plur|POS=DET|Person=1|Poss=Yes|PronType=Prs",
470
+ "Gender=Masc|Number=Sing|Number[psor]=Plur|POS=DET|Person=1|Poss=Yes|PronType=Prs",
471
+ "POS=AUX|VerbForm=Ger",
472
+ "Gender=Fem|Number=Plur|POS=PRON|Person=3|PronType=Prs",
473
+ "Mood=Imp|Number=Sing|POS=AUX|Person=3|VerbForm=Fin",
474
+ "Number=Plur|POS=PRON|PronType=Ind",
475
+ "Gender=Masc|Number=Sing|POS=PRON|PronType=Dem",
476
+ "Case=Acc,Dat|Number=Sing|POS=PRON|Person=2|Polite=Infm|PrepCase=Npr|PronType=Prs",
477
+ "Gender=Masc|Number=Plur|POS=PRON|PronType=Int",
478
+ "Mood=Ind|Number=Plur|POS=AUX|Person=1|Tense=Pres|VerbForm=Fin",
479
+ "NumForm=Digit|NumType=Frac|POS=NUM",
480
+ "Gender=Fem|Number=Plur|POS=PRON|PronType=Dem",
481
+ "Gender=Fem|POS=NOUN",
482
+ "Case=Acc,Dat|Number=Sing|POS=PRON|Person=1|PrepCase=Npr|PronType=Prs",
483
+ "Mood=Sub|Number=Plur|POS=VERB|Person=2|Tense=Pres|VerbForm=Fin",
484
+ "Mood=Ind|Number=Plur|POS=AUX|Person=2|Tense=Fut|VerbForm=Fin",
485
+ "Mood=Sub|Number=Plur|POS=AUX|Person=1|Tense=Pres|VerbForm=Fin",
486
+ "Mood=Sub|Number=Plur|POS=AUX|Person=3|Tense=Imp|VerbForm=Fin",
487
+ "Number=Plur|POS=PRON|Person=1|PronType=Prs",
488
+ "Mood=Ind|Number=Sing|POS=VERB|Person=1|Tense=Pres|VerbForm=Fin",
489
+ "Case=Nom|Number=Sing|POS=PRON|Person=2|Polite=Infm|PronType=Prs",
490
+ "POS=X",
491
+ "Mood=Cnd|Number=Plur|POS=AUX|Person=1|VerbForm=Fin",
492
+ "Number=Sing|POS=DET|PronType=Dem",
493
+ "Mood=Ind|Number=Sing|POS=VERB|Person=1|Tense=Fut|VerbForm=Fin",
494
+ "Mood=Ind|Number=Sing|POS=AUX|Person=1|Tense=Pres|VerbForm=Fin",
495
+ "POS=DET|PronType=Art",
496
+ "Gender=Masc|Number=Sing|POS=PRON|Person=3|Poss=Yes|PronType=Prs",
497
+ "NumType=Ord|Number=Sing|POS=ADJ",
498
+ "Number=Plur|Number[psor]=Plur|POS=DET|Person=1|Poss=Yes|PronType=Prs",
499
+ "Number=Plur|POS=PRON|PronType=Dem",
500
+ "Mood=Imp|Number=Plur|POS=VERB|Person=1|VerbForm=Fin",
501
+ "POS=PRON|PronType=Ind",
502
+ "POS=SYM",
503
+ "Mood=Ind|Number=Sing|POS=VERB|Person=2|Tense=Pres|VerbForm=Fin",
504
+ "Mood=Imp|Number=Plur|POS=VERB|Person=3|VerbForm=Fin",
505
+ "POS=VERB|VerbForm=Fin",
506
+ "Case=Nom|Number=Sing|POS=PRON|Person=1|PronType=Prs",
507
+ "Case=Acc|Number=Sing|POS=PRON|Person=1|PrepCase=Pre|PronType=Prs",
508
+ "Mood=Ind|Number=Sing|POS=AUX|Person=2|Tense=Pres|VerbForm=Fin",
509
+ "NumForm=Digit|NumType=Frac|POS=SYM",
510
+ "NumType=Card|Number=Sing|POS=NUM",
511
+ "POS=PUNCT|PunctSide=Ini|PunctType=Qest",
512
+ "POS=PUNCT|PunctSide=Fin|PunctType=Qest",
513
+ "NumForm=Digit|NumType=Ord|POS=ADJ",
514
+ "Foreign=Yes|POS=PRON|PronType=Int",
515
+ "Foreign=Yes|Mood=Ind|POS=VERB|VerbForm=Fin",
516
+ "Foreign=Yes|POS=ADP",
517
+ "Gender=Masc|Number=Sing|POS=PROPN",
518
+ "Case=Acc|POS=PRON|Person=3|PrepCase=Pre|PronType=Prs|Reflex=Yes",
519
+ "Mood=Ind|Number=Plur|POS=VERB|Person=2|Tense=Pres|VerbForm=Fin",
520
+ "POS=PUNCT|PunctSide=Ini|PunctType=Excl",
521
+ "POS=PUNCT|PunctSide=Fin|PunctType=Excl",
522
+ "Gender=Masc|Number=Sing|Number[psor]=Sing|POS=DET|Person=1|Poss=Yes|PronType=Prs",
523
+ "Mood=Cnd|Number=Sing|POS=VERB|Person=1|VerbForm=Fin",
524
+ "Mood=Ind|Number=Sing|POS=VERB|Person=1|Tense=Imp|VerbForm=Fin",
525
+ "Gender=Masc|Number=Plur|POS=PRON|Person=3|Poss=Yes|PronType=Prs",
526
+ "POS=NUM",
527
+ "Mood=Imp|Number=Plur|POS=AUX|Person=3|VerbForm=Fin",
528
+ "Case=Nom|POS=PRON|Person=3|PronType=Prs",
529
+ "Mood=Cnd|Number=Sing|POS=AUX|Person=1|VerbForm=Fin",
530
+ "Number=Plur|POS=PRON|Person=2|Polite=Form|PronType=Prs",
531
+ "Mood=Sub|POS=AUX|Person=1|Tense=Imp|VerbForm=Fin",
532
+ "POS=PUNCT|PunctSide=Ini|PunctType=Comm",
533
+ "POS=PUNCT|PunctSide=Fin|PunctType=Comm",
534
+ "Number=Plur|POS=PRON|Person=2|PronType=Prs",
535
+ "Mood=Ind|Number=Plur|POS=AUX|Person=2|Tense=Pres|VerbForm=Fin",
536
+ "Case=Acc,Dat|Number=Plur|POS=PRON|Person=2|PronType=Prs",
537
+ "Mood=Cnd|Number=Plur|POS=VERB|Person=1|VerbForm=Fin",
538
+ "Mood=Ind|Number=Plur|POS=AUX|Person=1|Tense=Imp|VerbForm=Fin",
539
+ "Gender=Masc|Number=Plur|Number[psor]=Sing|POS=DET|Person=1|Poss=Yes|PronType=Prs",
540
+ "Mood=Ind|Number=Plur|POS=VERB|Person=1|Tense=Imp|VerbForm=Fin",
541
+ "Mood=Sub|Number=Plur|POS=VERB|Person=1|Tense=Pres|VerbForm=Fin",
542
+ "Definite=Ind|Gender=Masc|Number=Sing|POS=DET|PronType=Art",
543
+ "Number=Sing|POS=PRON|Person=2|Polite=Form|PronType=Prs",
544
+ "Gender=Masc|Number=Sing|Number[psor]=Sing|POS=DET|Person=2|Poss=Yes|PronType=Prs",
545
+ "POS=VERB|Tense=Past|VerbForm=Part",
546
+ "Mood=Ind|Number=Sing|POS=AUX|Person=3|Tense=Past|VerbForm=Fin",
547
+ "Foreign=Yes|POS=NOUN",
548
+ "Definite=Def|Foreign=Yes|Gender=Masc|Number=Sing|POS=DET|PronType=Art",
549
+ "Foreign=Yes|POS=VERB",
550
+ "Foreign=Yes|POS=ADJ",
551
+ "Foreign=Yes|POS=DET",
552
+ "Foreign=Yes|POS=ADV",
553
+ "Definite=Ind|Gender=Fem|Number=Plur|POS=DET|PronType=Art",
554
+ "POS=INTJ",
555
+ "Mood=Ind|Number=Sing|POS=AUX|Person=1|Tense=Imp|VerbForm=Fin",
556
+ "Mood=Sub|Number=Sing|POS=VERB|Person=2|Tense=Pres|VerbForm=Fin",
557
+ "Case=Acc|POS=PRON|Person=3|PronType=Prs|Reflex=Yes",
558
+ "AdvType=Tim|POS=SYM",
559
+ "Gender=Fem|Number=Sing|POS=PRON|Person=3|Poss=Yes|PronType=Prs",
560
+ "Definite=Ind|Gender=Fem|Number=Sing|POS=DET|PronType=Art",
561
+ "AdvType=Tim|Degree=Cmp|POS=ADV",
562
+ "Case=Acc|Number=Sing|POS=PRON|Person=2|Polite=Infm|PrepCase=Pre|PronType=Prs",
563
+ "Mood=Sub|Number=Plur|POS=VERB|Person=1|Tense=Imp|VerbForm=Fin",
564
+ "Degree=Cmp|POS=ADJ",
565
+ "POS=DET",
566
+ "Gender=Masc|Number=Sing|Number[psor]=Plur|POS=PRON|Person=1|Poss=Yes|PronType=Prs",
567
+ "Number=Plur|Number[psor]=Plur|POS=PRON|Person=1|Poss=Yes|PronType=Prs",
568
+ "Mood=Ind|Number=Plur|POS=VERB|Person=2|Tense=Fut|VerbForm=Fin",
569
+ "Mood=Sub|Number=Sing|POS=AUX|Person=1|Tense=Pres|VerbForm=Fin",
570
+ "Gender=Masc|POS=SYM",
571
+ "Mood=Ind|Number=Plur|POS=VERB|Person=3|Tense=Past|VerbForm=Fin",
572
+ "Mood=Sub|Number=Sing|POS=VERB|Person=1|Tense=Imp|VerbForm=Fin",
573
+ "POS=DET|PronType=Rel",
574
+ "Gender=Fem|NumType=Card|POS=NUM",
575
+ "Mood=Ind|Number=Plur|POS=AUX|Person=3|Tense=Past|VerbForm=Fin",
576
+ "Mood=Sub|Number=Plur|POS=AUX|Person=1|Tense=Imp|VerbForm=Fin",
577
+ "POS=AUX|Tense=Past|VerbForm=Part",
578
+ "Foreign=Yes|Mood=Ind|Number=Sing|POS=AUX|Person=3|Tense=Pres|VerbForm=Fin",
579
+ "Foreign=Yes|Gender=Masc|Number=Sing|POS=PRON|Person=3|PronType=Prs",
580
+ "Foreign=Yes|POS=SCONJ",
581
+ "Foreign=Yes|Gender=Fem|Number=Sing|POS=DET|PronType=Art",
582
+ "Mood=Ind|Number=Sing|POS=AUX|Person=1|Tense=Fut|VerbForm=Fin",
583
+ "Number=Sing|POS=DET|Person=3|Poss=Yes|PronType=Prs",
584
+ "Gender=Fem|Number=Sing|Number[psor]=Sing|POS=DET|Person=2|Poss=Yes|PronType=Prs",
585
+ "Gender=Fem|Number=Sing|Number[psor]=Sing|POS=PRON|Person=3|Poss=Yes|PronType=Prs",
586
+ "Gender=Masc|Number=Plur|Number[psor]=Sing|POS=DET|Person=2|Poss=Yes|PronType=Prs",
587
+ "Definite=Ind|Number=Sing|POS=DET|PronType=Art",
588
+ "Gender=Fem|Number=Plur|POS=PRON|Person=3|Poss=Yes|PronType=Prs",
589
+ "Gender=Fem|Number=Sing|POS=PROPN",
590
+ "Number=Plur|POS=DET|PronType=Dem",
591
+ "Gender=Masc|Number=Sing|POS=PRON|PronType=Rel"
592
+ ],
593
+ "lemmatizer":[
594
+
595
+ ],
596
+ "parser":[
597
+ "ROOT",
598
+ "acl",
599
+ "advcl",
600
+ "advmod",
601
+ "amod",
602
+ "appos",
603
+ "aux",
604
+ "case",
605
+ "cc",
606
+ "ccomp",
607
+ "compound",
608
+ "conj",
609
+ "cop",
610
+ "csubj",
611
+ "dep",
612
+ "det",
613
+ "expl:pass",
614
+ "fixed",
615
+ "flat",
616
+ "iobj",
617
+ "mark",
618
+ "nmod",
619
+ "nsubj",
620
+ "nummod",
621
+ "obj",
622
+ "obl",
623
+ "parataxis",
624
+ "punct",
625
+ "xcomp"
626
+ ],
627
+ "ner":[
628
+ "LOC",
629
+ "MISC",
630
+ "ORG",
631
+ "PER"
632
+ ]
633
+ },
634
+ "pipeline":[
635
+ "transformer",
636
+ "tagger",
637
+ "morphologizer",
638
+ "lemmatizer",
639
+ "parser",
640
+ "ner"
641
+ ],
642
+ "components":[
643
+ "transformer",
644
+ "tagger",
645
+ "morphologizer",
646
+ "lemmatizer",
647
+ "parser",
648
+ "ner"
649
+ ],
650
+ "disabled":[
651
+
652
+ ],
653
+ "performance":{
654
+ "tag_acc":0.9751561894,
655
+ "pos_acc":0.9923557547,
656
+ "morph_acc":0.9896239098,
657
+ "morph_per_feat":{
658
+ "Mood":{
659
+ "p":0.9982762866,
660
+ "r":0.9975393701,
661
+ "f":0.9979076923
662
+ },
663
+ "Number":{
664
+ "p":0.9987768024,
665
+ "r":0.9964466458,
666
+ "f":0.9976103635
667
+ },
668
+ "Person":{
669
+ "p":0.9982300885,
670
+ "r":0.9978768577,
671
+ "f":0.9980534419
672
+ },
673
+ "Tense":{
674
+ "p":0.9945526922,
675
+ "r":0.9953868736,
676
+ "f":0.994969608
677
+ },
678
+ "VerbForm":{
679
+ "p":0.997467342,
680
+ "r":0.9966702184,
681
+ "f":0.9970686209
682
+ },
683
+ "Gender":{
684
+ "p":0.9970477205,
685
+ "r":0.9920543196,
686
+ "f":0.9945447523
687
+ },
688
+ "NumType":{
689
+ "p":0.9650943396,
690
+ "r":0.9641847314,
691
+ "f":0.9646393211
692
+ },
693
+ "Definite":{
694
+ "p":0.9974929951,
695
+ "r":0.9964643489,
696
+ "f":0.9969784067
697
+ },
698
+ "PronType":{
699
+ "p":0.9961138802,
700
+ "r":0.9961138802,
701
+ "f":0.9961138802
702
+ },
703
+ "PunctType":{
704
+ "p":0.9998310525,
705
+ "r":0.9989871708,
706
+ "f":0.9994089335
707
+ },
708
+ "NumForm":{
709
+ "p":0.9819694868,
710
+ "r":0.9943820225,
711
+ "f":0.988136776
712
+ },
713
+ "Polarity":{
714
+ "p":1.0,
715
+ "r":0.9935275081,
716
+ "f":0.9967532468
717
+ },
718
+ "Case":{
719
+ "p":0.9983333333,
720
+ "r":0.9983333333,
721
+ "f":0.9983333333
722
+ },
723
+ "PrepCase":{
724
+ "p":0.9972413793,
725
+ "r":1.0,
726
+ "f":0.9986187845
727
+ },
728
+ "Reflex":{
729
+ "p":0.9986072423,
730
+ "r":1.0,
731
+ "f":0.9993031359
732
+ },
733
+ "Degree":{
734
+ "p":0.9964664311,
735
+ "r":0.9964664311,
736
+ "f":0.9964664311
737
+ },
738
+ "Poss":{
739
+ "p":0.9914529915,
740
+ "r":0.9971346705,
741
+ "f":0.9942857143
742
+ },
743
+ "AdvType":{
744
+ "p":1.0,
745
+ "r":0.9197080292,
746
+ "f":0.9581749049
747
+ },
748
+ "PunctSide":{
749
+ "p":0.9975728155,
750
+ "r":0.9927536232,
751
+ "f":0.995157385
752
+ },
753
+ "Number[psor]":{
754
+ "p":1.0,
755
+ "r":1.0,
756
+ "f":1.0
757
+ },
758
+ "Foreign":{
759
+ "p":0.0,
760
+ "r":0.0,
761
+ "f":0.0
762
+ },
763
+ "Polite":{
764
+ "p":1.0,
765
+ "r":0.3333333333,
766
+ "f":0.5
767
+ }
768
+ },
769
+ "lemma_acc":0.9648130959,
770
+ "dep_uas":0.9525272994,
771
+ "dep_las":0.934621442,
772
+ "dep_las_per_type":{
773
+ "nsubj":{
774
+ "p":0.9551878663,
775
+ "r":0.9545297968,
776
+ "f":0.9548587181
777
+ },
778
+ "flat":{
779
+ "p":0.9321291735,
780
+ "r":0.9326396495,
781
+ "f":0.9323843416
782
+ },
783
+ "case":{
784
+ "p":0.9767639903,
785
+ "r":0.9738023044,
786
+ "f":0.9752808989
787
+ },
788
+ "aux":{
789
+ "p":0.9696805631,
790
+ "r":0.9749591726,
791
+ "f":0.9723127036
792
+ },
793
+ "root":{
794
+ "p":0.967251462,
795
+ "r":0.9678174371,
796
+ "f":0.9675343668
797
+ },
798
+ "nummod":{
799
+ "p":0.920071048,
800
+ "r":0.9168141593,
801
+ "f":0.9184397163
802
+ },
803
+ "obj":{
804
+ "p":0.9253548703,
805
+ "r":0.9372830937,
806
+ "f":0.9312807882
807
+ },
808
+ "det":{
809
+ "p":0.9877721763,
810
+ "r":0.9890452153,
811
+ "f":0.9884082859
812
+ },
813
+ "nmod":{
814
+ "p":0.8921591712,
815
+ "r":0.8927898209,
816
+ "f":0.8924743846
817
+ },
818
+ "amod":{
819
+ "p":0.9656214583,
820
+ "r":0.9634376178,
821
+ "f":0.9645283019
822
+ },
823
+ "obl":{
824
+ "p":0.8240566038,
825
+ "r":0.7944520236,
826
+ "f":0.808983561
827
+ },
828
+ "fixed":{
829
+ "p":0.9382129278,
830
+ "r":0.9147358665,
831
+ "f":0.9263256687
832
+ },
833
+ "conj":{
834
+ "p":0.8374164811,
835
+ "r":0.8609044076,
836
+ "f":0.8489980243
837
+ },
838
+ "advmod":{
839
+ "p":0.8960887332,
840
+ "r":0.8924418605,
841
+ "f":0.8942615788
842
+ },
843
+ "advcl":{
844
+ "p":0.7814485388,
845
+ "r":0.7706766917,
846
+ "f":0.7760252366
847
+ },
848
+ "compound":{
849
+ "p":0.8786764706,
850
+ "r":0.8722627737,
851
+ "f":0.8754578755
852
+ },
853
+ "mark":{
854
+ "p":0.9396401625,
855
+ "r":0.9467836257,
856
+ "f":0.9431983688
857
+ },
858
+ "cop":{
859
+ "p":0.875,
860
+ "r":0.9242424242,
861
+ "f":0.8989473684
862
+ },
863
+ "ccomp":{
864
+ "p":0.8617710583,
865
+ "r":0.8847006652,
866
+ "f":0.8730853392
867
+ },
868
+ "acl":{
869
+ "p":0.861163227,
870
+ "r":0.8843930636,
871
+ "f":0.8726235741
872
+ },
873
+ "cc":{
874
+ "p":0.9465838509,
875
+ "r":0.9615141956,
876
+ "f":0.9539906103
877
+ },
878
+ "expl:pass":{
879
+ "p":0.8333333333,
880
+ "r":0.7608695652,
881
+ "f":0.7954545455
882
+ },
883
+ "appos":{
884
+ "p":0.8326898327,
885
+ "r":0.8263090677,
886
+ "f":0.8294871795
887
+ },
888
+ "xcomp":{
889
+ "p":0.8917050691,
890
+ "r":0.8431372549,
891
+ "f":0.8667413214
892
+ },
893
+ "iobj":{
894
+ "p":0.8352272727,
895
+ "r":0.7860962567,
896
+ "f":0.8099173554
897
+ },
898
+ "dep":{
899
+ "p":0.0,
900
+ "r":0.0,
901
+ "f":0.0
902
+ },
903
+ "csubj":{
904
+ "p":0.819047619,
905
+ "r":0.8113207547,
906
+ "f":0.8151658768
907
+ },
908
+ "parataxis":{
909
+ "p":0.775862069,
910
+ "r":0.652173913,
911
+ "f":0.7086614173
912
+ },
913
+ "nsubj:pass":{
914
+ "p":0.0,
915
+ "r":0.0,
916
+ "f":0.0
917
+ },
918
+ "acl:relcl":{
919
+ "p":0.0,
920
+ "r":0.0,
921
+ "f":0.0
922
+ }
923
+ },
924
+ "sents_p":0.9970760234,
925
+ "sents_r":0.99765945,
926
+ "sents_f":0.9973676514,
927
+ "ents_f":0.8976552598,
928
+ "ents_p":0.8993650794,
929
+ "ents_r":0.8959519292,
930
+ "ents_per_type":{
931
+ "ORG":{
932
+ "p":0.8924544666,
933
+ "r":0.8825042882,
934
+ "f":0.8874514877
935
+ },
936
+ "LOC":{
937
+ "p":0.9081196581,
938
+ "r":0.9081196581,
939
+ "f":0.9081196581
940
+ },
941
+ "MISC":{
942
+ "p":0.7994923858,
943
+ "r":0.8097686375,
944
+ "f":0.8045977011
945
+ },
946
+ "PER":{
947
+ "p":0.9580209895,
948
+ "r":0.9523099851,
949
+ "f":0.9551569507
950
+ }
951
+ },
952
+ "transformer_loss":139835.8554264442,
953
+ "tagger_loss":6375.5195332356,
954
+ "morphologizer_loss":3492.7060705093,
955
+ "parser_loss":33211.4097747022,
956
+ "ner_loss":891.3188530404
957
+ },
958
+ "requirements":[
959
+ "spacy-transformers>=1.1.8,<1.2.0"
960
+ ]
961
+ }
morphologizer/cfg ADDED
@@ -0,0 +1,560 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "extend":false,
3
+ "labels_morph":{
4
+ "Definite=Def|Gender=Masc|Number=Sing|POS=DET|PronType=Art":"Definite=Def|Gender=Masc|Number=Sing|PronType=Art",
5
+ "POS=PROPN":"",
6
+ "POS=PUNCT|PunctSide=Ini|PunctType=Brck":"PunctSide=Ini|PunctType=Brck",
7
+ "POS=PUNCT|PunctSide=Fin|PunctType=Brck":"PunctSide=Fin|PunctType=Brck",
8
+ "Mood=Ind|Number=Sing|POS=AUX|Person=3|Tense=Pres|VerbForm=Fin":"Mood=Ind|Number=Sing|Person=3|Tense=Pres|VerbForm=Fin",
9
+ "Gender=Masc|Number=Sing|POS=VERB|Tense=Past|VerbForm=Part":"Gender=Masc|Number=Sing|Tense=Past|VerbForm=Part",
10
+ "Definite=Def|Gender=Fem|Number=Sing|POS=DET|PronType=Art":"Definite=Def|Gender=Fem|Number=Sing|PronType=Art",
11
+ "Gender=Fem|Number=Sing|POS=NOUN":"Gender=Fem|Number=Sing",
12
+ "POS=ADP":"",
13
+ "NumType=Card|Number=Plur|POS=NUM":"NumType=Card|Number=Plur",
14
+ "Gender=Masc|Number=Plur|POS=NOUN":"Gender=Masc|Number=Plur",
15
+ "Number=Sing|POS=ADJ":"Number=Sing",
16
+ "POS=CCONJ":"",
17
+ "Gender=Fem|Number=Sing|POS=DET|PronType=Ind":"Gender=Fem|Number=Sing|PronType=Ind",
18
+ "NumForm=Digit|NumType=Card|POS=NUM":"NumForm=Digit|NumType=Card",
19
+ "NumForm=Digit|POS=NOUN":"NumForm=Digit",
20
+ "Gender=Masc|Number=Plur|POS=ADJ":"Gender=Masc|Number=Plur",
21
+ "POS=PUNCT|PunctType=Comm":"PunctType=Comm",
22
+ "POS=AUX|VerbForm=Inf":"VerbForm=Inf",
23
+ "Case=Acc,Dat|POS=PRON|Person=3|PrepCase=Npr|PronType=Prs|Reflex=Yes":"Case=Acc,Dat|Person=3|PrepCase=Npr|PronType=Prs|Reflex=Yes",
24
+ "Definite=Def|Gender=Masc|Number=Plur|POS=DET|PronType=Art":"Definite=Def|Gender=Masc|Number=Plur|PronType=Art",
25
+ "POS=PRON|PronType=Rel":"PronType=Rel",
26
+ "Mood=Ind|Number=Plur|POS=VERB|Person=3|Tense=Imp|VerbForm=Fin":"Mood=Ind|Number=Plur|Person=3|Tense=Imp|VerbForm=Fin",
27
+ "Gender=Fem|Number=Sing|POS=DET|PronType=Art":"Gender=Fem|Number=Sing|PronType=Art",
28
+ "Gender=Fem|Number=Sing|POS=DET|Person=3|Poss=Yes|PronType=Prs":"Gender=Fem|Number=Sing|Person=3|Poss=Yes|PronType=Prs",
29
+ "Definite=Def|Gender=Fem|Number=Plur|POS=DET|PronType=Art":"Definite=Def|Gender=Fem|Number=Plur|PronType=Art",
30
+ "Gender=Fem|Number=Plur|POS=NOUN":"Gender=Fem|Number=Plur",
31
+ "Gender=Fem|Number=Plur|POS=ADJ":"Gender=Fem|Number=Plur",
32
+ "POS=VERB|VerbForm=Inf":"VerbForm=Inf",
33
+ "Case=Acc,Dat|Number=Plur|POS=PRON|Person=3|PronType=Prs":"Case=Acc,Dat|Number=Plur|Person=3|PronType=Prs",
34
+ "Number=Plur|POS=ADJ":"Number=Plur",
35
+ "POS=PUNCT|PunctType=Peri":"PunctType=Peri",
36
+ "Number=Sing|POS=PRON|PronType=Rel":"Number=Sing|PronType=Rel",
37
+ "Gender=Masc|Number=Sing|POS=NOUN":"Gender=Masc|Number=Sing",
38
+ "Mood=Imp|Number=Sing|POS=VERB|Person=2|VerbForm=Fin":"Mood=Imp|Number=Sing|Person=2|VerbForm=Fin",
39
+ "Gender=Masc|Number=Plur|POS=ADJ|VerbForm=Part":"Gender=Masc|Number=Plur|VerbForm=Part",
40
+ "POS=SCONJ":"",
41
+ "Mood=Ind|Number=Plur|POS=AUX|Person=3|Tense=Pres|VerbForm=Fin":"Mood=Ind|Number=Plur|Person=3|Tense=Pres|VerbForm=Fin",
42
+ "Gender=Masc|Number=Plur|POS=VERB|Tense=Past|VerbForm=Part":"Gender=Masc|Number=Plur|Tense=Past|VerbForm=Part",
43
+ "Definite=Def|Number=Sing|POS=DET|PronType=Art":"Definite=Def|Number=Sing|PronType=Art",
44
+ "Gender=Masc|Number=Sing|POS=DET|PronType=Ind":"Gender=Masc|Number=Sing|PronType=Ind",
45
+ "Gender=Fem|Number=Plur|POS=ADJ|VerbForm=Part":"Gender=Fem|Number=Plur|VerbForm=Part",
46
+ "Gender=Masc|Number=Sing|POS=DET|PronType=Dem":"Gender=Masc|Number=Sing|PronType=Dem",
47
+ "POS=VERB|VerbForm=Ger":"VerbForm=Ger",
48
+ "POS=NOUN":"",
49
+ "Gender=Fem|NumType=Card|Number=Sing|POS=NUM":"Gender=Fem|NumType=Card|Number=Sing",
50
+ "Gender=Fem|Number=Sing|POS=ADJ|VerbForm=Part":"Gender=Fem|Number=Sing|VerbForm=Part",
51
+ "Gender=Fem|NumType=Ord|Number=Plur|POS=ADJ":"Gender=Fem|NumType=Ord|Number=Plur",
52
+ "POS=PUNCT|PunctType=Quot":"PunctType=Quot",
53
+ "Gender=Masc|Number=Sing|POS=ADJ":"Gender=Masc|Number=Sing",
54
+ "Gender=Masc|Number=Sing|POS=ADJ|VerbForm=Part":"Gender=Masc|Number=Sing|VerbForm=Part",
55
+ "Mood=Ind|Number=Sing|POS=VERB|Person=3|Tense=Pres|VerbForm=Fin":"Mood=Ind|Number=Sing|Person=3|Tense=Pres|VerbForm=Fin",
56
+ "Gender=Fem|Number=Sing|POS=DET|PronType=Dem":"Gender=Fem|Number=Sing|PronType=Dem",
57
+ "POS=ADV|Polarity=Neg":"Polarity=Neg",
58
+ "POS=ADV":"",
59
+ "Number=Sing|POS=PRON|PronType=Dem":"Number=Sing|PronType=Dem",
60
+ "Number=Sing|POS=NOUN":"Number=Sing",
61
+ "Mood=Ind|Number=Plur|POS=VERB|Person=3|Tense=Pres|VerbForm=Fin":"Mood=Ind|Number=Plur|Person=3|Tense=Pres|VerbForm=Fin",
62
+ "Number=Plur|POS=NOUN":"Number=Plur",
63
+ "Mood=Sub|Number=Plur|POS=VERB|Person=3|Tense=Imp|VerbForm=Fin":"Mood=Sub|Number=Plur|Person=3|Tense=Imp|VerbForm=Fin",
64
+ "Gender=Fem|Number=Sing|POS=ADJ":"Gender=Fem|Number=Sing",
65
+ "Mood=Sub|Number=Sing|POS=VERB|Person=1|Tense=Pres|VerbForm=Fin":"Mood=Sub|Number=Sing|Person=1|Tense=Pres|VerbForm=Fin",
66
+ "Gender=Masc|Number=Sing|POS=PRON|PronType=Tot":"Gender=Masc|Number=Sing|PronType=Tot",
67
+ "Case=Loc|POS=PRON|Person=3|PronType=Prs":"Case=Loc|Person=3|PronType=Prs",
68
+ "Gender=Fem|NumType=Ord|Number=Sing|POS=ADJ":"Gender=Fem|NumType=Ord|Number=Sing",
69
+ "Degree=Cmp|POS=ADV":"Degree=Cmp",
70
+ "Gender=Fem|Number=Plur|POS=DET|PronType=Art":"Gender=Fem|Number=Plur|PronType=Art",
71
+ "Gender=Fem|Number=Plur|POS=DET|Person=3|Poss=Yes|PronType=Prs":"Gender=Fem|Number=Plur|Person=3|Poss=Yes|PronType=Prs",
72
+ "Mood=Ind|Number=Sing|POS=VERB|Person=3|Tense=Fut|VerbForm=Fin":"Mood=Ind|Number=Sing|Person=3|Tense=Fut|VerbForm=Fin",
73
+ "Gender=Masc|NumType=Ord|Number=Sing|POS=ADJ":"Gender=Masc|NumType=Ord|Number=Sing",
74
+ "Mood=Ind|Number=Sing|POS=AUX|Person=3|Tense=Fut|VerbForm=Fin":"Mood=Ind|Number=Sing|Person=3|Tense=Fut|VerbForm=Fin",
75
+ "NumType=Card|POS=NUM":"NumType=Card",
76
+ "Mood=Ind|Number=Plur|POS=VERB|Person=3|Tense=Fut|VerbForm=Fin":"Mood=Ind|Number=Plur|Person=3|Tense=Fut|VerbForm=Fin",
77
+ "Number=Sing|POS=PRON|PronType=Ind":"Number=Sing|PronType=Ind",
78
+ "Gender=Masc|Number=Sing|POS=DET|PronType=Art":"Gender=Masc|Number=Sing|PronType=Art",
79
+ "Number=Plur|POS=DET|PronType=Ind":"Number=Plur|PronType=Ind",
80
+ "Mood=Sub|Number=Plur|POS=VERB|Person=3|Tense=Pres|VerbForm=Fin":"Mood=Sub|Number=Plur|Person=3|Tense=Pres|VerbForm=Fin",
81
+ "Gender=Masc|Number=Plur|POS=DET|PronType=Dem":"Gender=Masc|Number=Plur|PronType=Dem",
82
+ "Mood=Ind|Number=Plur|POS=AUX|Person=3|Tense=Fut|VerbForm=Fin":"Mood=Ind|Number=Plur|Person=3|Tense=Fut|VerbForm=Fin",
83
+ "Gender=Masc|NumType=Card|Number=Sing|POS=NUM":"Gender=Masc|NumType=Card|Number=Sing",
84
+ "Mood=Sub|Number=Plur|POS=AUX|Person=3|Tense=Pres|VerbForm=Fin":"Mood=Sub|Number=Plur|Person=3|Tense=Pres|VerbForm=Fin",
85
+ "Case=Acc|Gender=Fem|Number=Sing|POS=PRON|Person=3|PronType=Prs":"Case=Acc|Gender=Fem|Number=Sing|Person=3|PronType=Prs",
86
+ "Number=Sing|POS=DET|PronType=Ind":"Number=Sing|PronType=Ind",
87
+ "POS=PUNCT":"",
88
+ "Number=Sing|POS=DET|PronType=Rel":"Number=Sing|PronType=Rel",
89
+ "Case=Gen|POS=PRON|Person=3|PronType=Prs":"Case=Gen|Person=3|PronType=Prs",
90
+ "Gender=Fem|NumType=Card|Number=Plur|POS=NUM":"Gender=Fem|NumType=Card|Number=Plur",
91
+ "Mood=Ind|Number=Plur|POS=VERB|Person=1|Tense=Pres|VerbForm=Fin":"Mood=Ind|Number=Plur|Person=1|Tense=Pres|VerbForm=Fin",
92
+ "POS=DET|PronType=Ind":"PronType=Ind",
93
+ "Case=Acc|Gender=Neut|Number=Sing|POS=PRON|Person=3|PronType=Prs":"Case=Acc|Gender=Neut|Number=Sing|Person=3|PronType=Prs",
94
+ "Case=Acc,Dat|Number=Plur|POS=PRON|Person=1|PronType=Prs":"Case=Acc,Dat|Number=Plur|Person=1|PronType=Prs",
95
+ "Degree=Cmp|Number=Sing|POS=ADJ":"Degree=Cmp|Number=Sing",
96
+ "Gender=Masc|Number=Plur|POS=PRON|PronType=Ind":"Gender=Masc|Number=Plur|PronType=Ind",
97
+ "Gender=Fem|Number=Plur|POS=DET|PronType=Dem":"Gender=Fem|Number=Plur|PronType=Dem",
98
+ "Gender=Masc|Number=Plur|POS=DET|PronType=Art":"Gender=Masc|Number=Plur|PronType=Art",
99
+ "Gender=Masc|Number=Plur|POS=DET|Person=3|Poss=Yes|PronType=Prs":"Gender=Masc|Number=Plur|Person=3|Poss=Yes|PronType=Prs",
100
+ "Case=Acc|Gender=Fem,Masc|Number=Sing|POS=PRON|Person=3|PronType=Prs":"Case=Acc|Gender=Fem,Masc|Number=Sing|Person=3|PronType=Prs",
101
+ "Gender=Fem|Number=Sing|POS=VERB|Tense=Past|VerbForm=Part":"Gender=Fem|Number=Sing|Tense=Past|VerbForm=Part",
102
+ "Gender=Masc|Number=Sing|POS=PRON|PronType=Ind":"Gender=Masc|Number=Sing|PronType=Ind",
103
+ "Gender=Fem|Number=Plur|POS=PRON|PronType=Ind":"Gender=Fem|Number=Plur|PronType=Ind",
104
+ "Mood=Sub|Number=Sing|POS=VERB|Person=3|Tense=Pres|VerbForm=Fin":"Mood=Sub|Number=Sing|Person=3|Tense=Pres|VerbForm=Fin",
105
+ "Number=Plur|POS=PRON|PronType=Rel":"Number=Plur|PronType=Rel",
106
+ "Gender=Masc|Number=Plur|POS=DET|PronType=Int":"Gender=Masc|Number=Plur|PronType=Int",
107
+ "Mood=Ind|Number=Plur|POS=AUX|Person=3|Tense=Imp|VerbForm=Fin":"Mood=Ind|Number=Plur|Person=3|Tense=Imp|VerbForm=Fin",
108
+ "AdvType=Tim|POS=NOUN":"AdvType=Tim",
109
+ "Gender=Masc|Number=Plur|POS=DET|PronType=Ind":"Gender=Masc|Number=Plur|PronType=Ind",
110
+ "Gender=Fem|Number=Plur|POS=DET|PronType=Ind":"Gender=Fem|Number=Plur|PronType=Ind",
111
+ "Gender=Masc|Number=Sing|POS=DET|PronType=Int":"Gender=Masc|Number=Sing|PronType=Int",
112
+ "Mood=Cnd|Number=Sing|POS=AUX|Person=3|VerbForm=Fin":"Mood=Cnd|Number=Sing|Person=3|VerbForm=Fin",
113
+ "Mood=Ind|Number=Sing|POS=VERB|Person=3|Tense=Imp|VerbForm=Fin":"Mood=Ind|Number=Sing|Person=3|Tense=Imp|VerbForm=Fin",
114
+ "Number=Sing|POS=DET|PronType=Art":"Number=Sing|PronType=Art",
115
+ "Gender=Masc|Number=Sing|POS=DET|Person=3|Poss=Yes|PronType=Prs":"Gender=Masc|Number=Sing|Person=3|Poss=Yes|PronType=Prs",
116
+ "Case=Acc|Gender=Masc|Number=Sing|POS=PRON|Person=3|PronType=Prs":"Case=Acc|Gender=Masc|Number=Sing|Person=3|PronType=Prs",
117
+ "Gender=Masc|Number=Sing|POS=PRON|PronType=Int":"Gender=Masc|Number=Sing|PronType=Int",
118
+ "POS=PUNCT|PunctType=Semi":"PunctType=Semi",
119
+ "Mood=Cnd|Number=Plur|POS=AUX|Person=3|VerbForm=Fin":"Mood=Cnd|Number=Plur|Person=3|VerbForm=Fin",
120
+ "Case=Dat|Number=Sing|POS=PRON|Person=3|PronType=Prs":"Case=Dat|Number=Sing|Person=3|PronType=Prs",
121
+ "Gender=Masc|NumType=Card|Number=Plur|POS=NUM":"Gender=Masc|NumType=Card|Number=Plur",
122
+ "Mood=Ind|Number=Sing|POS=AUX|Person=3|Tense=Imp|VerbForm=Fin":"Mood=Ind|Number=Sing|Person=3|Tense=Imp|VerbForm=Fin",
123
+ "Gender=Fem|Number=Sing|POS=PRON|PronType=Ind":"Gender=Fem|Number=Sing|PronType=Ind",
124
+ "Mood=Sub|Number=Sing|POS=AUX|Person=3|Tense=Imp|VerbForm=Fin":"Mood=Sub|Number=Sing|Person=3|Tense=Imp|VerbForm=Fin",
125
+ "NumForm=Digit|POS=SYM":"NumForm=Digit",
126
+ "Gender=Masc|Number=Sing|POS=AUX|Tense=Past|VerbForm=Part":"Gender=Masc|Number=Sing|Tense=Past|VerbForm=Part",
127
+ "Gender=Fem|Number=Sing|POS=PRON|PronType=Int":"Gender=Fem|Number=Sing|PronType=Int",
128
+ "Gender=Fem|Number=Sing|POS=DET|PronType=Int":"Gender=Fem|Number=Sing|PronType=Int",
129
+ "POS=PRON|PronType=Int":"PronType=Int",
130
+ "Gender=Fem|Number=Plur|POS=DET|PronType=Int":"Gender=Fem|Number=Plur|PronType=Int",
131
+ "Mood=Cnd|Number=Sing|POS=VERB|Person=3|VerbForm=Fin":"Mood=Cnd|Number=Sing|Person=3|VerbForm=Fin",
132
+ "Mood=Cnd|Number=Plur|POS=VERB|Person=3|VerbForm=Fin":"Mood=Cnd|Number=Plur|Person=3|VerbForm=Fin",
133
+ "POS=PART":"",
134
+ "Gender=Fem|Number=Sing|POS=PRON|PronType=Dem":"Gender=Fem|Number=Sing|PronType=Dem",
135
+ "Gender=Masc|Number=Sing|POS=DET|PronType=Tot":"Gender=Masc|Number=Sing|PronType=Tot",
136
+ "Gender=Masc|Number=Plur|POS=PRON|PronType=Dem":"Gender=Masc|Number=Plur|PronType=Dem",
137
+ "POS=ADJ":"",
138
+ "Gender=Masc|Number=Plur|POS=PRON|Person=3|PronType=Prs":"Gender=Masc|Number=Plur|Person=3|PronType=Prs",
139
+ "Degree=Cmp|Number=Plur|POS=ADJ":"Degree=Cmp|Number=Plur",
140
+ "POS=PUNCT|PunctType=Dash":"PunctType=Dash",
141
+ "Mood=Sub|Number=Sing|POS=AUX|Person=3|Tense=Pres|VerbForm=Fin":"Mood=Sub|Number=Sing|Person=3|Tense=Pres|VerbForm=Fin",
142
+ "Case=Acc|Gender=Fem|Number=Plur|POS=PRON|Person=3|PronType=Prs":"Case=Acc|Gender=Fem|Number=Plur|Person=3|PronType=Prs",
143
+ "Mood=Sub|Number=Sing|POS=VERB|Person=3|Tense=Imp|VerbForm=Fin":"Mood=Sub|Number=Sing|Person=3|Tense=Imp|VerbForm=Fin",
144
+ "Gender=Fem|Number=Plur|POS=VERB|Tense=Past|VerbForm=Part":"Gender=Fem|Number=Plur|Tense=Past|VerbForm=Part",
145
+ "Gender=Fem|Number=Sing|POS=PRON|Person=3|PronType=Prs":"Gender=Fem|Number=Sing|Person=3|PronType=Prs",
146
+ "Gender=Masc|POS=NOUN":"Gender=Masc",
147
+ "Mood=Ind|Number=Sing|POS=VERB|Person=3|Tense=Past|VerbForm=Fin":"Mood=Ind|Number=Sing|Person=3|Tense=Past|VerbForm=Fin",
148
+ "Gender=Fem|Number=Plur|POS=PRON|PronType=Int":"Gender=Fem|Number=Plur|PronType=Int",
149
+ "Gender=Masc|NumType=Ord|Number=Plur|POS=ADJ":"Gender=Masc|NumType=Ord|Number=Plur",
150
+ "Mood=Ind|Number=Plur|POS=VERB|Person=1|Tense=Fut|VerbForm=Fin":"Mood=Ind|Number=Plur|Person=1|Tense=Fut|VerbForm=Fin",
151
+ "POS=PUNCT|PunctType=Colo":"PunctType=Colo",
152
+ "Gender=Masc|NumType=Card|POS=NUM":"Gender=Masc|NumType=Card",
153
+ "Gender=Masc|Number=Sing|POS=PRON|Person=3|PronType=Prs":"Gender=Masc|Number=Sing|Person=3|PronType=Prs",
154
+ "Number=Sing|POS=PRON|PronType=Int":"Number=Sing|PronType=Int",
155
+ "Mood=Ind|Number=Plur|POS=AUX|Person=1|Tense=Fut|VerbForm=Fin":"Mood=Ind|Number=Plur|Person=1|Tense=Fut|VerbForm=Fin",
156
+ "Mood=Imp|Number=Sing|POS=VERB|Person=3|VerbForm=Fin":"Mood=Imp|Number=Sing|Person=3|VerbForm=Fin",
157
+ "Gender=Fem|Number=Sing|Number[psor]=Plur|POS=DET|Person=1|Poss=Yes|PronType=Prs":"Gender=Fem|Number=Sing|Number[psor]=Plur|Person=1|Poss=Yes|PronType=Prs",
158
+ "Gender=Masc|Number=Sing|Number[psor]=Plur|POS=DET|Person=1|Poss=Yes|PronType=Prs":"Gender=Masc|Number=Sing|Number[psor]=Plur|Person=1|Poss=Yes|PronType=Prs",
159
+ "POS=AUX|VerbForm=Ger":"VerbForm=Ger",
160
+ "Gender=Fem|Number=Plur|POS=PRON|Person=3|PronType=Prs":"Gender=Fem|Number=Plur|Person=3|PronType=Prs",
161
+ "Mood=Imp|Number=Sing|POS=AUX|Person=3|VerbForm=Fin":"Mood=Imp|Number=Sing|Person=3|VerbForm=Fin",
162
+ "Number=Plur|POS=PRON|PronType=Ind":"Number=Plur|PronType=Ind",
163
+ "Gender=Masc|Number=Sing|POS=PRON|PronType=Dem":"Gender=Masc|Number=Sing|PronType=Dem",
164
+ "Case=Acc,Dat|Number=Sing|POS=PRON|Person=2|Polite=Infm|PrepCase=Npr|PronType=Prs":"Case=Acc,Dat|Number=Sing|Person=2|Polite=Infm|PrepCase=Npr|PronType=Prs",
165
+ "Gender=Masc|Number=Plur|POS=PRON|PronType=Int":"Gender=Masc|Number=Plur|PronType=Int",
166
+ "Mood=Ind|Number=Plur|POS=AUX|Person=1|Tense=Pres|VerbForm=Fin":"Mood=Ind|Number=Plur|Person=1|Tense=Pres|VerbForm=Fin",
167
+ "NumForm=Digit|NumType=Frac|POS=NUM":"NumForm=Digit|NumType=Frac",
168
+ "Gender=Fem|Number=Plur|POS=PRON|PronType=Dem":"Gender=Fem|Number=Plur|PronType=Dem",
169
+ "Gender=Fem|POS=NOUN":"Gender=Fem",
170
+ "Case=Acc,Dat|Number=Sing|POS=PRON|Person=1|PrepCase=Npr|PronType=Prs":"Case=Acc,Dat|Number=Sing|Person=1|PrepCase=Npr|PronType=Prs",
171
+ "Mood=Sub|Number=Plur|POS=VERB|Person=2|Tense=Pres|VerbForm=Fin":"Mood=Sub|Number=Plur|Person=2|Tense=Pres|VerbForm=Fin",
172
+ "Mood=Ind|Number=Plur|POS=AUX|Person=2|Tense=Fut|VerbForm=Fin":"Mood=Ind|Number=Plur|Person=2|Tense=Fut|VerbForm=Fin",
173
+ "Mood=Sub|Number=Plur|POS=AUX|Person=1|Tense=Pres|VerbForm=Fin":"Mood=Sub|Number=Plur|Person=1|Tense=Pres|VerbForm=Fin",
174
+ "Mood=Sub|Number=Plur|POS=AUX|Person=3|Tense=Imp|VerbForm=Fin":"Mood=Sub|Number=Plur|Person=3|Tense=Imp|VerbForm=Fin",
175
+ "Number=Plur|POS=PRON|Person=1|PronType=Prs":"Number=Plur|Person=1|PronType=Prs",
176
+ "Mood=Ind|Number=Sing|POS=VERB|Person=1|Tense=Pres|VerbForm=Fin":"Mood=Ind|Number=Sing|Person=1|Tense=Pres|VerbForm=Fin",
177
+ "Case=Nom|Number=Sing|POS=PRON|Person=2|Polite=Infm|PronType=Prs":"Case=Nom|Number=Sing|Person=2|Polite=Infm|PronType=Prs",
178
+ "POS=X":"",
179
+ "Mood=Cnd|Number=Plur|POS=AUX|Person=1|VerbForm=Fin":"Mood=Cnd|Number=Plur|Person=1|VerbForm=Fin",
180
+ "Number=Sing|POS=DET|PronType=Dem":"Number=Sing|PronType=Dem",
181
+ "Mood=Ind|Number=Sing|POS=VERB|Person=1|Tense=Fut|VerbForm=Fin":"Mood=Ind|Number=Sing|Person=1|Tense=Fut|VerbForm=Fin",
182
+ "Mood=Ind|Number=Sing|POS=AUX|Person=1|Tense=Pres|VerbForm=Fin":"Mood=Ind|Number=Sing|Person=1|Tense=Pres|VerbForm=Fin",
183
+ "POS=DET|PronType=Art":"PronType=Art",
184
+ "Gender=Masc|Number=Sing|POS=PRON|Person=3|Poss=Yes|PronType=Prs":"Gender=Masc|Number=Sing|Person=3|Poss=Yes|PronType=Prs",
185
+ "NumType=Ord|Number=Sing|POS=ADJ":"NumType=Ord|Number=Sing",
186
+ "Number=Plur|Number[psor]=Plur|POS=DET|Person=1|Poss=Yes|PronType=Prs":"Number=Plur|Number[psor]=Plur|Person=1|Poss=Yes|PronType=Prs",
187
+ "Number=Plur|POS=PRON|PronType=Dem":"Number=Plur|PronType=Dem",
188
+ "Mood=Imp|Number=Plur|POS=VERB|Person=1|VerbForm=Fin":"Mood=Imp|Number=Plur|Person=1|VerbForm=Fin",
189
+ "POS=PRON|PronType=Ind":"PronType=Ind",
190
+ "POS=SYM":"",
191
+ "Mood=Ind|Number=Sing|POS=VERB|Person=2|Tense=Pres|VerbForm=Fin":"Mood=Ind|Number=Sing|Person=2|Tense=Pres|VerbForm=Fin",
192
+ "Mood=Imp|Number=Plur|POS=VERB|Person=3|VerbForm=Fin":"Mood=Imp|Number=Plur|Person=3|VerbForm=Fin",
193
+ "POS=VERB|VerbForm=Fin":"VerbForm=Fin",
194
+ "Case=Nom|Number=Sing|POS=PRON|Person=1|PronType=Prs":"Case=Nom|Number=Sing|Person=1|PronType=Prs",
195
+ "Case=Acc|Number=Sing|POS=PRON|Person=1|PrepCase=Pre|PronType=Prs":"Case=Acc|Number=Sing|Person=1|PrepCase=Pre|PronType=Prs",
196
+ "Mood=Ind|Number=Sing|POS=AUX|Person=2|Tense=Pres|VerbForm=Fin":"Mood=Ind|Number=Sing|Person=2|Tense=Pres|VerbForm=Fin",
197
+ "NumForm=Digit|NumType=Frac|POS=SYM":"NumForm=Digit|NumType=Frac",
198
+ "NumType=Card|Number=Sing|POS=NUM":"NumType=Card|Number=Sing",
199
+ "POS=PUNCT|PunctSide=Ini|PunctType=Qest":"PunctSide=Ini|PunctType=Qest",
200
+ "POS=PUNCT|PunctSide=Fin|PunctType=Qest":"PunctSide=Fin|PunctType=Qest",
201
+ "NumForm=Digit|NumType=Ord|POS=ADJ":"NumForm=Digit|NumType=Ord",
202
+ "Foreign=Yes|POS=PRON|PronType=Int":"Foreign=Yes|PronType=Int",
203
+ "Foreign=Yes|Mood=Ind|POS=VERB|VerbForm=Fin":"Foreign=Yes|Mood=Ind|VerbForm=Fin",
204
+ "Foreign=Yes|POS=ADP":"Foreign=Yes",
205
+ "Gender=Masc|Number=Sing|POS=PROPN":"Gender=Masc|Number=Sing",
206
+ "Case=Acc|POS=PRON|Person=3|PrepCase=Pre|PronType=Prs|Reflex=Yes":"Case=Acc|Person=3|PrepCase=Pre|PronType=Prs|Reflex=Yes",
207
+ "Mood=Ind|Number=Plur|POS=VERB|Person=2|Tense=Pres|VerbForm=Fin":"Mood=Ind|Number=Plur|Person=2|Tense=Pres|VerbForm=Fin",
208
+ "POS=PUNCT|PunctSide=Ini|PunctType=Excl":"PunctSide=Ini|PunctType=Excl",
209
+ "POS=PUNCT|PunctSide=Fin|PunctType=Excl":"PunctSide=Fin|PunctType=Excl",
210
+ "Gender=Masc|Number=Sing|Number[psor]=Sing|POS=DET|Person=1|Poss=Yes|PronType=Prs":"Gender=Masc|Number=Sing|Number[psor]=Sing|Person=1|Poss=Yes|PronType=Prs",
211
+ "Mood=Cnd|Number=Sing|POS=VERB|Person=1|VerbForm=Fin":"Mood=Cnd|Number=Sing|Person=1|VerbForm=Fin",
212
+ "Mood=Ind|Number=Sing|POS=VERB|Person=1|Tense=Imp|VerbForm=Fin":"Mood=Ind|Number=Sing|Person=1|Tense=Imp|VerbForm=Fin",
213
+ "Gender=Masc|Number=Plur|POS=PRON|Person=3|Poss=Yes|PronType=Prs":"Gender=Masc|Number=Plur|Person=3|Poss=Yes|PronType=Prs",
214
+ "POS=NUM":"",
215
+ "Mood=Imp|Number=Plur|POS=AUX|Person=3|VerbForm=Fin":"Mood=Imp|Number=Plur|Person=3|VerbForm=Fin",
216
+ "Case=Nom|POS=PRON|Person=3|PronType=Prs":"Case=Nom|Person=3|PronType=Prs",
217
+ "Mood=Cnd|Number=Sing|POS=AUX|Person=1|VerbForm=Fin":"Mood=Cnd|Number=Sing|Person=1|VerbForm=Fin",
218
+ "Number=Plur|POS=PRON|Person=2|Polite=Form|PronType=Prs":"Number=Plur|Person=2|Polite=Form|PronType=Prs",
219
+ "Mood=Sub|POS=AUX|Person=1|Tense=Imp|VerbForm=Fin":"Mood=Sub|Person=1|Tense=Imp|VerbForm=Fin",
220
+ "POS=PUNCT|PunctSide=Ini|PunctType=Comm":"PunctSide=Ini|PunctType=Comm",
221
+ "POS=PUNCT|PunctSide=Fin|PunctType=Comm":"PunctSide=Fin|PunctType=Comm",
222
+ "Number=Plur|POS=PRON|Person=2|PronType=Prs":"Number=Plur|Person=2|PronType=Prs",
223
+ "Mood=Ind|Number=Plur|POS=AUX|Person=2|Tense=Pres|VerbForm=Fin":"Mood=Ind|Number=Plur|Person=2|Tense=Pres|VerbForm=Fin",
224
+ "Case=Acc,Dat|Number=Plur|POS=PRON|Person=2|PronType=Prs":"Case=Acc,Dat|Number=Plur|Person=2|PronType=Prs",
225
+ "Mood=Cnd|Number=Plur|POS=VERB|Person=1|VerbForm=Fin":"Mood=Cnd|Number=Plur|Person=1|VerbForm=Fin",
226
+ "Mood=Ind|Number=Plur|POS=AUX|Person=1|Tense=Imp|VerbForm=Fin":"Mood=Ind|Number=Plur|Person=1|Tense=Imp|VerbForm=Fin",
227
+ "Gender=Masc|Number=Plur|Number[psor]=Sing|POS=DET|Person=1|Poss=Yes|PronType=Prs":"Gender=Masc|Number=Plur|Number[psor]=Sing|Person=1|Poss=Yes|PronType=Prs",
228
+ "Mood=Ind|Number=Plur|POS=VERB|Person=1|Tense=Imp|VerbForm=Fin":"Mood=Ind|Number=Plur|Person=1|Tense=Imp|VerbForm=Fin",
229
+ "Mood=Sub|Number=Plur|POS=VERB|Person=1|Tense=Pres|VerbForm=Fin":"Mood=Sub|Number=Plur|Person=1|Tense=Pres|VerbForm=Fin",
230
+ "Definite=Ind|Gender=Masc|Number=Sing|POS=DET|PronType=Art":"Definite=Ind|Gender=Masc|Number=Sing|PronType=Art",
231
+ "Number=Sing|POS=PRON|Person=2|Polite=Form|PronType=Prs":"Number=Sing|Person=2|Polite=Form|PronType=Prs",
232
+ "Gender=Masc|Number=Sing|Number[psor]=Sing|POS=DET|Person=2|Poss=Yes|PronType=Prs":"Gender=Masc|Number=Sing|Number[psor]=Sing|Person=2|Poss=Yes|PronType=Prs",
233
+ "POS=VERB|Tense=Past|VerbForm=Part":"Tense=Past|VerbForm=Part",
234
+ "Mood=Ind|Number=Sing|POS=AUX|Person=3|Tense=Past|VerbForm=Fin":"Mood=Ind|Number=Sing|Person=3|Tense=Past|VerbForm=Fin",
235
+ "Foreign=Yes|POS=NOUN":"Foreign=Yes",
236
+ "Definite=Def|Foreign=Yes|Gender=Masc|Number=Sing|POS=DET|PronType=Art":"Definite=Def|Foreign=Yes|Gender=Masc|Number=Sing|PronType=Art",
237
+ "Foreign=Yes|POS=VERB":"Foreign=Yes",
238
+ "Foreign=Yes|POS=ADJ":"Foreign=Yes",
239
+ "Foreign=Yes|POS=DET":"Foreign=Yes",
240
+ "Foreign=Yes|POS=ADV":"Foreign=Yes",
241
+ "Definite=Ind|Gender=Fem|Number=Plur|POS=DET|PronType=Art":"Definite=Ind|Gender=Fem|Number=Plur|PronType=Art",
242
+ "POS=INTJ":"",
243
+ "Mood=Ind|Number=Sing|POS=AUX|Person=1|Tense=Imp|VerbForm=Fin":"Mood=Ind|Number=Sing|Person=1|Tense=Imp|VerbForm=Fin",
244
+ "Mood=Sub|Number=Sing|POS=VERB|Person=2|Tense=Pres|VerbForm=Fin":"Mood=Sub|Number=Sing|Person=2|Tense=Pres|VerbForm=Fin",
245
+ "Case=Acc|POS=PRON|Person=3|PronType=Prs|Reflex=Yes":"Case=Acc|Person=3|PronType=Prs|Reflex=Yes",
246
+ "AdvType=Tim|POS=SYM":"AdvType=Tim",
247
+ "Gender=Fem|Number=Sing|POS=PRON|Person=3|Poss=Yes|PronType=Prs":"Gender=Fem|Number=Sing|Person=3|Poss=Yes|PronType=Prs",
248
+ "Definite=Ind|Gender=Fem|Number=Sing|POS=DET|PronType=Art":"Definite=Ind|Gender=Fem|Number=Sing|PronType=Art",
249
+ "AdvType=Tim|Degree=Cmp|POS=ADV":"AdvType=Tim|Degree=Cmp",
250
+ "Case=Acc|Number=Sing|POS=PRON|Person=2|Polite=Infm|PrepCase=Pre|PronType=Prs":"Case=Acc|Number=Sing|Person=2|Polite=Infm|PrepCase=Pre|PronType=Prs",
251
+ "Mood=Sub|Number=Plur|POS=VERB|Person=1|Tense=Imp|VerbForm=Fin":"Mood=Sub|Number=Plur|Person=1|Tense=Imp|VerbForm=Fin",
252
+ "Degree=Cmp|POS=ADJ":"Degree=Cmp",
253
+ "POS=DET":"",
254
+ "Gender=Masc|Number=Sing|Number[psor]=Plur|POS=PRON|Person=1|Poss=Yes|PronType=Prs":"Gender=Masc|Number=Sing|Number[psor]=Plur|Person=1|Poss=Yes|PronType=Prs",
255
+ "Number=Plur|Number[psor]=Plur|POS=PRON|Person=1|Poss=Yes|PronType=Prs":"Number=Plur|Number[psor]=Plur|Person=1|Poss=Yes|PronType=Prs",
256
+ "Mood=Ind|Number=Plur|POS=VERB|Person=2|Tense=Fut|VerbForm=Fin":"Mood=Ind|Number=Plur|Person=2|Tense=Fut|VerbForm=Fin",
257
+ "Mood=Sub|Number=Sing|POS=AUX|Person=1|Tense=Pres|VerbForm=Fin":"Mood=Sub|Number=Sing|Person=1|Tense=Pres|VerbForm=Fin",
258
+ "Gender=Masc|POS=SYM":"Gender=Masc",
259
+ "Mood=Ind|Number=Plur|POS=VERB|Person=3|Tense=Past|VerbForm=Fin":"Mood=Ind|Number=Plur|Person=3|Tense=Past|VerbForm=Fin",
260
+ "Mood=Sub|Number=Sing|POS=VERB|Person=1|Tense=Imp|VerbForm=Fin":"Mood=Sub|Number=Sing|Person=1|Tense=Imp|VerbForm=Fin",
261
+ "POS=DET|PronType=Rel":"PronType=Rel",
262
+ "Gender=Fem|NumType=Card|POS=NUM":"Gender=Fem|NumType=Card",
263
+ "Mood=Ind|Number=Plur|POS=AUX|Person=3|Tense=Past|VerbForm=Fin":"Mood=Ind|Number=Plur|Person=3|Tense=Past|VerbForm=Fin",
264
+ "Mood=Sub|Number=Plur|POS=AUX|Person=1|Tense=Imp|VerbForm=Fin":"Mood=Sub|Number=Plur|Person=1|Tense=Imp|VerbForm=Fin",
265
+ "POS=AUX|Tense=Past|VerbForm=Part":"Tense=Past|VerbForm=Part",
266
+ "Foreign=Yes|Mood=Ind|Number=Sing|POS=AUX|Person=3|Tense=Pres|VerbForm=Fin":"Foreign=Yes|Mood=Ind|Number=Sing|Person=3|Tense=Pres|VerbForm=Fin",
267
+ "Foreign=Yes|Gender=Masc|Number=Sing|POS=PRON|Person=3|PronType=Prs":"Foreign=Yes|Gender=Masc|Number=Sing|Person=3|PronType=Prs",
268
+ "Foreign=Yes|POS=SCONJ":"Foreign=Yes",
269
+ "Foreign=Yes|Gender=Fem|Number=Sing|POS=DET|PronType=Art":"Foreign=Yes|Gender=Fem|Number=Sing|PronType=Art",
270
+ "Mood=Ind|Number=Sing|POS=AUX|Person=1|Tense=Fut|VerbForm=Fin":"Mood=Ind|Number=Sing|Person=1|Tense=Fut|VerbForm=Fin",
271
+ "Number=Sing|POS=DET|Person=3|Poss=Yes|PronType=Prs":"Number=Sing|Person=3|Poss=Yes|PronType=Prs",
272
+ "Gender=Fem|Number=Sing|Number[psor]=Sing|POS=DET|Person=2|Poss=Yes|PronType=Prs":"Gender=Fem|Number=Sing|Number[psor]=Sing|Person=2|Poss=Yes|PronType=Prs",
273
+ "Gender=Fem|Number=Sing|Number[psor]=Sing|POS=PRON|Person=3|Poss=Yes|PronType=Prs":"Gender=Fem|Number=Sing|Number[psor]=Sing|Person=3|Poss=Yes|PronType=Prs",
274
+ "Gender=Masc|Number=Plur|Number[psor]=Sing|POS=DET|Person=2|Poss=Yes|PronType=Prs":"Gender=Masc|Number=Plur|Number[psor]=Sing|Person=2|Poss=Yes|PronType=Prs",
275
+ "Definite=Ind|Number=Sing|POS=DET|PronType=Art":"Definite=Ind|Number=Sing|PronType=Art",
276
+ "Gender=Fem|Number=Plur|POS=PRON|Person=3|Poss=Yes|PronType=Prs":"Gender=Fem|Number=Plur|Person=3|Poss=Yes|PronType=Prs",
277
+ "Gender=Fem|Number=Sing|POS=PROPN":"Gender=Fem|Number=Sing",
278
+ "Number=Plur|POS=DET|PronType=Dem":"Number=Plur|PronType=Dem",
279
+ "Gender=Masc|Number=Sing|POS=PRON|PronType=Rel":"Gender=Masc|Number=Sing|PronType=Rel"
280
+ },
281
+ "labels_pos":{
282
+ "Definite=Def|Gender=Masc|Number=Sing|POS=DET|PronType=Art":90,
283
+ "POS=PROPN":96,
284
+ "POS=PUNCT|PunctSide=Ini|PunctType=Brck":97,
285
+ "POS=PUNCT|PunctSide=Fin|PunctType=Brck":97,
286
+ "Mood=Ind|Number=Sing|POS=AUX|Person=3|Tense=Pres|VerbForm=Fin":87,
287
+ "Gender=Masc|Number=Sing|POS=VERB|Tense=Past|VerbForm=Part":100,
288
+ "Definite=Def|Gender=Fem|Number=Sing|POS=DET|PronType=Art":90,
289
+ "Gender=Fem|Number=Sing|POS=NOUN":92,
290
+ "POS=ADP":85,
291
+ "NumType=Card|Number=Plur|POS=NUM":93,
292
+ "Gender=Masc|Number=Plur|POS=NOUN":92,
293
+ "Number=Sing|POS=ADJ":84,
294
+ "POS=CCONJ":89,
295
+ "Gender=Fem|Number=Sing|POS=DET|PronType=Ind":90,
296
+ "NumForm=Digit|NumType=Card|POS=NUM":93,
297
+ "NumForm=Digit|POS=NOUN":92,
298
+ "Gender=Masc|Number=Plur|POS=ADJ":84,
299
+ "POS=PUNCT|PunctType=Comm":97,
300
+ "POS=AUX|VerbForm=Inf":87,
301
+ "Case=Acc,Dat|POS=PRON|Person=3|PrepCase=Npr|PronType=Prs|Reflex=Yes":95,
302
+ "Definite=Def|Gender=Masc|Number=Plur|POS=DET|PronType=Art":90,
303
+ "POS=PRON|PronType=Rel":95,
304
+ "Mood=Ind|Number=Plur|POS=VERB|Person=3|Tense=Imp|VerbForm=Fin":100,
305
+ "Gender=Fem|Number=Sing|POS=DET|PronType=Art":90,
306
+ "Gender=Fem|Number=Sing|POS=DET|Person=3|Poss=Yes|PronType=Prs":90,
307
+ "Definite=Def|Gender=Fem|Number=Plur|POS=DET|PronType=Art":90,
308
+ "Gender=Fem|Number=Plur|POS=NOUN":92,
309
+ "Gender=Fem|Number=Plur|POS=ADJ":84,
310
+ "POS=VERB|VerbForm=Inf":100,
311
+ "Case=Acc,Dat|Number=Plur|POS=PRON|Person=3|PronType=Prs":95,
312
+ "Number=Plur|POS=ADJ":84,
313
+ "POS=PUNCT|PunctType=Peri":97,
314
+ "Number=Sing|POS=PRON|PronType=Rel":95,
315
+ "Gender=Masc|Number=Sing|POS=NOUN":92,
316
+ "Mood=Imp|Number=Sing|POS=VERB|Person=2|VerbForm=Fin":100,
317
+ "Gender=Masc|Number=Plur|POS=ADJ|VerbForm=Part":84,
318
+ "POS=SCONJ":98,
319
+ "Mood=Ind|Number=Plur|POS=AUX|Person=3|Tense=Pres|VerbForm=Fin":87,
320
+ "Gender=Masc|Number=Plur|POS=VERB|Tense=Past|VerbForm=Part":100,
321
+ "Definite=Def|Number=Sing|POS=DET|PronType=Art":90,
322
+ "Gender=Masc|Number=Sing|POS=DET|PronType=Ind":90,
323
+ "Gender=Fem|Number=Plur|POS=ADJ|VerbForm=Part":84,
324
+ "Gender=Masc|Number=Sing|POS=DET|PronType=Dem":90,
325
+ "POS=VERB|VerbForm=Ger":100,
326
+ "POS=NOUN":92,
327
+ "Gender=Fem|NumType=Card|Number=Sing|POS=NUM":93,
328
+ "Gender=Fem|Number=Sing|POS=ADJ|VerbForm=Part":84,
329
+ "Gender=Fem|NumType=Ord|Number=Plur|POS=ADJ":84,
330
+ "POS=PUNCT|PunctType=Quot":97,
331
+ "Gender=Masc|Number=Sing|POS=ADJ":84,
332
+ "Gender=Masc|Number=Sing|POS=ADJ|VerbForm=Part":84,
333
+ "Mood=Ind|Number=Sing|POS=VERB|Person=3|Tense=Pres|VerbForm=Fin":100,
334
+ "Gender=Fem|Number=Sing|POS=DET|PronType=Dem":90,
335
+ "POS=ADV|Polarity=Neg":86,
336
+ "POS=ADV":86,
337
+ "Number=Sing|POS=PRON|PronType=Dem":95,
338
+ "Number=Sing|POS=NOUN":92,
339
+ "Mood=Ind|Number=Plur|POS=VERB|Person=3|Tense=Pres|VerbForm=Fin":100,
340
+ "Number=Plur|POS=NOUN":92,
341
+ "Mood=Sub|Number=Plur|POS=VERB|Person=3|Tense=Imp|VerbForm=Fin":100,
342
+ "Gender=Fem|Number=Sing|POS=ADJ":84,
343
+ "Mood=Sub|Number=Sing|POS=VERB|Person=1|Tense=Pres|VerbForm=Fin":100,
344
+ "Gender=Masc|Number=Sing|POS=PRON|PronType=Tot":95,
345
+ "Case=Loc|POS=PRON|Person=3|PronType=Prs":95,
346
+ "Gender=Fem|NumType=Ord|Number=Sing|POS=ADJ":84,
347
+ "Degree=Cmp|POS=ADV":86,
348
+ "Gender=Fem|Number=Plur|POS=DET|PronType=Art":90,
349
+ "Gender=Fem|Number=Plur|POS=DET|Person=3|Poss=Yes|PronType=Prs":90,
350
+ "Mood=Ind|Number=Sing|POS=VERB|Person=3|Tense=Fut|VerbForm=Fin":100,
351
+ "Gender=Masc|NumType=Ord|Number=Sing|POS=ADJ":84,
352
+ "Mood=Ind|Number=Sing|POS=AUX|Person=3|Tense=Fut|VerbForm=Fin":87,
353
+ "NumType=Card|POS=NUM":93,
354
+ "Mood=Ind|Number=Plur|POS=VERB|Person=3|Tense=Fut|VerbForm=Fin":100,
355
+ "Number=Sing|POS=PRON|PronType=Ind":95,
356
+ "Gender=Masc|Number=Sing|POS=DET|PronType=Art":90,
357
+ "Number=Plur|POS=DET|PronType=Ind":90,
358
+ "Mood=Sub|Number=Plur|POS=VERB|Person=3|Tense=Pres|VerbForm=Fin":100,
359
+ "Gender=Masc|Number=Plur|POS=DET|PronType=Dem":90,
360
+ "Mood=Ind|Number=Plur|POS=AUX|Person=3|Tense=Fut|VerbForm=Fin":87,
361
+ "Gender=Masc|NumType=Card|Number=Sing|POS=NUM":93,
362
+ "Mood=Sub|Number=Plur|POS=AUX|Person=3|Tense=Pres|VerbForm=Fin":87,
363
+ "Case=Acc|Gender=Fem|Number=Sing|POS=PRON|Person=3|PronType=Prs":95,
364
+ "Number=Sing|POS=DET|PronType=Ind":90,
365
+ "POS=PUNCT":97,
366
+ "Number=Sing|POS=DET|PronType=Rel":90,
367
+ "Case=Gen|POS=PRON|Person=3|PronType=Prs":95,
368
+ "Gender=Fem|NumType=Card|Number=Plur|POS=NUM":93,
369
+ "Mood=Ind|Number=Plur|POS=VERB|Person=1|Tense=Pres|VerbForm=Fin":100,
370
+ "POS=DET|PronType=Ind":90,
371
+ "Case=Acc|Gender=Neut|Number=Sing|POS=PRON|Person=3|PronType=Prs":95,
372
+ "Case=Acc,Dat|Number=Plur|POS=PRON|Person=1|PronType=Prs":95,
373
+ "Degree=Cmp|Number=Sing|POS=ADJ":84,
374
+ "Gender=Masc|Number=Plur|POS=PRON|PronType=Ind":95,
375
+ "Gender=Fem|Number=Plur|POS=DET|PronType=Dem":90,
376
+ "Gender=Masc|Number=Plur|POS=DET|PronType=Art":90,
377
+ "Gender=Masc|Number=Plur|POS=DET|Person=3|Poss=Yes|PronType=Prs":90,
378
+ "Case=Acc|Gender=Fem,Masc|Number=Sing|POS=PRON|Person=3|PronType=Prs":95,
379
+ "Gender=Fem|Number=Sing|POS=VERB|Tense=Past|VerbForm=Part":100,
380
+ "Gender=Masc|Number=Sing|POS=PRON|PronType=Ind":95,
381
+ "Gender=Fem|Number=Plur|POS=PRON|PronType=Ind":95,
382
+ "Mood=Sub|Number=Sing|POS=VERB|Person=3|Tense=Pres|VerbForm=Fin":100,
383
+ "Number=Plur|POS=PRON|PronType=Rel":95,
384
+ "Gender=Masc|Number=Plur|POS=DET|PronType=Int":90,
385
+ "Mood=Ind|Number=Plur|POS=AUX|Person=3|Tense=Imp|VerbForm=Fin":87,
386
+ "AdvType=Tim|POS=NOUN":92,
387
+ "Gender=Masc|Number=Plur|POS=DET|PronType=Ind":90,
388
+ "Gender=Fem|Number=Plur|POS=DET|PronType=Ind":90,
389
+ "Gender=Masc|Number=Sing|POS=DET|PronType=Int":90,
390
+ "Mood=Cnd|Number=Sing|POS=AUX|Person=3|VerbForm=Fin":87,
391
+ "Mood=Ind|Number=Sing|POS=VERB|Person=3|Tense=Imp|VerbForm=Fin":100,
392
+ "Number=Sing|POS=DET|PronType=Art":90,
393
+ "Gender=Masc|Number=Sing|POS=DET|Person=3|Poss=Yes|PronType=Prs":90,
394
+ "Case=Acc|Gender=Masc|Number=Sing|POS=PRON|Person=3|PronType=Prs":95,
395
+ "Gender=Masc|Number=Sing|POS=PRON|PronType=Int":95,
396
+ "POS=PUNCT|PunctType=Semi":97,
397
+ "Mood=Cnd|Number=Plur|POS=AUX|Person=3|VerbForm=Fin":87,
398
+ "Case=Dat|Number=Sing|POS=PRON|Person=3|PronType=Prs":95,
399
+ "Gender=Masc|NumType=Card|Number=Plur|POS=NUM":93,
400
+ "Mood=Ind|Number=Sing|POS=AUX|Person=3|Tense=Imp|VerbForm=Fin":87,
401
+ "Gender=Fem|Number=Sing|POS=PRON|PronType=Ind":95,
402
+ "Mood=Sub|Number=Sing|POS=AUX|Person=3|Tense=Imp|VerbForm=Fin":87,
403
+ "NumForm=Digit|POS=SYM":99,
404
+ "Gender=Masc|Number=Sing|POS=AUX|Tense=Past|VerbForm=Part":87,
405
+ "Gender=Fem|Number=Sing|POS=PRON|PronType=Int":95,
406
+ "Gender=Fem|Number=Sing|POS=DET|PronType=Int":90,
407
+ "POS=PRON|PronType=Int":95,
408
+ "Gender=Fem|Number=Plur|POS=DET|PronType=Int":90,
409
+ "Mood=Cnd|Number=Sing|POS=VERB|Person=3|VerbForm=Fin":100,
410
+ "Mood=Cnd|Number=Plur|POS=VERB|Person=3|VerbForm=Fin":100,
411
+ "POS=PART":94,
412
+ "Gender=Fem|Number=Sing|POS=PRON|PronType=Dem":95,
413
+ "Gender=Masc|Number=Sing|POS=DET|PronType=Tot":90,
414
+ "Gender=Masc|Number=Plur|POS=PRON|PronType=Dem":95,
415
+ "POS=ADJ":84,
416
+ "Gender=Masc|Number=Plur|POS=PRON|Person=3|PronType=Prs":95,
417
+ "Degree=Cmp|Number=Plur|POS=ADJ":84,
418
+ "POS=PUNCT|PunctType=Dash":97,
419
+ "Mood=Sub|Number=Sing|POS=AUX|Person=3|Tense=Pres|VerbForm=Fin":87,
420
+ "Case=Acc|Gender=Fem|Number=Plur|POS=PRON|Person=3|PronType=Prs":95,
421
+ "Mood=Sub|Number=Sing|POS=VERB|Person=3|Tense=Imp|VerbForm=Fin":100,
422
+ "Gender=Fem|Number=Plur|POS=VERB|Tense=Past|VerbForm=Part":100,
423
+ "Gender=Fem|Number=Sing|POS=PRON|Person=3|PronType=Prs":95,
424
+ "Gender=Masc|POS=NOUN":92,
425
+ "Mood=Ind|Number=Sing|POS=VERB|Person=3|Tense=Past|VerbForm=Fin":100,
426
+ "Gender=Fem|Number=Plur|POS=PRON|PronType=Int":95,
427
+ "Gender=Masc|NumType=Ord|Number=Plur|POS=ADJ":84,
428
+ "Mood=Ind|Number=Plur|POS=VERB|Person=1|Tense=Fut|VerbForm=Fin":100,
429
+ "POS=PUNCT|PunctType=Colo":97,
430
+ "Gender=Masc|NumType=Card|POS=NUM":93,
431
+ "Gender=Masc|Number=Sing|POS=PRON|Person=3|PronType=Prs":95,
432
+ "Number=Sing|POS=PRON|PronType=Int":95,
433
+ "Mood=Ind|Number=Plur|POS=AUX|Person=1|Tense=Fut|VerbForm=Fin":87,
434
+ "Mood=Imp|Number=Sing|POS=VERB|Person=3|VerbForm=Fin":100,
435
+ "Gender=Fem|Number=Sing|Number[psor]=Plur|POS=DET|Person=1|Poss=Yes|PronType=Prs":90,
436
+ "Gender=Masc|Number=Sing|Number[psor]=Plur|POS=DET|Person=1|Poss=Yes|PronType=Prs":90,
437
+ "POS=AUX|VerbForm=Ger":87,
438
+ "Gender=Fem|Number=Plur|POS=PRON|Person=3|PronType=Prs":95,
439
+ "Mood=Imp|Number=Sing|POS=AUX|Person=3|VerbForm=Fin":87,
440
+ "Number=Plur|POS=PRON|PronType=Ind":95,
441
+ "Gender=Masc|Number=Sing|POS=PRON|PronType=Dem":95,
442
+ "Case=Acc,Dat|Number=Sing|POS=PRON|Person=2|Polite=Infm|PrepCase=Npr|PronType=Prs":95,
443
+ "Gender=Masc|Number=Plur|POS=PRON|PronType=Int":95,
444
+ "Mood=Ind|Number=Plur|POS=AUX|Person=1|Tense=Pres|VerbForm=Fin":87,
445
+ "NumForm=Digit|NumType=Frac|POS=NUM":93,
446
+ "Gender=Fem|Number=Plur|POS=PRON|PronType=Dem":95,
447
+ "Gender=Fem|POS=NOUN":92,
448
+ "Case=Acc,Dat|Number=Sing|POS=PRON|Person=1|PrepCase=Npr|PronType=Prs":95,
449
+ "Mood=Sub|Number=Plur|POS=VERB|Person=2|Tense=Pres|VerbForm=Fin":100,
450
+ "Mood=Ind|Number=Plur|POS=AUX|Person=2|Tense=Fut|VerbForm=Fin":87,
451
+ "Mood=Sub|Number=Plur|POS=AUX|Person=1|Tense=Pres|VerbForm=Fin":87,
452
+ "Mood=Sub|Number=Plur|POS=AUX|Person=3|Tense=Imp|VerbForm=Fin":87,
453
+ "Number=Plur|POS=PRON|Person=1|PronType=Prs":95,
454
+ "Mood=Ind|Number=Sing|POS=VERB|Person=1|Tense=Pres|VerbForm=Fin":100,
455
+ "Case=Nom|Number=Sing|POS=PRON|Person=2|Polite=Infm|PronType=Prs":95,
456
+ "POS=X":101,
457
+ "Mood=Cnd|Number=Plur|POS=AUX|Person=1|VerbForm=Fin":87,
458
+ "Number=Sing|POS=DET|PronType=Dem":90,
459
+ "Mood=Ind|Number=Sing|POS=VERB|Person=1|Tense=Fut|VerbForm=Fin":100,
460
+ "Mood=Ind|Number=Sing|POS=AUX|Person=1|Tense=Pres|VerbForm=Fin":87,
461
+ "POS=DET|PronType=Art":90,
462
+ "Gender=Masc|Number=Sing|POS=PRON|Person=3|Poss=Yes|PronType=Prs":95,
463
+ "NumType=Ord|Number=Sing|POS=ADJ":84,
464
+ "Number=Plur|Number[psor]=Plur|POS=DET|Person=1|Poss=Yes|PronType=Prs":90,
465
+ "Number=Plur|POS=PRON|PronType=Dem":95,
466
+ "Mood=Imp|Number=Plur|POS=VERB|Person=1|VerbForm=Fin":100,
467
+ "POS=PRON|PronType=Ind":95,
468
+ "POS=SYM":99,
469
+ "Mood=Ind|Number=Sing|POS=VERB|Person=2|Tense=Pres|VerbForm=Fin":100,
470
+ "Mood=Imp|Number=Plur|POS=VERB|Person=3|VerbForm=Fin":100,
471
+ "POS=VERB|VerbForm=Fin":100,
472
+ "Case=Nom|Number=Sing|POS=PRON|Person=1|PronType=Prs":95,
473
+ "Case=Acc|Number=Sing|POS=PRON|Person=1|PrepCase=Pre|PronType=Prs":95,
474
+ "Mood=Ind|Number=Sing|POS=AUX|Person=2|Tense=Pres|VerbForm=Fin":87,
475
+ "NumForm=Digit|NumType=Frac|POS=SYM":99,
476
+ "NumType=Card|Number=Sing|POS=NUM":93,
477
+ "POS=PUNCT|PunctSide=Ini|PunctType=Qest":97,
478
+ "POS=PUNCT|PunctSide=Fin|PunctType=Qest":97,
479
+ "NumForm=Digit|NumType=Ord|POS=ADJ":84,
480
+ "Foreign=Yes|POS=PRON|PronType=Int":95,
481
+ "Foreign=Yes|Mood=Ind|POS=VERB|VerbForm=Fin":100,
482
+ "Foreign=Yes|POS=ADP":85,
483
+ "Gender=Masc|Number=Sing|POS=PROPN":96,
484
+ "Case=Acc|POS=PRON|Person=3|PrepCase=Pre|PronType=Prs|Reflex=Yes":95,
485
+ "Mood=Ind|Number=Plur|POS=VERB|Person=2|Tense=Pres|VerbForm=Fin":100,
486
+ "POS=PUNCT|PunctSide=Ini|PunctType=Excl":97,
487
+ "POS=PUNCT|PunctSide=Fin|PunctType=Excl":97,
488
+ "Gender=Masc|Number=Sing|Number[psor]=Sing|POS=DET|Person=1|Poss=Yes|PronType=Prs":90,
489
+ "Mood=Cnd|Number=Sing|POS=VERB|Person=1|VerbForm=Fin":100,
490
+ "Mood=Ind|Number=Sing|POS=VERB|Person=1|Tense=Imp|VerbForm=Fin":100,
491
+ "Gender=Masc|Number=Plur|POS=PRON|Person=3|Poss=Yes|PronType=Prs":95,
492
+ "POS=NUM":93,
493
+ "Mood=Imp|Number=Plur|POS=AUX|Person=3|VerbForm=Fin":87,
494
+ "Case=Nom|POS=PRON|Person=3|PronType=Prs":95,
495
+ "Mood=Cnd|Number=Sing|POS=AUX|Person=1|VerbForm=Fin":87,
496
+ "Number=Plur|POS=PRON|Person=2|Polite=Form|PronType=Prs":95,
497
+ "Mood=Sub|POS=AUX|Person=1|Tense=Imp|VerbForm=Fin":87,
498
+ "POS=PUNCT|PunctSide=Ini|PunctType=Comm":97,
499
+ "POS=PUNCT|PunctSide=Fin|PunctType=Comm":97,
500
+ "Number=Plur|POS=PRON|Person=2|PronType=Prs":95,
501
+ "Mood=Ind|Number=Plur|POS=AUX|Person=2|Tense=Pres|VerbForm=Fin":87,
502
+ "Case=Acc,Dat|Number=Plur|POS=PRON|Person=2|PronType=Prs":95,
503
+ "Mood=Cnd|Number=Plur|POS=VERB|Person=1|VerbForm=Fin":100,
504
+ "Mood=Ind|Number=Plur|POS=AUX|Person=1|Tense=Imp|VerbForm=Fin":87,
505
+ "Gender=Masc|Number=Plur|Number[psor]=Sing|POS=DET|Person=1|Poss=Yes|PronType=Prs":90,
506
+ "Mood=Ind|Number=Plur|POS=VERB|Person=1|Tense=Imp|VerbForm=Fin":100,
507
+ "Mood=Sub|Number=Plur|POS=VERB|Person=1|Tense=Pres|VerbForm=Fin":100,
508
+ "Definite=Ind|Gender=Masc|Number=Sing|POS=DET|PronType=Art":90,
509
+ "Number=Sing|POS=PRON|Person=2|Polite=Form|PronType=Prs":95,
510
+ "Gender=Masc|Number=Sing|Number[psor]=Sing|POS=DET|Person=2|Poss=Yes|PronType=Prs":90,
511
+ "POS=VERB|Tense=Past|VerbForm=Part":100,
512
+ "Mood=Ind|Number=Sing|POS=AUX|Person=3|Tense=Past|VerbForm=Fin":87,
513
+ "Foreign=Yes|POS=NOUN":92,
514
+ "Definite=Def|Foreign=Yes|Gender=Masc|Number=Sing|POS=DET|PronType=Art":90,
515
+ "Foreign=Yes|POS=VERB":100,
516
+ "Foreign=Yes|POS=ADJ":84,
517
+ "Foreign=Yes|POS=DET":90,
518
+ "Foreign=Yes|POS=ADV":86,
519
+ "Definite=Ind|Gender=Fem|Number=Plur|POS=DET|PronType=Art":90,
520
+ "POS=INTJ":91,
521
+ "Mood=Ind|Number=Sing|POS=AUX|Person=1|Tense=Imp|VerbForm=Fin":87,
522
+ "Mood=Sub|Number=Sing|POS=VERB|Person=2|Tense=Pres|VerbForm=Fin":100,
523
+ "Case=Acc|POS=PRON|Person=3|PronType=Prs|Reflex=Yes":95,
524
+ "AdvType=Tim|POS=SYM":99,
525
+ "Gender=Fem|Number=Sing|POS=PRON|Person=3|Poss=Yes|PronType=Prs":95,
526
+ "Definite=Ind|Gender=Fem|Number=Sing|POS=DET|PronType=Art":90,
527
+ "AdvType=Tim|Degree=Cmp|POS=ADV":86,
528
+ "Case=Acc|Number=Sing|POS=PRON|Person=2|Polite=Infm|PrepCase=Pre|PronType=Prs":95,
529
+ "Mood=Sub|Number=Plur|POS=VERB|Person=1|Tense=Imp|VerbForm=Fin":100,
530
+ "Degree=Cmp|POS=ADJ":84,
531
+ "POS=DET":90,
532
+ "Gender=Masc|Number=Sing|Number[psor]=Plur|POS=PRON|Person=1|Poss=Yes|PronType=Prs":95,
533
+ "Number=Plur|Number[psor]=Plur|POS=PRON|Person=1|Poss=Yes|PronType=Prs":95,
534
+ "Mood=Ind|Number=Plur|POS=VERB|Person=2|Tense=Fut|VerbForm=Fin":100,
535
+ "Mood=Sub|Number=Sing|POS=AUX|Person=1|Tense=Pres|VerbForm=Fin":87,
536
+ "Gender=Masc|POS=SYM":99,
537
+ "Mood=Ind|Number=Plur|POS=VERB|Person=3|Tense=Past|VerbForm=Fin":100,
538
+ "Mood=Sub|Number=Sing|POS=VERB|Person=1|Tense=Imp|VerbForm=Fin":100,
539
+ "POS=DET|PronType=Rel":90,
540
+ "Gender=Fem|NumType=Card|POS=NUM":93,
541
+ "Mood=Ind|Number=Plur|POS=AUX|Person=3|Tense=Past|VerbForm=Fin":87,
542
+ "Mood=Sub|Number=Plur|POS=AUX|Person=1|Tense=Imp|VerbForm=Fin":87,
543
+ "POS=AUX|Tense=Past|VerbForm=Part":87,
544
+ "Foreign=Yes|Mood=Ind|Number=Sing|POS=AUX|Person=3|Tense=Pres|VerbForm=Fin":87,
545
+ "Foreign=Yes|Gender=Masc|Number=Sing|POS=PRON|Person=3|PronType=Prs":95,
546
+ "Foreign=Yes|POS=SCONJ":98,
547
+ "Foreign=Yes|Gender=Fem|Number=Sing|POS=DET|PronType=Art":90,
548
+ "Mood=Ind|Number=Sing|POS=AUX|Person=1|Tense=Fut|VerbForm=Fin":87,
549
+ "Number=Sing|POS=DET|Person=3|Poss=Yes|PronType=Prs":90,
550
+ "Gender=Fem|Number=Sing|Number[psor]=Sing|POS=DET|Person=2|Poss=Yes|PronType=Prs":90,
551
+ "Gender=Fem|Number=Sing|Number[psor]=Sing|POS=PRON|Person=3|Poss=Yes|PronType=Prs":95,
552
+ "Gender=Masc|Number=Plur|Number[psor]=Sing|POS=DET|Person=2|Poss=Yes|PronType=Prs":90,
553
+ "Definite=Ind|Number=Sing|POS=DET|PronType=Art":90,
554
+ "Gender=Fem|Number=Plur|POS=PRON|Person=3|Poss=Yes|PronType=Prs":95,
555
+ "Gender=Fem|Number=Sing|POS=PROPN":96,
556
+ "Number=Plur|POS=DET|PronType=Dem":90,
557
+ "Gender=Masc|Number=Sing|POS=PRON|PronType=Rel":95
558
+ },
559
+ "overwrite":true
560
+ }
morphologizer/model ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c60ef13dd03a412f3c6613a062f2e5ed611196a9fffa6f52cbf9f975d923acea
3
+ size 1132253
ner/cfg ADDED
@@ -0,0 +1,13 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "moves":null,
3
+ "update_with_oracle_cut_size":100,
4
+ "multitasks":[
5
+
6
+ ],
7
+ "min_action_freq":1,
8
+ "learn_tokens":false,
9
+ "beam_width":1,
10
+ "beam_density":0.0,
11
+ "beam_update_prob":0.0,
12
+ "incorrect_spans_key":null
13
+ }
ner/model ADDED
Binary file (291 kB). View file
ner/moves ADDED
@@ -0,0 +1 @@
 
1
+ ��moves��{"0":{},"1":{"ORG":15556,"PER":10543,"LOC":9567,"MISC":7347},"2":{"ORG":15556,"PER":10543,"LOC":9567,"MISC":7347},"3":{"ORG":15556,"PER":10543,"LOC":9567,"MISC":7347},"4":{"ORG":15556,"PER":10543,"LOC":9567,"MISC":7347,"":1},"5":{"":1}}�cfg��neg_key�
parser/cfg ADDED
@@ -0,0 +1,13 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "moves":null,
3
+ "update_with_oracle_cut_size":100,
4
+ "multitasks":[
5
+
6
+ ],
7
+ "min_action_freq":30,
8
+ "learn_tokens":false,
9
+ "beam_width":1,
10
+ "beam_density":0.0,
11
+ "beam_update_prob":0.0,
12
+ "incorrect_spans_key":null
13
+ }
parser/model ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:56054528ac95d4a9dc740ce78c06c11baecab53f74076b23038b230694b429b8
3
+ size 1281839
parser/moves ADDED
@@ -0,0 +1 @@
 
1
+ ��moves�<{"0":{"":237803},"1":{"":178217},"2":{"det":66991,"case":59921,"punct":19433,"nsubj":17895,"aux":12982,"mark":11915,"cc":11480,"obj":8456,"advmod":8167,"obl":5001,"amod":4265,"cop":3586,"nummod":3527,"nmod":930,"advcl":803,"iobj":575,"ccomp":402,"expl:pass":390,"fixed||case":274,"csubj":203,"parataxis":202,"xcomp":201,"dep":0},"3":{"nmod":30887,"punct":25535,"obj":20526,"amod":15343,"flat":13631,"conj":12915,"obl":11983,"acl":7493,"fixed":7386,"appos":5875,"advcl":4544,"advmod":3902,"nsubj":3670,"ccomp":3086,"xcomp":2847,"compound":2627,"case":1121,"det":970,"nummod":936,"csubj":656,"iobj":629,"parataxis":229,"flat||det":190,"mark":172,"aux":170,"cop":145,"obj||xcomp":95,"appos||det":78,"conj||xcomp":61,"dep":57,"advcl||xcomp":53,"fixed||case":43,"obl||xcomp":39,"mark||xcomp":32,"xcomp||xcomp":30},"4":{"ROOT":13123}}�cfg��neg_key�
tagger/cfg ADDED
@@ -0,0 +1,297 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "labels":[
3
+ "ADJ",
4
+ "ADP",
5
+ "ADV",
6
+ "AUX",
7
+ "CCONJ",
8
+ "DET",
9
+ "INTJ",
10
+ "NOUN",
11
+ "NUM",
12
+ "PART",
13
+ "PRON",
14
+ "PROPN",
15
+ "PUNCT",
16
+ "SCONJ",
17
+ "SYM",
18
+ "VERB",
19
+ "ao0cs0",
20
+ "ao0fp0",
21
+ "ao0fs0",
22
+ "ao0mp0",
23
+ "ao0ms0",
24
+ "aq0cn0",
25
+ "aq0cp0",
26
+ "aq0cp00",
27
+ "aq0cs0",
28
+ "aq0fp0",
29
+ "aq0fpp",
30
+ "aq0fs0",
31
+ "aq0fsp",
32
+ "aq0mp0",
33
+ "aq0mpp",
34
+ "aq0ms0",
35
+ "aq0msp",
36
+ "cc",
37
+ "cs",
38
+ "da0cs0",
39
+ "da0fp0",
40
+ "da0fs0",
41
+ "da0mp0",
42
+ "da0ms0",
43
+ "dd0cp0",
44
+ "dd0cs0",
45
+ "dd0fp0",
46
+ "dd0fs0",
47
+ "dd0mp0",
48
+ "dd0ms0",
49
+ "de0cn0",
50
+ "di0cn0",
51
+ "di0cp0",
52
+ "di0cs0",
53
+ "di0fp0",
54
+ "di0fs0",
55
+ "di0mp0",
56
+ "di0ms0",
57
+ "dn0cp0",
58
+ "dn0cs0",
59
+ "dn0fp0",
60
+ "dn0fs0",
61
+ "dn0mp0",
62
+ "dn0ms0",
63
+ "dp1cpp",
64
+ "dp1fpp",
65
+ "dp1fps",
66
+ "dp1fsp",
67
+ "dp1fss",
68
+ "dp1mpp",
69
+ "dp1mps",
70
+ "dp1msp",
71
+ "dp1mss",
72
+ "dp2fss",
73
+ "dp2mps",
74
+ "dp2mss",
75
+ "dp3fp0",
76
+ "dp3fs0",
77
+ "dp3mp0",
78
+ "dp3ms0",
79
+ "dr0cs0",
80
+ "dt0fp0",
81
+ "dt0fs0",
82
+ "dt0mp0",
83
+ "dt0ms0",
84
+ "faa",
85
+ "fat",
86
+ "fc",
87
+ "fca",
88
+ "fct",
89
+ "fd",
90
+ "fe",
91
+ "fg",
92
+ "fh",
93
+ "fia",
94
+ "fit",
95
+ "fp",
96
+ "fpa",
97
+ "fpt",
98
+ "fs",
99
+ "fx",
100
+ "fz",
101
+ "nc00000",
102
+ "nccn000",
103
+ "nccp000",
104
+ "nccs000",
105
+ "ncfn000",
106
+ "ncfp000",
107
+ "ncfs000",
108
+ "ncmn000",
109
+ "ncmp000",
110
+ "ncms000",
111
+ "np00000",
112
+ "np0000a",
113
+ "np0000d",
114
+ "np0000l",
115
+ "np0000o",
116
+ "np0000p",
117
+ "p0000000",
118
+ "p010p000",
119
+ "p010s000",
120
+ "p020p000",
121
+ "p020s000",
122
+ "p0300000",
123
+ "pd0cp000",
124
+ "pd0cs000",
125
+ "pd0fp000",
126
+ "pd0fs000",
127
+ "pd0mp000",
128
+ "pd0ms000",
129
+ "pd0ns000",
130
+ "pi0cn000",
131
+ "pi0cp000",
132
+ "pi0cs000",
133
+ "pi0fp000",
134
+ "pi0fs000",
135
+ "pi0mp0",
136
+ "pi0mp000",
137
+ "pi0ms000",
138
+ "pn0cp000",
139
+ "pn0cs000",
140
+ "pn0fp000",
141
+ "pn0fs000",
142
+ "pn0mp000",
143
+ "pn0ms000",
144
+ "pp1cp000",
145
+ "pp1cs000",
146
+ "pp1csn00",
147
+ "pp1cso00",
148
+ "pp2cp000",
149
+ "pp2cp00p",
150
+ "pp2cs000",
151
+ "pp2cs00p",
152
+ "pp3cn000",
153
+ "pp3cno00",
154
+ "pp3cp000",
155
+ "pp3csa00",
156
+ "pp3csd00",
157
+ "pp3fp000",
158
+ "pp3fpa00",
159
+ "pp3fs000",
160
+ "pp3fsa00",
161
+ "pp3mp000",
162
+ "pp3mpa00",
163
+ "pp3ms000",
164
+ "pp3msa00",
165
+ "pp3nn000",
166
+ "pr000000",
167
+ "pr0cn000",
168
+ "pr0cp000",
169
+ "pr0cs0",
170
+ "pr0cs000",
171
+ "pr0ms000",
172
+ "pt000000",
173
+ "pt0cs000",
174
+ "pt0fp000",
175
+ "pt0fs000",
176
+ "pt0mp000",
177
+ "pt0ms000",
178
+ "px1fp0p0",
179
+ "px1fs0p0",
180
+ "px1ms0p0",
181
+ "px3cp0p0",
182
+ "px3cs0p0",
183
+ "px3fp0s0",
184
+ "px3fs000",
185
+ "px3fs0s0",
186
+ "px3mp000",
187
+ "px3ms000",
188
+ "rg",
189
+ "rn",
190
+ "spcmp",
191
+ "spcms",
192
+ "sps00",
193
+ "vag0000",
194
+ "vaic1p0",
195
+ "vaic3p0",
196
+ "vaic3s0",
197
+ "vaif1p0",
198
+ "vaif1s0",
199
+ "vaif2p0",
200
+ "vaif3p0",
201
+ "vaif3s0",
202
+ "vaii1p0",
203
+ "vaii1s0",
204
+ "vaii3p0",
205
+ "vaii3s0",
206
+ "vaip1p0",
207
+ "vaip1s0",
208
+ "vaip2p0",
209
+ "vaip2s0",
210
+ "vaip3p0",
211
+ "vaip3s0",
212
+ "van0000",
213
+ "vap00sm",
214
+ "vasi100",
215
+ "vasi1p0",
216
+ "vasi3p0",
217
+ "vasi3s0",
218
+ "vasp1p0",
219
+ "vasp3p0",
220
+ "vasp3s0",
221
+ "vm00000",
222
+ "vmg0000",
223
+ "vmic1p0",
224
+ "vmic1s0",
225
+ "vmic3p0",
226
+ "vmic3s0",
227
+ "vmif1p0",
228
+ "vmif1s0",
229
+ "vmif2p0",
230
+ "vmif3p0",
231
+ "vmif3s0",
232
+ "vmii1p0",
233
+ "vmii1s0",
234
+ "vmii3p0",
235
+ "vmii3s0",
236
+ "vmip1p0",
237
+ "vmip1s0",
238
+ "vmip2p0",
239
+ "vmip2s0",
240
+ "vmip3p0",
241
+ "vmip3s0",
242
+ "vmis3p0",
243
+ "vmis3s0",
244
+ "vmm01p0",
245
+ "vmm02s0",
246
+ "vmm03p0",
247
+ "vmm03s0",
248
+ "vmn0000",
249
+ "vmp0000",
250
+ "vmp00fs",
251
+ "vmp00mp",
252
+ "vmp00ms",
253
+ "vmp00pf",
254
+ "vmp00pm",
255
+ "vmp00sf",
256
+ "vmp00sm",
257
+ "vmsi1p0",
258
+ "vmsi1s0",
259
+ "vmsi3p0",
260
+ "vmsi3s0",
261
+ "vmsp1p0",
262
+ "vmsp1s0",
263
+ "vmsp2p0",
264
+ "vmsp2s0",
265
+ "vmsp3p0",
266
+ "vmsp3s0",
267
+ "vsg0000",
268
+ "vsic3p0",
269
+ "vsic3s0",
270
+ "vsif3p0",
271
+ "vsif3s0",
272
+ "vsii1p0",
273
+ "vsii1s0",
274
+ "vsii3p0",
275
+ "vsii3s0",
276
+ "vsip1p0",
277
+ "vsip1s0",
278
+ "vsip2s0",
279
+ "vsip3p0",
280
+ "vsip3s0",
281
+ "vsis3p0",
282
+ "vsis3s0",
283
+ "vsm03p0",
284
+ "vsm03s0",
285
+ "vsn0000",
286
+ "vsp00sm",
287
+ "vssi3p0",
288
+ "vssi3s0",
289
+ "vssp1p0",
290
+ "vssp3p0",
291
+ "vssp3s0",
292
+ "zm",
293
+ "zp"
294
+ ],
295
+ "neg_prefix":"!",
296
+ "overwrite":false
297
+ }
tagger/model ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c8e67e8cfc58bd24e3991814d534c121290a707c752f9df782dac8777bb1be7d
3
+ size 1193753
tokenizer ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ ��prefix_search� �^§|^%|^=|^—|^–|^-|^\+(?![0-9])|^…|^……|^,|^:|^;|^\!|^\?|^¿|^؟|^¡|^\(|^\)|^\[|^\]|^\{|^\}|^<|^>|^_|^#|^\*|^&|^。|^?|^!|^,|^、|^;|^:|^~|^·|^।|^،|^۔|^؛|^٪|^\.\.+|^…|^\'|^"|^”|^“|^`|^‘|^´|^’|^‚|^,|^„|^»|^«|^「|^」|^『|^』|^(|^)|^〔|^〕|^【|^】|^《|^》|^〈|^〉|^\$|^£|^€|^¥|^฿|^US\$|^C\$|^A\$|^₽|^﷼|^₴|^₠|^₡|^₢|^₣|^₤|^₥|^₦|^₧|^₨|^₩|^₪|^₫|^€|^₭|^₮|^₯|^₰|^₱|^₲|^₳|^₴|^₵|^₶|^₷|^₸|^₹|^₺|^₻|^₼|^₽|^₾|^₿|^[\u00A6\u00A9\u00AE\u00B0\u0482\u058D\u058E\u060E\u060F\u06DE\u06E9\u06FD\u06FE\u07F6\u09FA\u0B70\u0BF3-\u0BF8\u0BFA\u0C7F\u0D4F\u0D79\u0F01-\u0F03\u0F13\u0F15-\u0F17\u0F1A-\u0F1F\u0F34\u0F36\u0F38\u0FBE-\u0FC5\u0FC7-\u0FCC\u0FCE\u0FCF\u0FD5-\u0FD8\u109E\u109F\u1390-\u1399\u1940\u19DE-\u19FF\u1B61-\u1B6A\u1B74-\u1B7C\u2100\u2101\u2103-\u2106\u2108\u2109\u2114\u2116\u2117\u211E-\u2123\u2125\u2127\u2129\u212E\u213A\u213B\u214A\u214C\u214D\u214F\u218A\u218B\u2195-\u2199\u219C-\u219F\u21A1\u21A2\u21A4\u21A5\u21A7-\u21AD\u21AF-\u21CD\u21D0\u21D1\u21D3\u21D5-\u21F3\u2300-\u2307\u230C-\u231F\u2322-\u2328\u232B-\u237B\u237D-\u239A\u23B4-\u23DB\u23E2-\u2426\u2440-\u244A\u249C-\u24E9\u2500-\u25B6\u25B8-\u25C0\u25C2-\u25F7\u2600-\u266E\u2670-\u2767\u2794-\u27BF\u2800-\u28FF\u2B00-\u2B2F\u2B45\u2B46\u2B4D-\u2B73\u2B76-\u2B95\u2B98-\u2BC8\u2BCA-\u2BFE\u2CE5-\u2CEA\u2E80-\u2E99\u2E9B-\u2EF3\u2F00-\u2FD5\u2FF0-\u2FFB\u3004\u3012\u3013\u3020\u3036\u3037\u303E\u303F\u3190\u3191\u3196-\u319F\u31C0-\u31E3\u3200-\u321E\u322A-\u3247\u3250\u3260-\u327F\u328A-\u32B0\u32C0-\u32FE\u3300-\u33FF\u4DC0-\u4DFF\uA490-\uA4C6\uA828-\uA82B\uA836\uA837\uA839\uAA77-\uAA79\uFDFD\uFFE4\uFFE8\uFFED\uFFEE\uFFFC\uFFFD\U00010137-\U0001013F\U00010179-\U00010189\U0001018C-\U0001018E\U00010190-\U0001019B\U000101A0\U000101D0-\U000101FC\U00010877\U00010878\U00010AC8\U0001173F\U00016B3C-\U00016B3F\U00016B45\U0001BC9C\U0001D000-\U0001D0F5\U0001D100-\U0001D126\U0001D129-\U0001D164\U0001D16A-\U0001D16C\U0001D183\U0001D184\U0001D18C-\U0001D1A9\U0001D1AE-\U0001D1E8\U0001D200-\U0001D241\U0001D245\U0001D300-\U0001D356\U0001D800
-\U0001D9FF\U0001DA37-\U0001DA3A\U0001DA6D-\U0001DA74\U0001DA76-\U0001DA83\U0001DA85\U0001DA86\U0001ECAC\U0001F000-\U0001F02B\U0001F030-\U0001F093\U0001F0A0-\U0001F0AE\U0001F0B1-\U0001F0BF\U0001F0C1-\U0001F0CF\U0001F0D1-\U0001F0F5\U0001F110-\U0001F16B\U0001F170-\U0001F1AC\U0001F1E6-\U0001F202\U0001F210-\U0001F23B\U0001F240-\U0001F248\U0001F250\U0001F251\U0001F260-\U0001F265\U0001F300-\U0001F3FA\U0001F400-\U0001F6D4\U0001F6E0-\U0001F6EC\U0001F6F0-\U0001F6F9\U0001F700-\U0001F773\U0001F780-\U0001F7D8\U0001F800-\U0001F80B\U0001F810-\U0001F847\U0001F850-\U0001F859\U0001F860-\U0001F887\U0001F890-\U0001F8AD\U0001F900-\U0001F90B\U0001F910-\U0001F93E\U0001F940-\U0001F970\U0001F973-\U0001F976\U0001F97A\U0001F97C-\U0001F9A2\U0001F9B0-\U0001F9B9\U0001F9C0-\U0001F9C2\U0001F9D0-\U0001F9FF\U0001FA60-\U0001FA6D]�suffix_search�2f…$|……$|,$|:$|;$|\!$|\?$|¿$|؟$|¡$|\($|\)$|\[$|\]$|\{$|\}$|<$|>$|_$|#$|\*$|&$|。$|?$|!$|,$|、$|;$|:$|~$|·$|।$|،$|۔$|؛$|٪$|\.\.+$|…$|\'$|"$|”$|“$|`$|‘$|´$|’$|‚$|,$|„$|»$|«$|「$|」$|『$|』$|($|)$|〔$|〕$|【$|】$|《$|》$|〈$|〉$|[\u00A6\u00A9\u00AE\u00B0\u0482\u058D\u058E\u060E\u060F\u06DE\u06E9\u06FD\u06FE\u07F6\u09FA\u0B70\u0BF3-\u0BF8\u0BFA\u0C7F\u0D4F\u0D79\u0F01-\u0F03\u0F13\u0F15-\u0F17\u0F1A-\u0F1F\u0F34\u0F36\u0F38\u0FBE-\u0FC5\u0FC7-\u0FCC\u0FCE\u0FCF\u0FD5-\u0FD8\u109E\u109F\u1390-\u1399\u1940\u19DE-\u19FF\u1B61-\u1B6A\u1B74-\u1B7C\u2100\u2101\u2103-\u2106\u2108\u2109\u2114\u2116\u2117\u211E-\u2123\u2125\u2127\u2129\u212E\u213A\u213B\u214A\u214C\u214D\u214F\u218A\u218B\u2195-\u2199\u219C-\u219F\u21A1\u21A2\u21A4\u21A5\u21A7-\u21AD\u21AF-\u21CD\u21D0\u21D1\u21D3\u21D5-\u21F3\u2300-\u2307\u230C-\u231F\u2322-\u2328\u232B-\u237B\u237D-\u239A\u23B4-\u23DB\u23E2-\u2426\u2440-\u244A\u249C-\u24E9\u2500-\u25B6\u25B8-\u25C0\u25C2-\u25F7\u2600-\u266E\u2670-\u2767\u2794-\u27BF\u2800-\u28FF\u2B00-\u2B2F\u2B45\u2B46\u2B4D-\u2B73\u2B76-\u2B95\u2B98-\u2BC8\u2BCA-\u2BFE\u2CE5-\u2CEA\u2E80-\u2E99\u2E9B-\u2EF3\u2F00-\u2FD5\u2FF0-\u2FFB\u3004\u3012\u3013\u3020\u3036\u3037\u303E\u303F\u3
190\u3191\u3196-\u319F\u31C0-\u31E3\u3200-\u321E\u322A-\u3247\u3250\u3260-\u327F\u328A-\u32B0\u32C0-\u32FE\u3300-\u33FF\u4DC0-\u4DFF\uA490-\uA4C6\uA828-\uA82B\uA836\uA837\uA839\uAA77-\uAA79\uFDFD\uFFE4\uFFE8\uFFED\uFFEE\uFFFC\uFFFD\U00010137-\U0001013F\U00010179-\U00010189\U0001018C-\U0001018E\U00010190-\U0001019B\U000101A0\U000101D0-\U000101FC\U00010877\U00010878\U00010AC8\U0001173F\U00016B3C-\U00016B3F\U00016B45\U0001BC9C\U0001D000-\U0001D0F5\U0001D100-\U0001D126\U0001D129-\U0001D164\U0001D16A-\U0001D16C\U0001D183\U0001D184\U0001D18C-\U0001D1A9\U0001D1AE-\U0001D1E8\U0001D200-\U0001D241\U0001D245\U0001D300-\U0001D356\U0001D800-\U0001D9FF\U0001DA37-\U0001DA3A\U0001DA6D-\U0001DA74\U0001DA76-\U0001DA83\U0001DA85\U0001DA86\U0001ECAC\U0001F000-\U0001F02B\U0001F030-\U0001F093\U0001F0A0-\U0001F0AE\U0001F0B1-\U0001F0BF\U0001F0C1-\U0001F0CF\U0001F0D1-\U0001F0F5\U0001F110-\U0001F16B\U0001F170-\U0001F1AC\U0001F1E6-\U0001F202\U0001F210-\U0001F23B\U0001F240-\U0001F248\U0001F250\U0001F251\U0001F260-\U0001F265\U0001F300-\U0001F3FA\U0001F400-\U0001F6D4\U0001F6E0-\U0001F6EC\U0001F6F0-\U0001F6F9\U0001F700-\U0001F773\U0001F780-\U0001F7D8\U0001F800-\U0001F80B\U0001F810-\U0001F847\U0001F850-\U0001F859\U0001F860-\U0001F887\U0001F890-\U0001F8AD\U0001F900-\U0001F90B\U0001F910-\U0001F93E\U0001F940-\U0001F970\U0001F973-\U0001F976\U0001F97A\U0001F97C-\U0001F9A2\U0001F9B0-\U0001F9B9\U0001F9C0-\U0001F9C2\U0001F9D0-\U0001F9FF\U0001FA60-\U0001FA6D]$|-$|—$|–$|(?<=[0-9])\+$|(?<=°[FfCcKk])\.$|(?<=[0-9])(?:\$|£|€|¥|฿|US\$|C\$|A\$|₽|﷼|₴|₠|₡|₢|₣|₤|₥|₦|₧|₨|₩|₪|₫|€|₭|₮|₯|₰|₱|₲|₳|₴|₵|₶|₷|₸|₹|₺|₻|₼|₽|₾|₿)$|(?<=[0-9])(?:km|km²|km³|m|m²|m³|dm|dm²|dm³|cm|cm²|cm³|mm|mm²|mm³|ha|µm|nm|yd|in|ft|kg|g|mg|µg|t|lb|oz|m/s|km/h|kmh|mph|hPa|Pa|mbar|mb|MB|kb|KB|gb|GB|tb|TB|T|G|M|K|км|км²|км³|м|м²|м³|дм|дм²|дм³|см|см²|см³|мм|мм²|мм³|нм|кг|г|мг|м/с|км/ч|кПа|Па|мбар|Кб|КБ|кб|Мб|МБ|мб|Гб|ГБ|гб|Тб|ТБ|тбكم|كم²|كم³|م|م²|م³|سم|سم²|سم³|مم|مم²|مم³|كم|غرام|جرام|جم|كغ|ملغ|كوب|اكواب)$|(?<=[0-9a-z\uFF41-\uFF5A\u00DF-\u00F6\u00F8-\u00
FF\u0101\u0103\u0105\u0107\u0109\u010B\u010D\u010F\u0111\u0113\u0115\u0117\u0119\u011B\u011D\u011F\u0121\u0123\u0125\u0127\u0129\u012B\u012D\u012F\u0131\u0133\u0135\u0137\u0138\u013A\u013C\u013E\u0140\u0142\u0144\u0146\u0148\u0149\u014B\u014D\u014F\u0151\u0153\u0155\u0157\u0159\u015B\u015D\u015F\u0161\u0163\u0165\u0167\u0169\u016B\u016D\u016F\u0171\u0173\u0175\u0177\u017A\u017C\u017E\u017F\u0180\u0183\u0185\u0188\u018C\u018D\u0192\u0195\u0199-\u019B\u019E\u01A1\u01A3\u01A5\u01A8\u01AA\u01AB\u01AD\u01B0\u01B4\u01B6\u01B9\u01BA\u01BD-\u01BF\u01C6\u01C9\u01CC\u01CE\u01D0\u01D2\u01D4\u01D6\u01D8\u01DA\u01DC\u01DD\u01DF\u01E1\u01E3\u01E5\u01E7\u01E9\u01EB\u01ED\u01EF\u01F0\u01F3\u01F5\u01F9\u01FB\u01FD\u01FF\u0201\u0203\u0205\u0207\u0209\u020B\u020D\u020F\u0211\u0213\u0215\u0217\u0219\u021B\u021D\u021F\u0221\u0223\u0225\u0227\u0229\u022B\u022D\u022F\u0231\u0233-\u0239\u023C\u023F\u0240\u0242\u0247\u0249\u024B\u024D\u024F\u2C61\u2C65\u2C66\u2C68\u2C6A\u2C6C\u2C71\u2C73\u2C74\u2C76-\u2C7B\uA723\uA725\uA727\uA729\uA72B\uA72D\uA72F-\uA731\uA733\uA735\uA737\uA739\uA73B\uA73D\uA73F\uA741\uA743\uA745\uA747\uA749\uA74B\uA74D\uA74F\uA751\uA753\uA755\uA757\uA759\uA75B\uA75D\uA75F\uA761\uA763\uA765\uA767\uA769\uA76B\uA76D\uA76F\uA771-\uA778\uA77A\uA77C\uA77F\uA781\uA783\uA785\uA787\uA78C\uA78E\uA791\uA793-\uA795\uA797\uA799\uA79B\uA79D\uA79F\uA7A1\uA7A3\uA7A5\uA7A7\uA7A9\uA7AF\uA7B5\uA7B7\uA7B9\uA7FA\uAB30-\uAB5A\uAB60-\uAB64\u0250-\u02AF\u1D00-\u1D25\u1D6B-\u1D77\u1D79-\u1D9A\u1E01\u1E03\u1E05\u1E07\u1E09\u1E0B\u1E0D\u1E0F\u1E11\u1E13\u1E15\u1E17\u1E19\u1E1B\u1E1D\u1E1F\u1E21\u1E23\u1E25\u1E27\u1E29\u1E2B\u1E2D\u1E2F\u1E31\u1E33\u1E35\u1E37\u1E39\u1E3B\u1E3D\u1E3F\u1E41\u1E43\u1E45\u1E47\u1E49\u1E4B\u1E4D\u1E4F\u1E51\u1E53\u1E55\u1E57\u1E59\u1E5B\u1E5D\u1E5F\u1E61\u1E63\u1E65\u1E67\u1E69\u1E6B\u1E6D\u1E6F\u1E71\u1E73\u1E75\u1E77\u1E79\u1E7B\u1E7D\u1E7F\u1E81\u1E83\u1E85\u1E87\u1E89\u1E8B\u1E8D\u1E8F\u1E91\u1E93\u1E95-\u1E9D\u1E9F\u1EA1\u1EA3\u1EA5\u1EA7\u1EA9\u1EAB\u1EAD\u1EAF\u1E
B1\u1EB3\u1EB5\u1EB7\u1EB9\u1EBB\u1EBD\u1EBF\u1EC1\u1EC3\u1EC5\u1EC7\u1EC9\u1ECB\u1ECD\u1ECF\u1ED1\u1ED3\u1ED5\u1ED7\u1ED9\u1EDB\u1EDD\u1EDF\u1EE1\u1EE3\u1EE5\u1EE7\u1EE9\u1EEB\u1EED\u1EEF\u1EF1\u1EF3\u1EF5\u1EF7\u1EF9\u1EFB\u1EFD\u1EFFёа-яәөүҗңһα-ωάέίόώήύа-щюяіїєґѓѕјљњќѐѝ\u1200-\u137F\u0980-\u09FF\u0591-\u05F4\uFB1D-\uFB4F\u0620-\u064A\u066E-\u06D5\u06E5-\u06FF\u0750-\u077F\u08A0-\u08BD\uFB50-\uFBB1\uFBD3-\uFD3D\uFD50-\uFDC7\uFDF0-\uFDFB\uFE70-\uFEFC\U0001EE00-\U0001EEBB\u0D80-\u0DFF\u0900-\u097F\u0C80-\u0CFF\u0B80-\u0BFF\u0C00-\u0C7F\uAC00-\uD7AF\u1100-\u11FF\u3040-\u309F\u30A0-\u30FFー\u4E00-\u62FF\u6300-\u77FF\u7800-\u8CFF\u8D00-\u9FFF\u3400-\u4DBF\U00020000-\U000215FF\U00021600-\U000230FF\U00023100-\U000245FF\U00024600-\U000260FF\U00026100-\U000275FF\U00027600-\U000290FF\U00029100-\U0002A6DF\U0002A700-\U0002B73F\U0002B740-\U0002B81F\U0002B820-\U0002CEAF\U0002CEB0-\U0002EBEF\u2E80-\u2EFF\u2F00-\u2FDF\u2FF0-\u2FFF\u3000-\u303F\u31C0-\u31EF\u3200-\u32FF\u3300-\u33FF\uF900-\uFAFF\uFE30-\uFE4F\U0001F200-\U0001F2FF\U0002F800-\U0002FA1F%²\-\+…|……|,|:|;|\!|\?|¿|؟|¡|\(|\)|\[|\]|\{|\}|<|>|_|#|\*|&|。|?|!|,|、|;|:|~|·|।|،|۔|؛|٪(?:\'"”“`‘´’‚,„»«「」『』()〔〕【】《》〈〉)])\.$|(?<=[A-Z\uFF21-\uFF3A\u00C0-\u00D6\u00D8-\u00DE\u0100\u0102\u0104\u0106\u0108\u010A\u010C\u010E\u0110\u0112\u0114\u0116\u0118\u011A\u011C\u011E\u0120\u0122\u0124\u0126\u0128\u012A\u012C\u012E\u0130\u0132\u0134\u0136\u0139\u013B\u013D\u013F\u0141\u0143\u0145\u0147\u014A\u014C\u014E\u0150\u0152\u0154\u0156\u0158\u015A\u015C\u015E\u0160\u0162\u0164\u0166\u0168\u016A\u016C\u016E\u0170\u0172\u0174\u0176\u0178\u0179\u017B\u017D\u0181\u0182\u0184\u0186\u0187\u0189-\u018B\u018E-\u0191\u0193\u0194\u0196-\u0198\u019C\u019D\u019F\u01A0\u01A2\u01A4\u01A6\u01A7\u01A9\u01AC\u01AE\u01AF\u01B1-\u01B3\u01B5\u01B7\u01B8\u01BC\u01C4\u01C7\u01CA\u01CD\u01CF\u01D1\u01D3\u01D5\u01D7\u01D9\u01DB\u01DE\u01E0\u01E2\u01E4\u01E6\u01E8\u01EA\u01EC\u01EE\u01F1\u01F4\u01F6-\u01F8\u01FA\u01FC\u01FE\u0200\u0202\u0204\u0206\u0208\u020A\u020C\u020E
\u0210\u0212\u0214\u0216\u0218\u021A\u021C\u021E\u0220\u0222\u0224\u0226\u0228\u022A\u022C\u022E\u0230\u0232\u023A\u023B\u023D\u023E\u0241\u0243-\u0246\u0248\u024A\u024C\u024E\u2C60\u2C62-\u2C64\u2C67\u2C69\u2C6B\u2C6D-\u2C70\u2C72\u2C75\u2C7E\u2C7F\uA722\uA724\uA726\uA728\uA72A\uA72C\uA72E\uA732\uA734\uA736\uA738\uA73A\uA73C\uA73E\uA740\uA742\uA744\uA746\uA748\uA74A\uA74C\uA74E\uA750\uA752\uA754\uA756\uA758\uA75A\uA75C\uA75E\uA760\uA762\uA764\uA766\uA768\uA76A\uA76C\uA76E\uA779\uA77B\uA77D\uA77E\uA780\uA782\uA784\uA786\uA78B\uA78D\uA790\uA792\uA796\uA798\uA79A\uA79C\uA79E\uA7A0\uA7A2\uA7A4\uA7A6\uA7A8\uA7AA-\uA7AE\uA7B0-\uA7B4\uA7B6\uA7B8\u1E00\u1E02\u1E04\u1E06\u1E08\u1E0A\u1E0C\u1E0E\u1E10\u1E12\u1E14\u1E16\u1E18\u1E1A\u1E1C\u1E1E\u1E20\u1E22\u1E24\u1E26\u1E28\u1E2A\u1E2C\u1E2E\u1E30\u1E32\u1E34\u1E36\u1E38\u1E3A\u1E3C\u1E3E\u1E40\u1E42\u1E44\u1E46\u1E48\u1E4A\u1E4C\u1E4E\u1E50\u1E52\u1E54\u1E56\u1E58\u1E5A\u1E5C\u1E5E\u1E60\u1E62\u1E64\u1E66\u1E68\u1E6A\u1E6C\u1E6E\u1E70\u1E72\u1E74\u1E76\u1E78\u1E7A\u1E7C\u1E7E\u1E80\u1E82\u1E84\u1E86\u1E88\u1E8A\u1E8C\u1E8E\u1E90\u1E92\u1E94\u1E9E\u1EA0\u1EA2\u1EA4\u1EA6\u1EA8\u1EAA\u1EAC\u1EAE\u1EB0\u1EB2\u1EB4\u1EB6\u1EB8\u1EBA\u1EBC\u1EBE\u1EC0\u1EC2\u1EC4\u1EC6\u1EC8\u1ECA\u1ECC\u1ECE\u1ED0\u1ED2\u1ED4\u1ED6\u1ED8\u1EDA\u1EDC\u1EDE\u1EE0\u1EE2\u1EE4\u1EE6\u1EE8\u1EEA\u1EEC\u1EEE\u1EF0\u1EF2\u1EF4\u1EF6\u1EF8\u1EFA\u1EFC\u1EFEЁА-ЯӘӨҮҖҢҺΑ-ΩΆΈΊΌΏΉΎА-ЩЮЯІЇЄҐЃЅЈЉЊЌЀЍ\u1200-\u137F\u0980-\u09FF\u0591-\u05F4\uFB1D-\uFB4F\u0620-\u064A\u066E-\u06D5\u06E5-\u06FF\u0750-\u077F\u08A0-\u08BD\uFB50-\uFBB1\uFBD3-\uFD3D\uFD50-\uFDC7\uFDF0-\uFDFB\uFE70-\uFEFC\U0001EE00-\U0001EEBB\u0D80-\u0DFF\u0900-\u097F\u0C80-\u0CFF\u0B80-\u0BFF\u0C00-\u0C7F\uAC00-\uD7AF\u1100-\u11FF\u3040-\u309F\u30A0-\u30FFー\u4E00-\u62FF\u6300-\u77FF\u7800-\u8CFF\u8D00-\u9FFF\u3400-\u4DBF\U00020000-\U000215FF\U00021600-\U000230FF\U00023100-\U000245FF\U00024600-\U000260FF\U00026100-\U000275FF\U00027600-\U000290FF\U00029100-\U0002A6DF\U0002A700-\U0002B73F\U0002B740-\U0002B
81F\U0002B820-\U0002CEAF\U0002CEB0-\U0002EBEF\u2E80-\u2EFF\u2F00-\u2FDF\u2FF0-\u2FFF\u3000-\u303F\u31C0-\u31EF\u3200-\u32FF\u3300-\u33FF\uF900-\uFAFF\uFE30-\uFE4F\U0001F200-\U0001F2FF\U0002F800-\U0002FA1F][A-Z\uFF21-\uFF3A\u00C0-\u00D6\u00D8-\u00DE\u0100\u0102\u0104\u0106\u0108\u010A\u010C\u010E\u0110\u0112\u0114\u0116\u0118\u011A\u011C\u011E\u0120\u0122\u0124\u0126\u0128\u012A\u012C\u012E\u0130\u0132\u0134\u0136\u0139\u013B\u013D\u013F\u0141\u0143\u0145\u0147\u014A\u014C\u014E\u0150\u0152\u0154\u0156\u0158\u015A\u015C\u015E\u0160\u0162\u0164\u0166\u0168\u016A\u016C\u016E\u0170\u0172\u0174\u0176\u0178\u0179\u017B\u017D\u0181\u0182\u0184\u0186\u0187\u0189-\u018B\u018E-\u0191\u0193\u0194\u0196-\u0198\u019C\u019D\u019F\u01A0\u01A2\u01A4\u01A6\u01A7\u01A9\u01AC\u01AE\u01AF\u01B1-\u01B3\u01B5\u01B7\u01B8\u01BC\u01C4\u01C7\u01CA\u01CD\u01CF\u01D1\u01D3\u01D5\u01D7\u01D9\u01DB\u01DE\u01E0\u01E2\u01E4\u01E6\u01E8\u01EA\u01EC\u01EE\u01F1\u01F4\u01F6-\u01F8\u01FA\u01FC\u01FE\u0200\u0202\u0204\u0206\u0208\u020A\u020C\u020E\u0210\u0212\u0214\u0216\u0218\u021A\u021C\u021E\u0220\u0222\u0224\u0226\u0228\u022A\u022C\u022E\u0230\u0232\u023A\u023B\u023D\u023E\u0241\u0243-\u0246\u0248\u024A\u024C\u024E\u2C60\u2C62-\u2C64\u2C67\u2C69\u2C6B\u2C6D-\u2C70\u2C72\u2C75\u2C7E\u2C7F\uA722\uA724\uA726\uA728\uA72A\uA72C\uA72E\uA732\uA734\uA736\uA738\uA73A\uA73C\uA73E\uA740\uA742\uA744\uA746\uA748\uA74A\uA74C\uA74E\uA750\uA752\uA754\uA756\uA758\uA75A\uA75C\uA75E\uA760\uA762\uA764\uA766\uA768\uA76A\uA76C\uA76E\uA779\uA77B\uA77D\uA77E\uA780\uA782\uA784\uA786\uA78B\uA78D\uA790\uA792\uA796\uA798\uA79A\uA79C\uA79E\uA7A0\uA7A2\uA7A4\uA7A6\uA7A8\uA7AA-\uA7AE\uA7B0-\uA7B4\uA7B6\uA7B8\u1E00\u1E02\u1E04\u1E06\u1E08\u1E0A\u1E0C\u1E0E\u1E10\u1E12\u1E14\u1E16\u1E18\u1E1A\u1E1C\u1E1E\u1E20\u1E22\u1E24\u1E26\u1E28\u1E2A\u1E2C\u1E2E\u1E30\u1E32\u1E34\u1E36\u1E38\u1E3A\u1E3C\u1E3E\u1E40\u1E42\u1E44\u1E46\u1E48\u1E4A\u1E4C\u1E4E\u1E50\u1E52\u1E54\u1E56\u1E58\u1E5A\u1E5C\u1E5E\u1E60\u1E62\u1E64\u1E66\u1E68\u1E6A\u
1E6C\u1E6E\u1E70\u1E72\u1E74\u1E76\u1E78\u1E7A\u1E7C\u1E7E\u1E80\u1E82\u1E84\u1E86\u1E88\u1E8A\u1E8C\u1E8E\u1E90\u1E92\u1E94\u1E9E\u1EA0\u1EA2\u1EA4\u1EA6\u1EA8\u1EAA\u1EAC\u1EAE\u1EB0\u1EB2\u1EB4\u1EB6\u1EB8\u1EBA\u1EBC\u1EBE\u1EC0\u1EC2\u1EC4\u1EC6\u1EC8\u1ECA\u1ECC\u1ECE\u1ED0\u1ED2\u1ED4\u1ED6\u1ED8\u1EDA\u1EDC\u1EDE\u1EE0\u1EE2\u1EE4\u1EE6\u1EE8\u1EEA\u1EEC\u1EEE\u1EF0\u1EF2\u1EF4\u1EF6\u1EF8\u1EFA\u1EFC\u1EFEЁА-ЯӘӨҮҖҢҺΑ-ΩΆΈΊΌΏΉΎА-ЩЮЯІЇЄҐЃЅЈЉЊЌЀЍ\u1200-\u137F\u0980-\u09FF\u0591-\u05F4\uFB1D-\uFB4F\u0620-\u064A\u066E-\u06D5\u06E5-\u06FF\u0750-\u077F\u08A0-\u08BD\uFB50-\uFBB1\uFBD3-\uFD3D\uFD50-\uFDC7\uFDF0-\uFDFB\uFE70-\uFEFC\U0001EE00-\U0001EEBB\u0D80-\u0DFF\u0900-\u097F\u0C80-\u0CFF\u0B80-\u0BFF\u0C00-\u0C7F\uAC00-\uD7AF\u1100-\u11FF\u3040-\u309F\u30A0-\u30FFー\u4E00-\u62FF\u6300-\u77FF\u7800-\u8CFF\u8D00-\u9FFF\u3400-\u4DBF\U00020000-\U000215FF\U00021600-\U000230FF\U00023100-\U000245FF\U00024600-\U000260FF\U00026100-\U000275FF\U00027600-\U000290FF\U00029100-\U0002A6DF\U0002A700-\U0002B73F\U0002B740-\U0002B81F\U0002B820-\U0002CEAF\U0002CEB0-\U0002EBEF\u2E80-\u2EFF\u2F00-\u2FDF\u2FF0-\u2FFF\u3000-\u303F\u31C0-\u31EF\u3200-\u32FF\u3300-\u33FF\uF900-\uFAFF\uFE30-\uFE4F\U0001F200-\U0001F2FF\U0002F800-\U0002FA1F])\.$�infix_finditer�?9\.\.+|…|[\u00A6\u00A9\u00AE\u00B0\u0482\u058D\u058E\u060E\u060F\u06DE\u06E9\u06FD\u06FE\u07F6\u09FA\u0B70\u0BF3-\u0BF8\u0BFA\u0C7F\u0D4F\u0D79\u0F01-\u0F03\u0F13\u0F15-\u0F17\u0F1A-\u0F1F\u0F34\u0F36\u0F38\u0FBE-\u0FC5\u0FC7-\u0FCC\u0FCE\u0FCF\u0FD5-\u0FD8\u109E\u109F\u1390-\u1399\u1940\u19DE-\u19FF\u1B61-\u1B6A\u1B74-\u1B7C\u2100\u2101\u2103-\u2106\u2108\u2109\u2114\u2116\u2117\u211E-\u2123\u2125\u2127\u2129\u212E\u213A\u213B\u214A\u214C\u214D\u214F\u218A\u218B\u2195-\u2199\u219C-\u219F\u21A1\u21A2\u21A4\u21A5\u21A7-\u21AD\u21AF-\u21CD\u21D0\u21D1\u21D3\u21D5-\u21F3\u2300-\u2307\u230C-\u231F\u2322-\u2328\u232B-\u237B\u237D-\u239A\u23B4-\u23DB\u23E2-\u2426\u2440-\u244A\u249C-\u24E9\u2500-\u25B6\u25B8-\u25C0\u25C2-\u25F7\u2600-\u266E\u26
70-\u2767\u2794-\u27BF\u2800-\u28FF\u2B00-\u2B2F\u2B45\u2B46\u2B4D-\u2B73\u2B76-\u2B95\u2B98-\u2BC8\u2BCA-\u2BFE\u2CE5-\u2CEA\u2E80-\u2E99\u2E9B-\u2EF3\u2F00-\u2FD5\u2FF0-\u2FFB\u3004\u3012\u3013\u3020\u3036\u3037\u303E\u303F\u3190\u3191\u3196-\u319F\u31C0-\u31E3\u3200-\u321E\u322A-\u3247\u3250\u3260-\u327F\u328A-\u32B0\u32C0-\u32FE\u3300-\u33FF\u4DC0-\u4DFF\uA490-\uA4C6\uA828-\uA82B\uA836\uA837\uA839\uAA77-\uAA79\uFDFD\uFFE4\uFFE8\uFFED\uFFEE\uFFFC\uFFFD\U00010137-\U0001013F\U00010179-\U00010189\U0001018C-\U0001018E\U00010190-\U0001019B\U000101A0\U000101D0-\U000101FC\U00010877\U00010878\U00010AC8\U0001173F\U00016B3C-\U00016B3F\U00016B45\U0001BC9C\U0001D000-\U0001D0F5\U0001D100-\U0001D126\U0001D129-\U0001D164\U0001D16A-\U0001D16C\U0001D183\U0001D184\U0001D18C-\U0001D1A9\U0001D1AE-\U0001D1E8\U0001D200-\U0001D241\U0001D245\U0001D300-\U0001D356\U0001D800-\U0001D9FF\U0001DA37-\U0001DA3A\U0001DA6D-\U0001DA74\U0001DA76-\U0001DA83\U0001DA85\U0001DA86\U0001ECAC\U0001F000-\U0001F02B\U0001F030-\U0001F093\U0001F0A0-\U0001F0AE\U0001F0B1-\U0001F0BF\U0001F0C1-\U0001F0CF\U0001F0D1-\U0001F0F5\U0001F110-\U0001F16B\U0001F170-\U0001F1AC\U0001F1E6-\U0001F202\U0001F210-\U0001F23B\U0001F240-\U0001F248\U0001F250\U0001F251\U0001F260-\U0001F265\U0001F300-\U0001F3FA\U0001F400-\U0001F6D4\U0001F6E0-\U0001F6EC\U0001F6F0-\U0001F6F9\U0001F700-\U0001F773\U0001F780-\U0001F7D8\U0001F800-\U0001F80B\U0001F810-\U0001F847\U0001F850-\U0001F859\U0001F860-\U0001F887\U0001F890-\U0001F8AD\U0001F900-\U0001F90B\U0001F910-\U0001F93E\U0001F940-\U0001F970\U0001F973-\U0001F976\U0001F97A\U0001F97C-\U0001F9A2\U0001F9B0-\U0001F9B9\U0001F9C0-\U0001F9C2\U0001F9D0-\U0001F9FF\U0001FA60-\U0001FA6D]|(?<=[0-9])[+\-\*^](?=[0-9-])|(?<=[a-z\uFF41-\uFF5A\u00DF-\u00F6\u00F8-\u00FF\u0101\u0103\u0105\u0107\u0109\u010B\u010D\u010F\u0111\u0113\u0115\u0117\u0119\u011B\u011D\u011F\u0121\u0123\u0125\u0127\u0129\u012B\u012D\u012F\u0131\u0133\u0135\u0137\u0138\u013A\u013C\u013E\u0140\u0142\u0144\u0146\u0148\u0149\u014B\u014D\u014F\u0151\
u0153\u0155\u0157\u0159\u015B\u015D\u015F\u0161\u0163\u0165\u0167\u0169\u016B\u016D\u016F\u0171\u0173\u0175\u0177\u017A\u017C\u017E\u017F\u0180\u0183\u0185\u0188\u018C\u018D\u0192\u0195\u0199-\u019B\u019E\u01A1\u01A3\u01A5\u01A8\u01AA\u01AB\u01AD\u01B0\u01B4\u01B6\u01B9\u01BA\u01BD-\u01BF\u01C6\u01C9\u01CC\u01CE\u01D0\u01D2\u01D4\u01D6\u01D8\u01DA\u01DC\u01DD\u01DF\u01E1\u01E3\u01E5\u01E7\u01E9\u01EB\u01ED\u01EF\u01F0\u01F3\u01F5\u01F9\u01FB\u01FD\u01FF\u0201\u0203\u0205\u0207\u0209\u020B\u020D\u020F\u0211\u0213\u0215\u0217\u0219\u021B\u021D\u021F\u0221\u0223\u0225\u0227\u0229\u022B\u022D\u022F\u0231\u0233-\u0239\u023C\u023F\u0240\u0242\u0247\u0249\u024B\u024D\u024F\u2C61\u2C65\u2C66\u2C68\u2C6A\u2C6C\u2C71\u2C73\u2C74\u2C76-\u2C7B\uA723\uA725\uA727\uA729\uA72B\uA72D\uA72F-\uA731\uA733\uA735\uA737\uA739\uA73B\uA73D\uA73F\uA741\uA743\uA745\uA747\uA749\uA74B\uA74D\uA74F\uA751\uA753\uA755\uA757\uA759\uA75B\uA75D\uA75F\uA761\uA763\uA765\uA767\uA769\uA76B\uA76D\uA76F\uA771-\uA778\uA77A\uA77C\uA77F\uA781\uA783\uA785\uA787\uA78C\uA78E\uA791\uA793-\uA795\uA797\uA799\uA79B\uA79D\uA79F\uA7A1\uA7A3\uA7A5\uA7A7\uA7A9\uA7AF\uA7B5\uA7B7\uA7B9\uA7FA\uAB30-\uAB5A\uAB60-\uAB64\u0250-\u02AF\u1D00-\u1D25\u1D6B-\u1D77\u1D79-\u1D9A\u1E01\u1E03\u1E05\u1E07\u1E09\u1E0B\u1E0D\u1E0F\u1E11\u1E13\u1E15\u1E17\u1E19\u1E1B\u1E1D\u1E1F\u1E21\u1E23\u1E25\u1E27\u1E29\u1E2B\u1E2D\u1E2F\u1E31\u1E33\u1E35\u1E37\u1E39\u1E3B\u1E3D\u1E3F\u1E41\u1E43\u1E45\u1E47\u1E49\u1E4B\u1E4D\u1E4F\u1E51\u1E53\u1E55\u1E57\u1E59\u1E5B\u1E5D\u1E5F\u1E61\u1E63\u1E65\u1E67\u1E69\u1E6B\u1E6D\u1E6F\u1E71\u1E73\u1E75\u1E77\u1E79\u1E7B\u1E7D\u1E7F\u1E81\u1E83\u1E85\u1E87\u1E89\u1E8B\u1E8D\u1E8F\u1E91\u1E93\u1E95-\u1E9D\u1E9F\u1EA1\u1EA3\u1EA5\u1EA7\u1EA9\u1EAB\u1EAD\u1EAF\u1EB1\u1EB3\u1EB5\u1EB7\u1EB9\u1EBB\u1EBD\u1EBF\u1EC1\u1EC3\u1EC5\u1EC7\u1EC9\u1ECB\u1ECD\u1ECF\u1ED1\u1ED3\u1ED5\u1ED7\u1ED9\u1EDB\u1EDD\u1EDF\u1EE1\u1EE3\u1EE5\u1EE7\u1EE9\u1EEB\u1EED\u1EEF\u1EF1\u1EF3\u1EF5\u1EF7\u1EF9\u1EFB\u1EFD\u1EFFёа-яәөүҗңһα-ωάέίόώή
ύа-щюяіїєґѓѕјљњќѐѝ\u1200-\u137F\u0980-\u09FF\u0591-\u05F4\uFB1D-\uFB4F\u0620-\u064A\u066E-\u06D5\u06E5-\u06FF\u0750-\u077F\u08A0-\u08BD\uFB50-\uFBB1\uFBD3-\uFD3D\uFD50-\uFDC7\uFDF0-\uFDFB\uFE70-\uFEFC\U0001EE00-\U0001EEBB\u0D80-\u0DFF\u0900-\u097F\u0C80-\u0CFF\u0B80-\u0BFF\u0C00-\u0C7F\uAC00-\uD7AF\u1100-\u11FF\u3040-\u309F\u30A0-\u30FFー\u4E00-\u62FF\u6300-\u77FF\u7800-\u8CFF\u8D00-\u9FFF\u3400-\u4DBF\U00020000-\U000215FF\U00021600-\U000230FF\U00023100-\U000245FF\U00024600-\U000260FF\U00026100-\U000275FF\U00027600-\U000290FF\U00029100-\U0002A6DF\U0002A700-\U0002B73F\U0002B740-\U0002B81F\U0002B820-\U0002CEAF\U0002CEB0-\U0002EBEF\u2E80-\u2EFF\u2F00-\u2FDF\u2FF0-\u2FFF\u3000-\u303F\u31C0-\u31EF\u3200-\u32FF\u3300-\u33FF\uF900-\uFAFF\uFE30-\uFE4F\U0001F200-\U0001F2FF\U0002F800-\U0002FA1F\'"”“`‘´’‚,„»«「」『』()〔〕【】《》〈〉])\.(?=[A-Z\uFF21-\uFF3A\u00C0-\u00D6\u00D8-\u00DE\u0100\u0102\u0104\u0106\u0108\u010A\u010C\u010E\u0110\u0112\u0114\u0116\u0118\u011A\u011C\u011E\u0120\u0122\u0124\u0126\u0128\u012A\u012C\u012E\u0130\u0132\u0134\u0136\u0139\u013B\u013D\u013F\u0141\u0143\u0145\u0147\u014A\u014C\u014E\u0150\u0152\u0154\u0156\u0158\u015A\u015C\u015E\u0160\u0162\u0164\u0166\u0168\u016A\u016C\u016E\u0170\u0172\u0174\u0176\u0178\u0179\u017B\u017D\u0181\u0182\u0184\u0186\u0187\u0189-\u018B\u018E-\u0191\u0193\u0194\u0196-\u0198\u019C\u019D\u019F\u01A0\u01A2\u01A4\u01A6\u01A7\u01A9\u01AC\u01AE\u01AF\u01B1-\u01B3\u01B5\u01B7\u01B8\u01BC\u01C4\u01C7\u01CA\u01CD\u01CF\u01D1\u01D3\u01D5\u01D7\u01D9\u01DB\u01DE\u01E0\u01E2\u01E4\u01E6\u01E8\u01EA\u01EC\u01EE\u01F1\u01F4\u01F6-\u01F8\u01FA\u01FC\u01FE\u0200\u0202\u0204\u0206\u0208\u020A\u020C\u020E\u0210\u0212\u0214\u0216\u0218\u021A\u021C\u021E\u0220\u0222\u0224\u0226\u0228\u022A\u022C\u022E\u0230\u0232\u023A\u023B\u023D\u023E\u0241\u0243-\u0246\u0248\u024A\u024C\u024E\u2C60\u2C62-\u2C64\u2C67\u2C69\u2C6B\u2C6D-\u2C70\u2C72\u2C75\u2C7E\u2C7F\uA722\uA724\uA726\uA728\uA72A\uA72C\uA72E\uA732\uA734\uA736\uA738\uA73A\uA73C\uA73E\uA740\uA742\uA7
44\uA746\uA748\uA74A\uA74C\uA74E\uA750\uA752\uA754\uA756\uA758\uA75A\uA75C\uA75E\uA760\uA762\uA764\uA766\uA768\uA76A\uA76C\uA76E\uA779\uA77B\uA77D\uA77E\uA780\uA782\uA784\uA786\uA78B\uA78D\uA790\uA792\uA796\uA798\uA79A\uA79C\uA79E\uA7A0\uA7A2\uA7A4\uA7A6\uA7A8\uA7AA-\uA7AE\uA7B0-\uA7B4\uA7B6\uA7B8\u1E00\u1E02\u1E04\u1E06\u1E08\u1E0A\u1E0C\u1E0E\u1E10\u1E12\u1E14\u1E16\u1E18\u1E1A\u1E1C\u1E1E\u1E20\u1E22\u1E24\u1E26\u1E28\u1E2A\u1E2C\u1E2E\u1E30\u1E32\u1E34\u1E36\u1E38\u1E3A\u1E3C\u1E3E\u1E40\u1E42\u1E44\u1E46\u1E48\u1E4A\u1E4C\u1E4E\u1E50\u1E52\u1E54\u1E56\u1E58\u1E5A\u1E5C\u1E5E\u1E60\u1E62\u1E64\u1E66\u1E68\u1E6A\u1E6C\u1E6E\u1E70\u1E72\u1E74\u1E76\u1E78\u1E7A\u1E7C\u1E7E\u1E80\u1E82\u1E84\u1E86\u1E88\u1E8A\u1E8C\u1E8E\u1E90\u1E92\u1E94\u1E9E\u1EA0\u1EA2\u1EA4\u1EA6\u1EA8\u1EAA\u1EAC\u1EAE\u1EB0\u1EB2\u1EB4\u1EB6\u1EB8\u1EBA\u1EBC\u1EBE\u1EC0\u1EC2\u1EC4\u1EC6\u1EC8\u1ECA\u1ECC\u1ECE\u1ED0\u1ED2\u1ED4\u1ED6\u1ED8\u1EDA\u1EDC\u1EDE\u1EE0\u1EE2\u1EE4\u1EE6\u1EE8\u1EEA\u1EEC\u1EEE\u1EF0\u1EF2\u1EF4\u1EF6\u1EF8\u1EFA\u1EFC\u1EFEЁА-ЯӘӨҮҖҢҺΑ-ΩΆΈΊΌΏΉΎА-ЩЮЯІЇЄҐЃЅЈЉЊЌЀЍ\u1200-\u137F\u0980-\u09FF\u0591-\u05F4\uFB1D-\uFB4F\u0620-\u064A\u066E-\u06D5\u06E5-\u06FF\u0750-\u077F\u08A0-\u08BD\uFB50-\uFBB1\uFBD3-\uFD3D\uFD50-\uFDC7\uFDF0-\uFDFB\uFE70-\uFEFC\U0001EE00-\U0001EEBB\u0D80-\u0DFF\u0900-\u097F\u0C80-\u0CFF\u0B80-\u0BFF\u0C00-\u0C7F\uAC00-\uD7AF\u1100-\u11FF\u3040-\u309F\u30A0-\u30FFー\u4E00-\u62FF\u6300-\u77FF\u7800-\u8CFF\u8D00-\u9FFF\u3400-\u4DBF\U00020000-\U000215FF\U00021600-\U000230FF\U00023100-\U000245FF\U00024600-\U000260FF\U00026100-\U000275FF\U00027600-\U000290FF\U00029100-\U0002A6DF\U0002A700-\U0002B73F\U0002B740-\U0002B81F\U0002B820-\U0002CEAF\U0002CEB0-\U0002EBEF\u2E80-\u2EFF\u2F00-\u2FDF\u2FF0-\u2FFF\u3000-\u303F\u31C0-\u31EF\u3200-\u32FF\u3300-\u33FF\uF900-\uFAFF\uFE30-\uFE4F\U0001F200-\U0001F2FF\U0002F800-\U0002FA1F\'"”“`‘´’‚,„»«「」『』()〔〕【】《》〈〉])|(?<=[A-Za-z\uFF21-\uFF3A\uFF41-\uFF5A\u00C0-\u00D6\u00D8-\u00F6\u00F8-\u00FF\u0100-\u017F\u0180-\u01BF\u01C4-\u024
F\u2C60-\u2C7B\u2C7E\u2C7F\uA722-\uA76F\uA771-\uA787\uA78B-\uA78E\uA790-\uA7B9\uA7FA\uAB30-\uAB5A\uAB60-\uAB64\u0250-\u02AF\u1D00-\u1D25\u1D6B-\u1D77\u1D79-\u1D9A\u1E00-\u1EFFёа-яЁА-ЯәөүҗңһӘӨҮҖҢҺα-ωάέίόώήύΑ-ΩΆΈΊΌΏΉΎа-щюяіїєґА-ЩЮЯІЇЄҐѓѕјљњќѐѝЃЅЈЉЊЌЀЍ\u1200-\u137F\u0980-\u09FF\u0591-\u05F4\uFB1D-\uFB4F\u0620-\u064A\u066E-\u06D5\u06E5-\u06FF\u0750-\u077F\u08A0-\u08BD\uFB50-\uFBB1\uFBD3-\uFD3D\uFD50-\uFDC7\uFDF0-\uFDFB\uFE70-\uFEFC\U0001EE00-\U0001EEBB\u0D80-\u0DFF\u0900-\u097F\u0C80-\u0CFF\u0B80-\u0BFF\u0C00-\u0C7F\uAC00-\uD7AF\u1100-\u11FF\u3040-\u309F\u30A0-\u30FFー\u4E00-\u62FF\u6300-\u77FF\u7800-\u8CFF\u8D00-\u9FFF\u3400-\u4DBF\U00020000-\U000215FF\U00021600-\U000230FF\U00023100-\U000245FF\U00024600-\U000260FF\U00026100-\U000275FF\U00027600-\U000290FF\U00029100-\U0002A6DF\U0002A700-\U0002B73F\U0002B740-\U0002B81F\U0002B820-\U0002CEAF\U0002CEB0-\U0002EBEF\u2E80-\u2EFF\u2F00-\u2FDF\u2FF0-\u2FFF\u3000-\u303F\u31C0-\u31EF\u3200-\u32FF\u3300-\u33FF\uF900-\uFAFF\uFE30-\uFE4F\U0001F200-\U0001F2FF\U0002F800-\U0002FA1F]),(?=[A-Za-z\uFF21-\uFF3A\uFF41-\uFF5A\u00C0-\u00D6\u00D8-\u00F6\u00F8-\u00FF\u0100-\u017F\u0180-\u01BF\u01C4-\u024F\u2C60-\u2C7B\u2C7E\u2C7F\uA722-\uA76F\uA771-\uA787\uA78B-\uA78E\uA790-\uA7B9\uA7FA\uAB30-\uAB5A\uAB60-\uAB64\u0250-\u02AF\u1D00-\u1D25\u1D6B-\u1D77\u1D79-\u1D9A\u1E00-\u1EFFёа-яЁА-ЯәөүҗңһӘӨҮҖҢҺα-ωάέίόώήύΑ-ΩΆΈΊΌΏΉΎа-щюяіїєґА-ЩЮЯІЇЄҐѓѕјљњќѐѝЃЅЈЉЊЌЀЍ\u1200-\u137F\u0980-\u09FF\u0591-\u05F4\uFB1D-\uFB4F\u0620-\u064A\u066E-\u06D5\u06E5-\u06FF\u0750-\u077F\u08A0-\u08BD\uFB50-\uFBB1\uFBD3-\uFD3D\uFD50-\uFDC7\uFDF0-\uFDFB\uFE70-\uFEFC\U0001EE00-\U0001EEBB\u0D80-\u0DFF\u0900-\u097F\u0C80-\u0CFF\u0B80-\u0BFF\u0C00-\u0C7F\uAC00-\uD7AF\u1100-\u11FF\u3040-\u309F\u30A0-\u30FFー\u4E00-\u62FF\u6300-\u77FF\u7800-\u8CFF\u8D00-\u9FFF\u3400-\u4DBF\U00020000-\U000215FF\U00021600-\U000230FF\U00023100-\U000245FF\U00024600-\U000260FF\U00026100-\U000275FF\U00027600-\U000290FF\U00029100-\U0002A6DF\U0002A700-\U0002B73F\U0002B740-\U0002B81F\U0002B820-\U0002CEAF\U0002CEB0-\U0
002EBEF\u2E80-\u2EFF\u2F00-\u2FDF\u2FF0-\u2FFF\u3000-\u303F\u31C0-\u31EF\u3200-\u32FF\u3300-\u33FF\uF900-\uFAFF\uFE30-\uFE4F\U0001F200-\U0001F2FF\U0002F800-\U0002FA1F])|(?<=[A-Za-z\uFF21-\uFF3A\uFF41-\uFF5A\u00C0-\u00D6\u00D8-\u00F6\u00F8-\u00FF\u0100-\u017F\u0180-\u01BF\u01C4-\u024F\u2C60-\u2C7B\u2C7E\u2C7F\uA722-\uA76F\uA771-\uA787\uA78B-\uA78E\uA790-\uA7B9\uA7FA\uAB30-\uAB5A\uAB60-\uAB64\u0250-\u02AF\u1D00-\u1D25\u1D6B-\u1D77\u1D79-\u1D9A\u1E00-\u1EFFёа-яЁА-ЯәөүҗңһӘӨҮҖҢҺα-ωάέίόώήύΑ-ΩΆΈΊΌΏΉΎа-щюяіїєґА-ЩЮЯІЇЄҐѓѕјљњќѐѝЃЅЈЉЊЌЀЍ\u1200-\u137F\u0980-\u09FF\u0591-\u05F4\uFB1D-\uFB4F\u0620-\u064A\u066E-\u06D5\u06E5-\u06FF\u0750-\u077F\u08A0-\u08BD\uFB50-\uFBB1\uFBD3-\uFD3D\uFD50-\uFDC7\uFDF0-\uFDFB\uFE70-\uFEFC\U0001EE00-\U0001EEBB\u0D80-\u0DFF\u0900-\u097F\u0C80-\u0CFF\u0B80-\u0BFF\u0C00-\u0C7F\uAC00-\uD7AF\u1100-\u11FF\u3040-\u309F\u30A0-\u30FFー\u4E00-\u62FF\u6300-\u77FF\u7800-\u8CFF\u8D00-\u9FFF\u3400-\u4DBF\U00020000-\U000215FF\U00021600-\U000230FF\U00023100-\U000245FF\U00024600-\U000260FF\U00026100-\U000275FF\U00027600-\U000290FF\U00029100-\U0002A6DF\U0002A700-\U0002B73F\U0002B740-\U0002B81F\U0002B820-\U0002CEAF\U0002CEB0-\U0002EBEF\u2E80-\u2EFF\u2F00-\u2FDF\u2FF0-\u2FFF\u3000-\u303F\u31C0-\u31EF\u3200-\u32FF\u3300-\u33FF\uF900-\uFAFF\uFE30-\uFE4F\U0001F200-\U0001F2FF\U0002F800-\U0002FA1F0-9])[:<>=/](?=[A-Za-z\uFF21-\uFF3A\uFF41-\uFF5A\u00C0-\u00D6\u00D8-\u00F6\u00F8-\u00FF\u0100-\u017F\u0180-\u01BF\u01C4-\u024F\u2C60-\u2C7B\u2C7E\u2C7F\uA722-\uA76F\uA771-\uA787\uA78B-\uA78E\uA790-\uA7B9\uA7FA\uAB30-\uAB5A\uAB60-\uAB64\u0250-\u02AF\u1D00-\u1D25\u1D6B-\u1D77\u1D79-\u1D9A\u1E00-\u1EFFёа-яЁА-ЯәөүҗңһӘӨҮҖҢҺα-ωάέίόώήύΑ-ΩΆΈΊΌΏΉΎа-щюяіїєґА-ЩЮЯІЇЄҐѓѕјљњќѐѝЃЅЈЉЊЌЀЍ\u1200-\u137F\u0980-\u09FF\u0591-\u05F4\uFB1D-\uFB4F\u0620-\u064A\u066E-\u06D5\u06E5-\u06FF\u0750-\u077F\u08A0-\u08BD\uFB50-\uFBB1\uFBD3-\uFD3D\uFD50-\uFDC7\uFDF0-\uFDFB\uFE70-\uFEFC\U0001EE00-\U0001EEBB\u0D80-\u0DFF\u0900-\u097F\u0C80-\u0CFF\u0B80-\u0BFF\u0C00-\u0C7F\uAC00-\uD7AF\u1100-\u11FF\u3040-\u309F\u30A0-\u30
FFー\u4E00-\u62FF\u6300-\u77FF\u7800-\u8CFF\u8D00-\u9FFF\u3400-\u4DBF\U00020000-\U000215FF\U00021600-\U000230FF\U00023100-\U000245FF\U00024600-\U000260FF\U00026100-\U000275FF\U00027600-\U000290FF\U00029100-\U0002A6DF\U0002A700-\U0002B73F\U0002B740-\U0002B81F\U0002B820-\U0002CEAF\U0002CEB0-\U0002EBEF\u2E80-\u2EFF\u2F00-\u2FDF\u2FF0-\u2FFF\u3000-\u303F\u31C0-\u31EF\u3200-\u32FF\u3300-\u33FF\uF900-\uFAFF\uFE30-\uFE4F\U0001F200-\U0001F2FF\U0002F800-\U0002FA1F])|(?<=[A-Za-z\uFF21-\uFF3A\uFF41-\uFF5A\u00C0-\u00D6\u00D8-\u00F6\u00F8-\u00FF\u0100-\u017F\u0180-\u01BF\u01C4-\u024F\u2C60-\u2C7B\u2C7E\u2C7F\uA722-\uA76F\uA771-\uA787\uA78B-\uA78E\uA790-\uA7B9\uA7FA\uAB30-\uAB5A\uAB60-\uAB64\u0250-\u02AF\u1D00-\u1D25\u1D6B-\u1D77\u1D79-\u1D9A\u1E00-\u1EFFёа-яЁА-ЯәөүҗңһӘӨҮҖҢҺα-ωάέίόώήύΑ-ΩΆΈΊΌΏΉΎа-щюяіїєґА-ЩЮЯІЇЄҐѓѕјљњќѐѝЃЅЈЉЊЌЀЍ\u1200-\u137F\u0980-\u09FF\u0591-\u05F4\uFB1D-\uFB4F\u0620-\u064A\u066E-\u06D5\u06E5-\u06FF\u0750-\u077F\u08A0-\u08BD\uFB50-\uFBB1\uFBD3-\uFD3D\uFD50-\uFDC7\uFDF0-\uFDFB\uFE70-\uFEFC\U0001EE00-\U0001EEBB\u0D80-\u0DFF\u0900-\u097F\u0C80-\u0CFF\u0B80-\u0BFF\u0C00-\u0C7F\uAC00-\uD7AF\u1100-\u11FF\u3040-\u309F\u30A0-\u30FFー\u4E00-\u62FF\u6300-\u77FF\u7800-\u8CFF\u8D00-\u9FFF\u3400-\u4DBF\U00020000-\U000215FF\U00021600-\U000230FF\U00023100-\U000245FF\U00024600-\U000260FF\U00026100-\U000275FF\U00027600-\U000290FF\U00029100-\U0002A6DF\U0002A700-\U0002B73F\U0002B740-\U0002B81F\U0002B820-\U0002CEAF\U0002CEB0-\U0002EBEF\u2E80-\u2EFF\u2F00-\u2FDF\u2FF0-\u2FFF\u3000-\u303F\u31C0-\u31EF\u3200-\u32FF\u3300-\u33FF\uF900-\uFAFF\uFE30-\uFE4F\U0001F200-\U0001F2FF\U0002F800-\U0002FA1F]['’])(?=[A-Za-z\uFF21-\uFF3A\uFF41-\uFF5A\u00C0-\u00D6\u00D8-\u00F6\u00F8-\u00FF\u0100-\u017F\u0180-\u01BF\u01C4-\u024F\u2C60-\u2C7B\u2C7E\u2C7F\uA722-\uA76F\uA771-\uA787\uA78B-\uA78E\uA790-\uA7B9\uA7FA\uAB30-\uAB5A\uAB60-\uAB64\u0250-\u02AF\u1D00-\u1D25\u1D6B-\u1D77\u1D79-\u1D9A\u1E00-\u1EFFёа-яЁА-ЯәөүҗңһӘӨҮҖҢҺα-ωάέίόώήύΑ-ΩΆΈΊΌΏΉΎа-щюяіїєґА-ЩЮЯІЇЄҐѓѕјљњќѐѝЃЅЈЉЊЌЀЍ\u1200-\u137F\u0980-\u09FF\u0591
-\u05F4\uFB1D-\uFB4F\u0620-\u064A\u066E-\u06D5\u06E5-\u06FF\u0750-\u077F\u08A0-\u08BD\uFB50-\uFBB1\uFBD3-\uFD3D\uFD50-\uFDC7\uFDF0-\uFDFB\uFE70-\uFEFC\U0001EE00-\U0001EEBB\u0D80-\u0DFF\u0900-\u097F\u0C80-\u0CFF\u0B80-\u0BFF\u0C00-\u0C7F\uAC00-\uD7AF\u1100-\u11FF\u3040-\u309F\u30A0-\u30FFー\u4E00-\u62FF\u6300-\u77FF\u7800-\u8CFF\u8D00-\u9FFF\u3400-\u4DBF\U00020000-\U000215FF\U00021600-\U000230FF\U00023100-\U000245FF\U00024600-\U000260FF\U00026100-\U000275FF\U00027600-\U000290FF\U00029100-\U0002A6DF\U0002A700-\U0002B73F\U0002B740-\U0002B81F\U0002B820-\U0002CEAF\U0002CEB0-\U0002EBEF\u2E80-\u2EFF\u2F00-\u2FDF\u2FF0-\u2FFF\u3000-\u303F\u31C0-\u31EF\u3200-\u32FF\u3300-\u33FF\uF900-\uFAFF\uFE30-\uFE4F\U0001F200-\U0001F2FF\U0002F800-\U0002FA1F0-9])|('ls|'l|'ns|'t|'m|'n|-les|-la|-lo|-li|-los|-me|-nos|-te|-vos|-se|-hi|-ne|-ho)(?![A-Za-z])|(-l'|-m'|-t'|-n')�token_match��url_match�
2
+ ��A�
3
+ � ��A� �'��A�'�''��A�''�'l��A�'l�'ls��A�'ls�'m��A�'m�'n��A�'n�'ns��A�'ns�'s��A�'s�'t��A�'t�(*_*)��A�(*_*)�(-8��A�(-8�(-:��A�(-:�(-;��A�(-;�(-_-)��A�(-_-)�(._.)��A�(._.)�(:��A�(:�(;��A�(;�(=��A�(=�(>_<)��A�(>_<)�(^_^)��A�(^_^)�(o:��A�(o:�(¬_¬)��A�(¬_¬)�(ಠ_ಠ)��A�(ಠ_ಠ)�(╯°□°)╯︵┻━┻��A�(╯°□°)╯︵┻━┻�)-:��A�)-:�):��A�):�-_-��A�-_-�-__-��A�-__-�._.��A�._.�0.0��A�0.0�0.o��A�0.o�0_0��A�0_0�0_o��A�0_o�10a.m.��A�10�A�a.m.C�a.m.�10am��A�10�A�amC�a.m.�10p.m.��A�10�A�p.m.C�p.m.�10pm��A�10�A�pmC�p.m.�11a.m.��A�11�A�a.m.C�a.m.�11am��A�11�A�amC�a.m.�11p.m.��A�11�A�p.m.C�p.m.�11pm��A�11�A�pmC�p.m.�12a.m.��A�12�A�a.m.C�a.m.�12am��A�12�A�amC�a.m.�12m.��A�12�A�m.C�p.m.�12p.m.��A�12�A�p.m.C�p.m.�12pm��A�12�A�pmC�p.m.�1a.m.��A�1�A�a.m.C�a.m.�1am��A�1�A�amC�a.m.�1p.m.��A�1�A�p.m.C�p.m.�1pm��A�1�A�pmC�p.m.�2a.m.��A�2�A�a.m.C�a.m.�2am��A�2�A�amC�a.m.�2p.m.��A�2�A�p.m.C�p.m.�2pm��A�2�A�pmC�p.m.�3a.m.��A�3�A�a.m.C�a.m.�3am��A�3�A�amC�a.m.�3p.m.��A�3�A�p.m.C�p.m.�3pm��A�3�A�pmC�p.m.�4a.m.��A�4�A�a.m.C�a.m.�4am��A�4�A�amC�a.m.�4p.m.��A�4�A�p.m.C�p.m.�4pm��A�4�A�pmC�p.m.�5a.m.��A�5�A�a.m.C�a.m.�5am��A�5�A�amC�a.m.�5p.m.��A�5�A�p.m.C�p.m.�5pm��A�5�A�pmC�p.m.�6a.m.��A�6�A�a.m.C�a.m.�6am��A�6�A�amC�a.m.�6p.m.��A�6�A�p.m.C�p.m.�6pm��A�6�A�pmC�p.m.�7a.m.��A�7�A�a.m.C�a.m.�7am��A�7�A�amC�a.m.�7p.m.��A�7�A�p.m.C�p.m.�7pm��A�7�A�pmC�p.m.�8)��A�8)�8-)��A�8-)�8-D��A�8-D�8D��A�8D�8a.m.��A�8�A�a.m.C�a.m.�8am��A�8�A�amC�a.m.�8p.m.��A�8�A�p.m.C�p.m.�8pm��A�8�A�pmC�p.m.�9a.m.��A�9�A�a.m.C�a.m.�9am��A�9�A�amC�a.m.�9p.m.��A�9�A�p.m.C�p.m.�9pm��A�9�A�pmC�p.m.�:'(��A�:'(�:')��A�:')�:'-(��A�:'-(�:'-)��A�:'-)�:(��A�:(�:((��A�:((�:(((��A�:(((�:()��A�:()�:)��A�:)�:))��A�:))�:)))��A�:)))�:*��A�:*�:-(��A�:-(�:-((��A�:-((�:-(((��A�:-(((�:-)��A�:-)�:-))��A�:-))�:-)))��A�:-)))�:-*��A�:-*�:-/��A�:-/�:-0��A�:-0�:-3��A�:-3�:->��A�:->�:-D��A�:-D�:-O��A�:-O�:-P��A�:-P�:-X��A�:-X�:-]��A�:-]�:-o��A�:-o�:-p��A�:-p�:-x��A�:-x�:-|��A�:-|�:-}��A�:-}�:/��A�:/�:0��A�:0�:1��A�:1�:3��A�:3�:>��A�:>�:D��A�:D�:O��A�:O�:P��A�:P�:X��A�:X�:]��A
�:]�:o��A�:o�:o)��A�:o)�:p��A�:p�:x��A�:x�:|��A�:|�:}��A�:}�:’(��A�:’(�:’)��A�:’)�:’-(��A�:’-(�:’-)��A�:’-)�;)��A�;)�;-)��A�;-)�;-D��A�;-D�;D��A�;D�;_;��A�;_;�<.<��A�<.<�</3��A�</3�<3��A�<3�<33��A�<33�<333��A�<333�<space>��A�<space>�=(��A�=(�=)��A�=)�=/��A�=/�=3��A�=3�=D��A�=D�=[��A�=[�=]��A�=]�=|��A�=|�>.<��A�>.<�>.>��A�>.>�>:(��A�>:(�>:o��A�>:o�><(((*>��A�><(((*>�@_@��A�@_@�C++��A�C++�Dr.��A�Dr.C�doctor�Dra.��A�Dra.C�doctora�O.O��A�O.O�O.o��A�O.o�O_O��A�O_O�O_o��A�O_o�Sr.��A�Sr.C�senyor�Sra.��A�Sra.C�senyora�Srta.��A�Srta.C�senyoreta�St.��A�St.C�sant�Sta.��A�Sta.C�santa�V.V��A�V.V�V_V��A�V_V�XD��A�XD�XDD��A�XDD�[-:��A�[-:�[:��A�[:�[=��A�[=�\")��A�\")�\n��A�\n�\t��A�\t�]=��A�]=�^_^��A�^_^�^__^��A�^__^�^___^��A�^___^�a.��A�a.�abr.��A�abr.C�abril�al��A�a�A�lC�el�als��A�a�A�lsC�els�aprox.��A�aprox.C�aproximadament�b.��A�b.�c.��A�c.�d.��A�d.�dec.��A�dec.C�desembre�del��A�dC�de�A�el�dels��A�dC�de�A�els�e.��A�e.�f.��A�f.�feb.��A�feb.C�febrer�g.��A�g.�gen.��A�gen.C�gener�h.��A�h.�holahola��A�holaholaC�cocacola�i.��A�i.�j.��A�j.�jul.��A�jul.C�juliol�k.��A�k.�l.��A�l.�m.��A�m.�n.��A�n.�nov.��A�nov.C�novembre�núm��A�númC�número�o.��A�o.�o.0��A�o.0�o.O��A�o.O�o.o��A�o.o�o_0��A�o_0�o_O��A�o_O�o_o��A�o_o�oct.��A�oct.C�octubre�p.��A�p.�p.ex.��A�p.ex.C�per exemple�pel��A�pC�per�A�el�pels��A�pC�per�A�els�pl.��A�pl.C�plaça�pàg.��A�pàg.C�pàgina�q.��A�q.�r.��A�r.�s.��A�s.�set.��A�set.C�setembre�t.��A�t.�u.��A�u.�v.��A�v.�v.v��A�v.v�v_v��A�v_v�w.��A�w.�x.��A�x.�xD��A�xD�xDD��A�xDD�y.��A�y.�z.��A�z.� ��A� C� �¯\(ツ)/¯��A�¯\(ツ)/¯�°C.��A�°�A�C�A�.�°F.��A�°�A�F�A�.�°K.��A�°�A�K�A�.�°c.��A�°�A�c�A�.�°f.��A�°�A�f�A�.�°k.��A�°�A�k�A�.�à.��A�à.�ä.��A�ä.�è.��A�è.�é.��A�é.�í.��A�í.�ò.��A�ò.�ó.��A�ó.�ö.��A�ö.�ú.��A�ú.�ü.��A�ü.�ಠ_ಠ��A�ಠ_ಠ�ಠ︵ಠ��A�ಠ︵ಠ�—��A�—�’��A�’�’l��A�’l�’ls��A�’ls�’m��A�’m�’n��A�’n�’ns��A�’ns�’s��A�’s�’t��A�’t�’’��A�’’�faster_heuristics�
transformer/cfg ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ {
2
+ "max_batch_items":4096
3
+ }
transformer/model ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:313a34a754b8d5f772de2ec9b686d4fd59f31b4b954d85e75937fba850f01c41
3
+ size 1425149813
vocab/key2row ADDED
@@ -0,0 +1 @@
 
1
+
vocab/lookups.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:76be8b528d0075f7aae98d6fa57a6d3c83ae480a8469e668d7b0af968995ac71
3
+ size 1
vocab/strings.json ADDED
The diff for this file is too large to render. See raw diff
vocab/vectors ADDED
Binary file (128 Bytes). View file
vocab/vectors.cfg ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ {
2
+ "mode":"default"
3
+ }