grosenthal committed on
Commit
d64b580
1 Parent(s): 1de12d7

Upload tokenizer

Browse files
Files changed (4) hide show
  1. special_tokens_map.json +7 -0
  2. tokenizer.json +919 -0
  3. tokenizer_config.json +14 -0
  4. vocab.txt +769 -0
special_tokens_map.json ADDED
@@ -0,0 +1,7 @@
 
 
 
 
 
 
 
 
1
+ {
2
+ "cls_token": "[CLS]",
3
+ "mask_token": "[MASK]",
4
+ "pad_token": "[PAD]",
5
+ "sep_token": "[SEP]",
6
+ "unk_token": "[UNK]"
7
+ }
tokenizer.json ADDED
@@ -0,0 +1,919 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "version": "1.0",
3
+ "truncation": null,
4
+ "padding": null,
5
+ "added_tokens": [
6
+ {
7
+ "id": 0,
8
+ "content": "[PAD]",
9
+ "single_word": false,
10
+ "lstrip": false,
11
+ "rstrip": false,
12
+ "normalized": false,
13
+ "special": true
14
+ },
15
+ {
16
+ "id": 1,
17
+ "content": "[UNK]",
18
+ "single_word": false,
19
+ "lstrip": false,
20
+ "rstrip": false,
21
+ "normalized": false,
22
+ "special": true
23
+ },
24
+ {
25
+ "id": 2,
26
+ "content": "[CLS]",
27
+ "single_word": false,
28
+ "lstrip": false,
29
+ "rstrip": false,
30
+ "normalized": false,
31
+ "special": true
32
+ },
33
+ {
34
+ "id": 3,
35
+ "content": "[SEP]",
36
+ "single_word": false,
37
+ "lstrip": false,
38
+ "rstrip": false,
39
+ "normalized": false,
40
+ "special": true
41
+ },
42
+ {
43
+ "id": 4,
44
+ "content": "[MASK]",
45
+ "single_word": false,
46
+ "lstrip": false,
47
+ "rstrip": false,
48
+ "normalized": false,
49
+ "special": true
50
+ }
51
+ ],
52
+ "normalizer": {
53
+ "type": "BertNormalizer",
54
+ "clean_text": true,
55
+ "handle_chinese_chars": true,
56
+ "strip_accents": null,
57
+ "lowercase": true
58
+ },
59
+ "pre_tokenizer": {
60
+ "type": "BertPreTokenizer"
61
+ },
62
+ "post_processor": {
63
+ "type": "TemplateProcessing",
64
+ "single": [
65
+ {
66
+ "SpecialToken": {
67
+ "id": "[CLS]",
68
+ "type_id": 0
69
+ }
70
+ },
71
+ {
72
+ "Sequence": {
73
+ "id": "A",
74
+ "type_id": 0
75
+ }
76
+ },
77
+ {
78
+ "SpecialToken": {
79
+ "id": "[SEP]",
80
+ "type_id": 0
81
+ }
82
+ }
83
+ ],
84
+ "pair": [
85
+ {
86
+ "SpecialToken": {
87
+ "id": "[CLS]",
88
+ "type_id": 0
89
+ }
90
+ },
91
+ {
92
+ "Sequence": {
93
+ "id": "A",
94
+ "type_id": 0
95
+ }
96
+ },
97
+ {
98
+ "SpecialToken": {
99
+ "id": "[SEP]",
100
+ "type_id": 0
101
+ }
102
+ },
103
+ {
104
+ "Sequence": {
105
+ "id": "B",
106
+ "type_id": 1
107
+ }
108
+ },
109
+ {
110
+ "SpecialToken": {
111
+ "id": "[SEP]",
112
+ "type_id": 1
113
+ }
114
+ }
115
+ ],
116
+ "special_tokens": {
117
+ "[CLS]": {
118
+ "id": "[CLS]",
119
+ "ids": [
120
+ 2
121
+ ],
122
+ "tokens": [
123
+ "[CLS]"
124
+ ]
125
+ },
126
+ "[SEP]": {
127
+ "id": "[SEP]",
128
+ "ids": [
129
+ 3
130
+ ],
131
+ "tokens": [
132
+ "[SEP]"
133
+ ]
134
+ }
135
+ }
136
+ },
137
+ "decoder": {
138
+ "type": "WordPiece",
139
+ "prefix": "##",
140
+ "cleanup": true
141
+ },
142
+ "model": {
143
+ "type": "WordPiece",
144
+ "unk_token": "[UNK]",
145
+ "continuing_subword_prefix": "##",
146
+ "max_input_chars_per_word": 100,
147
+ "vocab": {
148
+ "[PAD]": 0,
149
+ "[UNK]": 1,
150
+ "[CLS]": 2,
151
+ "[SEP]": 3,
152
+ "[MASK]": 4,
153
+ "(": 5,
154
+ ")": 6,
155
+ ",": 7,
156
+ "0": 8,
157
+ "1": 9,
158
+ "2": 10,
159
+ "3": 11,
160
+ "4": 12,
161
+ "5": 13,
162
+ "6": 14,
163
+ "7": 15,
164
+ "8": 16,
165
+ "9": 17,
166
+ "[": 18,
167
+ "]": 19,
168
+ "a": 20,
169
+ "b": 21,
170
+ "c": 22,
171
+ "d": 23,
172
+ "e": 24,
173
+ "f": 25,
174
+ "g": 26,
175
+ "h": 27,
176
+ "i": 28,
177
+ "j": 29,
178
+ "l": 30,
179
+ "m": 31,
180
+ "n": 32,
181
+ "o": 33,
182
+ "p": 34,
183
+ "q": 35,
184
+ "r": 36,
185
+ "s": 37,
186
+ "t": 38,
187
+ "u": 39,
188
+ "v": 40,
189
+ "x": 41,
190
+ "y": 42,
191
+ "##3": 43,
192
+ "##1": 44,
193
+ "##p": 45,
194
+ "##r": 46,
195
+ "##e": 47,
196
+ "##s": 48,
197
+ "##a": 49,
198
+ "##c": 50,
199
+ "##t": 51,
200
+ "##i": 52,
201
+ "##v": 53,
202
+ "##m": 54,
203
+ "##2": 55,
204
+ "##n": 56,
205
+ "##d": 57,
206
+ "##f": 58,
207
+ "##l": 59,
208
+ "##b": 60,
209
+ "##u": 61,
210
+ "##o": 62,
211
+ "##6": 63,
212
+ "##0": 64,
213
+ "##g": 65,
214
+ "##x": 66,
215
+ "##7": 67,
216
+ "##y": 68,
217
+ "##j": 69,
218
+ "##q": 70,
219
+ "##4": 71,
220
+ "##5": 72,
221
+ "##9": 73,
222
+ "##8": 74,
223
+ "##ac": 75,
224
+ "##iv": 76,
225
+ "##ive": 77,
226
+ "##31": 78,
227
+ "##pa": 79,
228
+ "##on": 80,
229
+ "##re": 81,
230
+ "ad": 82,
231
+ "##os": 83,
232
+ "##om": 84,
233
+ "##sm": 85,
234
+ "##act": 86,
235
+ "##pos": 87,
236
+ "##sf": 88,
237
+ "##nom": 89,
238
+ "##acc": 90,
239
+ "##active": 91,
240
+ "##in": 92,
241
+ "##11": 93,
242
+ "##at": 94,
243
+ "##pre": 95,
244
+ "##pres": 96,
245
+ "##en": 97,
246
+ "##er": 98,
247
+ "pr": 99,
248
+ "##gen": 100,
249
+ "##presactive": 101,
250
+ "##ind": 102,
251
+ "##dat": 103,
252
+ "adj": 104,
253
+ "pron": 105,
254
+ "con": 106,
255
+ "n2": 107,
256
+ "vpa": 108,
257
+ "##pp": 109,
258
+ "##ss": 110,
259
+ "vpar": 111,
260
+ "##ppl": 112,
261
+ "conj": 113,
262
+ "n31": 114,
263
+ "##per": 115,
264
+ "##vpos": 116,
265
+ "advpos": 117,
266
+ "v31": 118,
267
+ "##um": 119,
268
+ "##pass": 120,
269
+ "##perf": 121,
270
+ "##passive": 122,
271
+ "##accsf": 123,
272
+ "##ind3": 124,
273
+ "n21": 125,
274
+ "in": 126,
275
+ "##fu": 127,
276
+ "##bl": 128,
277
+ "n11": 129,
278
+ "pre": 130,
279
+ "##sn": 131,
280
+ "##im": 132,
281
+ "##oc": 133,
282
+ "##passiveppl": 134,
283
+ "##pabl": 135,
284
+ "vpar31": 136,
285
+ "prepabl": 137,
286
+ "##32": 138,
287
+ "##sc": 139,
288
+ "##it": 140,
289
+ "##nomsf": 141,
290
+ "##datsm": 142,
291
+ "qu": 143,
292
+ "##pm": 144,
293
+ "##2s": 145,
294
+ "##li": 146,
295
+ "##nomsm": 147,
296
+ "adj11": 148,
297
+ "v31presactive": 149,
298
+ "##perfpassiveppl": 150,
299
+ "##ind3p": 151,
300
+ "##loc": 152,
301
+ "##or": 153,
302
+ "##61": 154,
303
+ "##fut": 155,
304
+ "n3": 156,
305
+ "##10": 157,
306
+ "##si": 158,
307
+ "##ar": 159,
308
+ "##ll": 160,
309
+ "##accsm": 161,
310
+ "##gensm": 162,
311
+ "pron10": 163,
312
+ "##perfactive": 164,
313
+ "et": 165,
314
+ "ex": 166,
315
+ "num": 167,
316
+ "vi": 168,
317
+ "##1presactive": 169,
318
+ "##pf": 170,
319
+ "##p2s": 171,
320
+ "##sx": 172,
321
+ "##nomsn": 173,
322
+ "##accsc": 174,
323
+ "##gensf": 175,
324
+ "##presactiveppl": 176,
325
+ "adj32": 177,
326
+ "n31accsf": 178,
327
+ "##ind3s": 179,
328
+ "##imp2s": 180,
329
+ "an": 181,
330
+ "ca": 182,
331
+ "cum": 183,
332
+ "ill": 184,
333
+ "pu": 185,
334
+ "##pe": 186,
335
+ "##px": 187,
336
+ "##st": 188,
337
+ "##te": 189,
338
+ "##41": 190,
339
+ "pron61": 191,
340
+ "n21datsm": 192,
341
+ "n33": 193,
342
+ "di": 194,
343
+ "se": 195,
344
+ "v11": 196,
345
+ "##su": 197,
346
+ "##al": 198,
347
+ "##tu": 199,
348
+ "##il": 200,
349
+ "##lv": 201,
350
+ "##ur": 202,
351
+ "##xx": 203,
352
+ "##qu": 204,
353
+ "##gensn": 205,
354
+ "##datpx": 206,
355
+ "adj1": 207,
356
+ "pron41": 208,
357
+ "n22": 209,
358
+ "vpar11": 210,
359
+ "n31loc": 211,
360
+ "v31perfactive": 212,
361
+ "n21accsm": 213,
362
+ "n11accsf": 214,
363
+ "n11nomsf": 215,
364
+ "n11gensf": 216,
365
+ "##futactive": 217,
366
+ "expe": 218,
367
+ "##accscpos": 219,
368
+ "au": 220,
369
+ "ali": 221,
370
+ "mor": 222,
371
+ "n9": 223,
372
+ "non": 224,
373
+ "si": 225,
374
+ "so": 226,
375
+ "un": 227,
376
+ "v2": 228,
377
+ "v61": 229,
378
+ "##pi": 230,
379
+ "##rtu": 231,
380
+ "##el": 232,
381
+ "##ct": 233,
382
+ "##ir": 234,
383
+ "##di": 235,
384
+ "##bil": 236,
385
+ "##un": 237,
386
+ "##8xx": 238,
387
+ "##nompm": 239,
388
+ "##accpf": 240,
389
+ "##inf": 241,
390
+ "##prespassive": 242,
391
+ "##ind2s": 243,
392
+ "##datsx": 244,
393
+ "n21gensm": 245,
394
+ "##itat": 246,
395
+ "##datsmor": 247,
396
+ "que": 248,
397
+ "##nomsmpos": 249,
398
+ "##nomsmperfpassiveppl": 250,
399
+ "v31presactiveind3p": 251,
400
+ "##futpassiveppl": 252,
401
+ "##sibil": 253,
402
+ "virtu": 254,
403
+ "##1presactiveimp2s": 255,
404
+ "adj32accscpos": 256,
405
+ "##sub": 257,
406
+ "expet": 258,
407
+ "n98xx": 259,
408
+ "v21presactiveimp2s": 260,
409
+ "##datsmord": 261,
410
+ "virtut": 262,
411
+ "n98xxm": 263,
412
+ "cl": 264,
413
+ "co": 265,
414
+ "cre": 266,
415
+ "de": 267,
416
+ "dom": 268,
417
+ "en": 269,
418
+ "ef": 270,
419
+ "lact": 271,
420
+ "ne": 272,
421
+ "n32": 273,
422
+ "sa": 274,
423
+ "su": 275,
424
+ "tre": 276,
425
+ "ter": 277,
426
+ "tur": 278,
427
+ "va": 279,
428
+ "v7": 280,
429
+ "v5": 281,
430
+ "##3p": 282,
431
+ "##34": 283,
432
+ "##1s": 284,
433
+ "##pc": 285,
434
+ "##ru": 286,
435
+ "##ef": 287,
436
+ "##eli": 288,
437
+ "##ear": 289,
438
+ "##sim": 290,
439
+ "##av": 291,
440
+ "##ab": 292,
441
+ "##abl": 293,
442
+ "##com": 294,
443
+ "##ter": 295,
444
+ "##is": 296,
445
+ "##voc": 297,
446
+ "##20": 298,
447
+ "##ly": 299,
448
+ "##0x": 300,
449
+ "##ge": 301,
450
+ "##gn": 302,
451
+ "##4nomsn": 303,
452
+ "##5nomsmpos": 304,
453
+ "##ivir": 305,
454
+ "##nomsc": 306,
455
+ "##nompc": 307,
456
+ "##accpm": 308,
457
+ "##inos": 309,
458
+ "##inar": 310,
459
+ "##ati": 311,
460
+ "##eni": 312,
461
+ "pro": 313,
462
+ "##gensx": 314,
463
+ "##datsn": 315,
464
+ "pron31": 316,
465
+ "vpar34": 317,
466
+ "n31nomsf": 318,
467
+ "n31nomsm": 319,
468
+ "n31gensf": 320,
469
+ "##accsfpos": 321,
470
+ "inv": 322,
471
+ "##fug": 323,
472
+ "##fusi": 324,
473
+ "vpar31datsm": 325,
474
+ "vpar31datpx": 326,
475
+ "vpar31accpf": 327,
476
+ "vpar31nomsmperfpassiveppl": 328,
477
+ "adj11gensm": 329,
478
+ "adj11nomsn": 330,
479
+ "v31presactiveind": 331,
480
+ "v31presactiveimp2s": 332,
481
+ "n34nomsn": 333,
482
+ "pron10nompm": 334,
483
+ "numer": 335,
484
+ "num20": 336,
485
+ "visibil": 337,
486
+ "##1presactiveind3p": 338,
487
+ "adj32nomsc": 339,
488
+ "anim": 340,
489
+ "ante": 341,
490
+ "cael": 342,
491
+ "pull": 343,
492
+ "pulv": 344,
493
+ "##str": 345,
494
+ "pron61datsx": 346,
495
+ "n33nomsf": 347,
496
+ "n33loc": 348,
497
+ "dix": 349,
498
+ "sed": 350,
499
+ "v11prespassive": 351,
500
+ "##que": 352,
501
+ "adj13": 353,
502
+ "adj15nomsmpos": 354,
503
+ "pron41gensx": 355,
504
+ "n22gensn": 356,
505
+ "n22datsn": 357,
506
+ "n31locpm": 358,
507
+ "mort": 359,
508
+ "sign": 360,
509
+ "solv": 361,
510
+ "##und": 362,
511
+ "##inf0x": 363,
512
+ "##sub3p": 364,
513
+ "domin": 365,
514
+ "enim": 366,
515
+ "n32gensn": 367,
516
+ "terr": 368,
517
+ "v51presactiveind3p": 369,
518
+ "##elic": 370,
519
+ "##early": 371,
520
+ "##comp": 372,
521
+ "##vocsm": 373,
522
+ "##nompcpresactiveppl": 374,
523
+ "vpar31datpxpresactiveppl": 375,
524
+ "vpar31accpfperfpassiveppl": 376,
525
+ "adj11gensmpos": 377,
526
+ "num20datsmord": 378,
527
+ "adj32nomscpos": 379,
528
+ "pulvinar": 380,
529
+ "3r": 381,
530
+ "ar": 382,
531
+ "ae": 383,
532
+ "at": 384,
533
+ "ab": 385,
534
+ "bivir": 386,
535
+ "cu": 387,
536
+ "cen": 388,
537
+ "car": 389,
538
+ "cur": 390,
539
+ "cir": 391,
540
+ "cru": 392,
541
+ "da": 393,
542
+ "dum": 394,
543
+ "er": 395,
544
+ "es": 396,
545
+ "el": 397,
546
+ "eg": 398,
547
+ "ess": 399,
548
+ "equ": 400,
549
+ "fi": 401,
550
+ "fu": 402,
551
+ "fac": 403,
552
+ "fund": 404,
553
+ "felic": 405,
554
+ "ho": 406,
555
+ "ip": 407,
556
+ "ir": 408,
557
+ "im": 409,
558
+ "iu": 410,
559
+ "le": 411,
560
+ "lon": 412,
561
+ "lat": 413,
562
+ "lum": 414,
563
+ "loc": 415,
564
+ "ma": 416,
565
+ "mo": 417,
566
+ "min": 418,
567
+ "ni": 419,
568
+ "nat": 420,
569
+ "nun": 421,
570
+ "nav": 422,
571
+ "of": 423,
572
+ "ob": 424,
573
+ "oper": 425,
574
+ "par": 426,
575
+ "rab": 427,
576
+ "rati": 428,
577
+ "spe": 429,
578
+ "sal": 430,
579
+ "sur": 431,
580
+ "tu": 432,
581
+ "to": 433,
582
+ "ur": 434,
583
+ "ve": 435,
584
+ "vac": 436,
585
+ "viv": 437,
586
+ "voc": 438,
587
+ "v32": 439,
588
+ "vit": 440,
589
+ "v41": 441,
590
+ "vel": 442,
591
+ "veni": 443,
592
+ "xxx": 444,
593
+ "##3presactive": 445,
594
+ "##1p": 446,
595
+ "##12": 447,
596
+ "##1nom": 448,
597
+ "##1abl": 449,
598
+ "##pt": 450,
599
+ "##pon": 451,
600
+ "##pacc": 452,
601
+ "##et": 453,
602
+ "##em": 454,
603
+ "##ed": 455,
604
+ "##eo": 456,
605
+ "##ex": 457,
606
+ "##ect": 458,
607
+ "##sv": 459,
608
+ "##spos": 460,
609
+ "##spi": 461,
610
+ "##an": 462,
611
+ "##ass": 463,
612
+ "##aef": 464,
613
+ "##age": 465,
614
+ "##ci": 466,
615
+ "##cum": 467,
616
+ "##car": 468,
617
+ "##cund": 469,
618
+ "##tr": 470,
619
+ "##til": 471,
620
+ "##ic": 472,
621
+ "##isibil": 473,
622
+ "##mat": 474,
623
+ "##mef": 475,
624
+ "##2p": 476,
625
+ "##2nomsm": 477,
626
+ "##21nom": 478,
627
+ "##nct": 479,
628
+ "##nis": 480,
629
+ "##dx": 481,
630
+ "##delic": 482,
631
+ "##dex": 483,
632
+ "##fen": 484,
633
+ "##fect": 485,
634
+ "##fan": 486,
635
+ "##lum": 487,
636
+ "##ul": 488,
637
+ "##usv": 489,
638
+ "##62nomsm": 490,
639
+ "##gi": 491,
640
+ "##gy": 492,
641
+ "##gli": 493,
642
+ "##ginos": 494,
643
+ "##xage": 495,
644
+ "##51abl": 496,
645
+ "##ivi": 497,
646
+ "##31accscpos": 498,
647
+ "##patr": 499,
648
+ "##req": 500,
649
+ "adtu": 501,
650
+ "##smcar": 502,
651
+ "##posinf": 503,
652
+ "##sfearly": 504,
653
+ "##nompf": 505,
654
+ "##inx": 506,
655
+ "##11abl": 507,
656
+ "##press": 508,
657
+ "##presind3s": 509,
658
+ "praef": 510,
659
+ "##genpm": 511,
660
+ "##genpf": 512,
661
+ "##genpx": 513,
662
+ "##genter": 514,
663
+ "##presactiveind3s": 515,
664
+ "##ind1s": 516,
665
+ "##datsf": 517,
666
+ "adj31accscpos": 518,
667
+ "pron62nomsm": 519,
668
+ "pron51abl": 520,
669
+ "consu": 521,
670
+ "##sser": 522,
671
+ "vpar32": 523,
672
+ "vpar21nom": 524,
673
+ "n31accsm": 525,
674
+ "v31futactive": 526,
675
+ "v31prespassive": 527,
676
+ "v31presind3s": 528,
677
+ "##ump": 529,
678
+ "##passiveind3p": 530,
679
+ "##accsffutpassiveppl": 531,
680
+ "n21loc": 532,
681
+ "n21vocsm": 533,
682
+ "n21datsf": 534,
683
+ "inter": 535,
684
+ "infusi": 536,
685
+ "index": 537,
686
+ "infan": 538,
687
+ "##fus": 539,
688
+ "prepacc": 540,
689
+ "vpar31gensm": 541,
690
+ "vpar31vocsm": 542,
691
+ "vpar31nompcpresactiveppl": 543,
692
+ "##scul": 544,
693
+ "##iter": 545,
694
+ "##itusv": 546,
695
+ "##nomsfpos": 547,
696
+ "##liginos": 548,
697
+ "adj11accsc": 549,
698
+ "adj11nomsmpos": 550,
699
+ "adj11accsfpos": 551,
700
+ "adj11genpm": 552,
701
+ "adj11nomsfpos": 553,
702
+ "v31presactiveind3s": 554,
703
+ "v31presactiveinf0x": 555,
704
+ "##lociter": 556,
705
+ "##oritat": 557,
706
+ "##futpassiveind3p": 558,
707
+ "##sili": 559,
708
+ "##gensmfutpassiveppl": 560,
709
+ "pron10accsf": 561,
710
+ "pron10nomsf": 562,
711
+ "pron10accsm": 563,
712
+ "pron10nomsn": 564,
713
+ "pron10nompf": 565,
714
+ "##perfactiveind3s": 566,
715
+ "##perfactiveind2s": 567,
716
+ "##perfactivesub3p": 568,
717
+ "exiv": 569,
718
+ "exsili": 570,
719
+ "num12": 571,
720
+ "num11abl": 572,
721
+ "videlic": 573,
722
+ "##1presactiveind3s": 574,
723
+ "##sxpresactiveppl": 575,
724
+ "##accscpresactiveppl": 576,
725
+ "adj32genpx": 577,
726
+ "ann": 578,
727
+ "castr": 579,
728
+ "caed": 580,
729
+ "caliginos": 581,
730
+ "put": 582,
731
+ "##stin": 583,
732
+ "##tem": 584,
733
+ "##tere": 585,
734
+ "##tesim": 586,
735
+ "pron61accsf": 587,
736
+ "pron61datpx": 588,
737
+ "pron61accpm": 589,
738
+ "n33genpf": 590,
739
+ "dige": 591,
740
+ "dispos": 592,
741
+ "secund": 593,
742
+ "sexage": 594,
743
+ "v11futactive": 595,
744
+ "v11perfactiveind2s": 596,
745
+ "##alitat": 597,
746
+ "pron41accsm": 598,
747
+ "pron41datpx": 599,
748
+ "vpar11accpf": 600,
749
+ "vpar11accpm": 601,
750
+ "vpar11gensmfutpassiveppl": 602,
751
+ "vpar11accscpresactiveppl": 603,
752
+ "n31locsm": 604,
753
+ "n31locsfearly": 605,
754
+ "v31perfactiveind3p": 606,
755
+ "v31perfactiveind3s": 607,
756
+ "v31perfactiveind2s": 608,
757
+ "v31perfactivesub3p": 609,
758
+ "##futactiveppl": 610,
759
+ "##futactiveind1s": 611,
760
+ "expetere": 612,
761
+ "auct": 613,
762
+ "aufug": 614,
763
+ "autem": 615,
764
+ "aliqu": 616,
765
+ "sol": 617,
766
+ "undi": 618,
767
+ "univir": 619,
768
+ "v61presactiveind3s": 620,
769
+ "v61perfactiveind3s": 621,
770
+ "v61futactiveind1s": 622,
771
+ "##pid": 623,
772
+ "##die": 624,
773
+ "##dic": 625,
774
+ "##ind2searly": 626,
775
+ "##datsxposinf": 627,
776
+ "##sub1s": 628,
777
+ "expeto": 629,
778
+ "expetivi": 630,
779
+ "expetitusv": 631,
780
+ "cleo": 632,
781
+ "class": 633,
782
+ "colum": 634,
783
+ "codic": 635,
784
+ "cred": 636,
785
+ "creat": 637,
786
+ "effug": 638,
787
+ "effusi": 639,
788
+ "nec": 640,
789
+ "negli": 641,
790
+ "sapi": 642,
791
+ "sanct": 643,
792
+ "suspi": 644,
793
+ "sustin": 645,
794
+ "tremef": 646,
795
+ "trepid": 647,
796
+ "turp": 648,
797
+ "turb": 649,
798
+ "vas": 650,
799
+ "vascul": 651,
800
+ "v73presactive": 652,
801
+ "v71presactiveind3s": 653,
802
+ "##atio": 654,
803
+ "profect": 655,
804
+ "pron31nomsn": 656,
805
+ "pron31nompm": 657,
806
+ "vpar34nomsmperfpassiveppl": 658,
807
+ "vpar34nompcpresactiveppl": 659,
808
+ "inveni": 660,
809
+ "invisibil": 661,
810
+ "vpar31datsmperfpassiveppl": 662,
811
+ "vpar31datsmfutpassiveppl": 663,
812
+ "adj11nomsnpos": 664,
813
+ "adj11nomsncomp": 665,
814
+ "v31presactiveind1p": 666,
815
+ "v31presactiveind2p": 667,
816
+ "antepon": 668,
817
+ "##strinx": 669,
818
+ "n33locsf": 670,
819
+ "n33locpf": 671,
820
+ "v11prespassiveinf0x": 672,
821
+ "v11prespassivesub1s": 673,
822
+ "adj13accsfpos": 674,
823
+ "adj13datsxposinf": 675,
824
+ "mortalitat": 676,
825
+ "dominic": 677,
826
+ "3rd": 678,
827
+ "armat": 679,
828
+ "aegy": 680,
829
+ "atque": 681,
830
+ "cui": 682,
831
+ "centesim": 683,
832
+ "carnis": 684,
833
+ "curs": 685,
834
+ "circum": 686,
835
+ "cruc": 687,
836
+ "daem": 688,
837
+ "erump": 689,
838
+ "elab": 690,
839
+ "equit": 691,
840
+ "fili": 692,
841
+ "fug": 693,
842
+ "faci": 694,
843
+ "felicitat": 695,
844
+ "hodie": 696,
845
+ "ips": 697,
846
+ "irru": 698,
847
+ "impress": 699,
848
+ "iust": 700,
849
+ "lesser": 701,
850
+ "longi": 702,
851
+ "latit": 703,
852
+ "luminos": 704,
853
+ "mai": 705,
854
+ "mod": 706,
855
+ "minor": 707,
856
+ "nisi": 708,
857
+ "natal": 709,
858
+ "nunc": 710,
859
+ "offen": 711,
860
+ "obstrinx": 712,
861
+ "operatio": 713,
862
+ "parit": 714,
863
+ "ration": 715,
864
+ "speci": 716,
865
+ "surg": 717,
866
+ "tot": 718,
867
+ "urb": 719,
868
+ "velociter": 720,
869
+ "vacu": 721,
870
+ "v32perfactivesub3p": 722,
871
+ "v41futpassiveind3p": 723,
872
+ "xxxdx": 724,
873
+ "adtul": 725,
874
+ "##smcard": 726,
875
+ "praefer": 727,
876
+ "pron51ablsc": 728,
877
+ "consul": 729,
878
+ "vpar32accsffutpassiveppl": 730,
879
+ "vpar21nomsxpresactiveppl": 731,
880
+ "v31futactiveind3p": 732,
881
+ "v31prespassiveind3p": 733,
882
+ "n21locpm": 734,
883
+ "infusion": 735,
884
+ "infantil": 736,
885
+ "vpar31gensmperfpassiveppl": 737,
886
+ "vpar31vocsmperfpassiveppl": 738,
887
+ "adj11accsccomp": 739,
888
+ "adj11genpmpos": 740,
889
+ "num12datsmord": 741,
890
+ "num11ablsmcard": 742,
891
+ "videlicet": 743,
892
+ "adj32genpxpos": 744,
893
+ "digest": 745,
894
+ "disposit": 746,
895
+ "sexagesim": 747,
896
+ "v11futactiveimp2s": 748,
897
+ "vpar11accpffutactiveppl": 749,
898
+ "vpar11accpmperfpassiveppl": 750,
899
+ "auctoritat": 751,
900
+ "undique": 752,
901
+ "cleopatr": 753,
902
+ "classis": 754,
903
+ "columb": 755,
904
+ "effugav": 756,
905
+ "effusio": 757,
906
+ "negligenter": 758,
907
+ "suspic": 759,
908
+ "tremefact": 760,
909
+ "v73presactiveind2searly": 761,
910
+ "profecto": 762,
911
+ "adj13datsxposinfreq": 763,
912
+ "aegypt": 764,
913
+ "circumfus": 765,
914
+ "daemon": 766,
915
+ "offend": 767,
916
+ "special": 768
917
+ }
918
+ }
919
+ }
tokenizer_config.json ADDED
@@ -0,0 +1,14 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "cls_token": "[CLS]",
3
+ "do_lower_case": true,
4
+ "mask_token": "[MASK]",
5
+ "model_max_length": 512,
6
+ "name_or_path": "bert-base-uncased",
7
+ "pad_token": "[PAD]",
8
+ "sep_token": "[SEP]",
9
+ "special_tokens_map_file": null,
10
+ "strip_accents": null,
11
+ "tokenize_chinese_chars": true,
12
+ "tokenizer_class": "BertTokenizer",
13
+ "unk_token": "[UNK]"
14
+ }
vocab.txt ADDED
@@ -0,0 +1,769 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ [PAD]
2
+ [UNK]
3
+ [CLS]
4
+ [SEP]
5
+ [MASK]
6
+ (
7
+ )
8
+ ,
9
+ 0
10
+ 1
11
+ 2
12
+ 3
13
+ 4
14
+ 5
15
+ 6
16
+ 7
17
+ 8
18
+ 9
19
+ [
20
+ ]
21
+ a
22
+ b
23
+ c
24
+ d
25
+ e
26
+ f
27
+ g
28
+ h
29
+ i
30
+ j
31
+ l
32
+ m
33
+ n
34
+ o
35
+ p
36
+ q
37
+ r
38
+ s
39
+ t
40
+ u
41
+ v
42
+ x
43
+ y
44
+ ##3
45
+ ##1
46
+ ##p
47
+ ##r
48
+ ##e
49
+ ##s
50
+ ##a
51
+ ##c
52
+ ##t
53
+ ##i
54
+ ##v
55
+ ##m
56
+ ##2
57
+ ##n
58
+ ##d
59
+ ##f
60
+ ##l
61
+ ##b
62
+ ##u
63
+ ##o
64
+ ##6
65
+ ##0
66
+ ##g
67
+ ##x
68
+ ##7
69
+ ##y
70
+ ##j
71
+ ##q
72
+ ##4
73
+ ##5
74
+ ##9
75
+ ##8
76
+ ##ac
77
+ ##iv
78
+ ##ive
79
+ ##31
80
+ ##pa
81
+ ##on
82
+ ##re
83
+ ad
84
+ ##os
85
+ ##om
86
+ ##sm
87
+ ##act
88
+ ##pos
89
+ ##sf
90
+ ##nom
91
+ ##acc
92
+ ##active
93
+ ##in
94
+ ##11
95
+ ##at
96
+ ##pre
97
+ ##pres
98
+ ##en
99
+ ##er
100
+ pr
101
+ ##gen
102
+ ##presactive
103
+ ##ind
104
+ ##dat
105
+ adj
106
+ pron
107
+ con
108
+ n2
109
+ vpa
110
+ ##pp
111
+ ##ss
112
+ vpar
113
+ ##ppl
114
+ conj
115
+ n31
116
+ ##per
117
+ ##vpos
118
+ advpos
119
+ v31
120
+ ##um
121
+ ##pass
122
+ ##perf
123
+ ##passive
124
+ ##accsf
125
+ ##ind3
126
+ n21
127
+ in
128
+ ##fu
129
+ ##bl
130
+ n11
131
+ pre
132
+ ##sn
133
+ ##im
134
+ ##oc
135
+ ##passiveppl
136
+ ##pabl
137
+ vpar31
138
+ prepabl
139
+ ##32
140
+ ##sc
141
+ ##it
142
+ ##nomsf
143
+ ##datsm
144
+ qu
145
+ ##pm
146
+ ##2s
147
+ ##li
148
+ ##nomsm
149
+ adj11
150
+ v31presactive
151
+ ##perfpassiveppl
152
+ ##ind3p
153
+ ##loc
154
+ ##or
155
+ ##61
156
+ ##fut
157
+ n3
158
+ ##10
159
+ ##si
160
+ ##ar
161
+ ##ll
162
+ ##accsm
163
+ ##gensm
164
+ pron10
165
+ ##perfactive
166
+ et
167
+ ex
168
+ num
169
+ vi
170
+ ##1presactive
171
+ ##pf
172
+ ##p2s
173
+ ##sx
174
+ ##nomsn
175
+ ##accsc
176
+ ##gensf
177
+ ##presactiveppl
178
+ adj32
179
+ n31accsf
180
+ ##ind3s
181
+ ##imp2s
182
+ an
183
+ ca
184
+ cum
185
+ ill
186
+ pu
187
+ ##pe
188
+ ##px
189
+ ##st
190
+ ##te
191
+ ##41
192
+ pron61
193
+ n21datsm
194
+ n33
195
+ di
196
+ se
197
+ v11
198
+ ##su
199
+ ##al
200
+ ##tu
201
+ ##il
202
+ ##lv
203
+ ##ur
204
+ ##xx
205
+ ##qu
206
+ ##gensn
207
+ ##datpx
208
+ adj1
209
+ pron41
210
+ n22
211
+ vpar11
212
+ n31loc
213
+ v31perfactive
214
+ n21accsm
215
+ n11accsf
216
+ n11nomsf
217
+ n11gensf
218
+ ##futactive
219
+ expe
220
+ ##accscpos
221
+ au
222
+ ali
223
+ mor
224
+ n9
225
+ non
226
+ si
227
+ so
228
+ un
229
+ v2
230
+ v61
231
+ ##pi
232
+ ##rtu
233
+ ##el
234
+ ##ct
235
+ ##ir
236
+ ##di
237
+ ##bil
238
+ ##un
239
+ ##8xx
240
+ ##nompm
241
+ ##accpf
242
+ ##inf
243
+ ##prespassive
244
+ ##ind2s
245
+ ##datsx
246
+ n21gensm
247
+ ##itat
248
+ ##datsmor
249
+ que
250
+ ##nomsmpos
251
+ ##nomsmperfpassiveppl
252
+ v31presactiveind3p
253
+ ##futpassiveppl
254
+ ##sibil
255
+ virtu
256
+ ##1presactiveimp2s
257
+ adj32accscpos
258
+ ##sub
259
+ expet
260
+ n98xx
261
+ v21presactiveimp2s
262
+ ##datsmord
263
+ virtut
264
+ n98xxm
265
+ cl
266
+ co
267
+ cre
268
+ de
269
+ dom
270
+ en
271
+ ef
272
+ lact
273
+ ne
274
+ n32
275
+ sa
276
+ su
277
+ tre
278
+ ter
279
+ tur
280
+ va
281
+ v7
282
+ v5
283
+ ##3p
284
+ ##34
285
+ ##1s
286
+ ##pc
287
+ ##ru
288
+ ##ef
289
+ ##eli
290
+ ##ear
291
+ ##sim
292
+ ##av
293
+ ##ab
294
+ ##abl
295
+ ##com
296
+ ##ter
297
+ ##is
298
+ ##voc
299
+ ##20
300
+ ##ly
301
+ ##0x
302
+ ##ge
303
+ ##gn
304
+ ##4nomsn
305
+ ##5nomsmpos
306
+ ##ivir
307
+ ##nomsc
308
+ ##nompc
309
+ ##accpm
310
+ ##inos
311
+ ##inar
312
+ ##ati
313
+ ##eni
314
+ pro
315
+ ##gensx
316
+ ##datsn
317
+ pron31
318
+ vpar34
319
+ n31nomsf
320
+ n31nomsm
321
+ n31gensf
322
+ ##accsfpos
323
+ inv
324
+ ##fug
325
+ ##fusi
326
+ vpar31datsm
327
+ vpar31datpx
328
+ vpar31accpf
329
+ vpar31nomsmperfpassiveppl
330
+ adj11gensm
331
+ adj11nomsn
332
+ v31presactiveind
333
+ v31presactiveimp2s
334
+ n34nomsn
335
+ pron10nompm
336
+ numer
337
+ num20
338
+ visibil
339
+ ##1presactiveind3p
340
+ adj32nomsc
341
+ anim
342
+ ante
343
+ cael
344
+ pull
345
+ pulv
346
+ ##str
347
+ pron61datsx
348
+ n33nomsf
349
+ n33loc
350
+ dix
351
+ sed
352
+ v11prespassive
353
+ ##que
354
+ adj13
355
+ adj15nomsmpos
356
+ pron41gensx
357
+ n22gensn
358
+ n22datsn
359
+ n31locpm
360
+ mort
361
+ sign
362
+ solv
363
+ ##und
364
+ ##inf0x
365
+ ##sub3p
366
+ domin
367
+ enim
368
+ n32gensn
369
+ terr
370
+ v51presactiveind3p
371
+ ##elic
372
+ ##early
373
+ ##comp
374
+ ##vocsm
375
+ ##nompcpresactiveppl
376
+ vpar31datpxpresactiveppl
377
+ vpar31accpfperfpassiveppl
378
+ adj11gensmpos
379
+ num20datsmord
380
+ adj32nomscpos
381
+ pulvinar
382
+ 3r
383
+ ar
384
+ ae
385
+ at
386
+ ab
387
+ bivir
388
+ cu
389
+ cen
390
+ car
391
+ cur
392
+ cir
393
+ cru
394
+ da
395
+ dum
396
+ er
397
+ es
398
+ el
399
+ eg
400
+ ess
401
+ equ
402
+ fi
403
+ fu
404
+ fac
405
+ fund
406
+ felic
407
+ ho
408
+ ip
409
+ ir
410
+ im
411
+ iu
412
+ le
413
+ lon
414
+ lat
415
+ lum
416
+ loc
417
+ ma
418
+ mo
419
+ min
420
+ ni
421
+ nat
422
+ nun
423
+ nav
424
+ of
425
+ ob
426
+ oper
427
+ par
428
+ rab
429
+ rati
430
+ spe
431
+ sal
432
+ sur
433
+ tu
434
+ to
435
+ ur
436
+ ve
437
+ vac
438
+ viv
439
+ voc
440
+ v32
441
+ vit
442
+ v41
443
+ vel
444
+ veni
445
+ xxx
446
+ ##3presactive
447
+ ##1p
448
+ ##12
449
+ ##1nom
450
+ ##1abl
451
+ ##pt
452
+ ##pon
453
+ ##pacc
454
+ ##et
455
+ ##em
456
+ ##ed
457
+ ##eo
458
+ ##ex
459
+ ##ect
460
+ ##sv
461
+ ##spos
462
+ ##spi
463
+ ##an
464
+ ##ass
465
+ ##aef
466
+ ##age
467
+ ##ci
468
+ ##cum
469
+ ##car
470
+ ##cund
471
+ ##tr
472
+ ##til
473
+ ##ic
474
+ ##isibil
475
+ ##mat
476
+ ##mef
477
+ ##2p
478
+ ##2nomsm
479
+ ##21nom
480
+ ##nct
481
+ ##nis
482
+ ##dx
483
+ ##delic
484
+ ##dex
485
+ ##fen
486
+ ##fect
487
+ ##fan
488
+ ##lum
489
+ ##ul
490
+ ##usv
491
+ ##62nomsm
492
+ ##gi
493
+ ##gy
494
+ ##gli
495
+ ##ginos
496
+ ##xage
497
+ ##51abl
498
+ ##ivi
499
+ ##31accscpos
500
+ ##patr
501
+ ##req
502
+ adtu
503
+ ##smcar
504
+ ##posinf
505
+ ##sfearly
506
+ ##nompf
507
+ ##inx
508
+ ##11abl
509
+ ##press
510
+ ##presind3s
511
+ praef
512
+ ##genpm
513
+ ##genpf
514
+ ##genpx
515
+ ##genter
516
+ ##presactiveind3s
517
+ ##ind1s
518
+ ##datsf
519
+ adj31accscpos
520
+ pron62nomsm
521
+ pron51abl
522
+ consu
523
+ ##sser
524
+ vpar32
525
+ vpar21nom
526
+ n31accsm
527
+ v31futactive
528
+ v31prespassive
529
+ v31presind3s
530
+ ##ump
531
+ ##passiveind3p
532
+ ##accsffutpassiveppl
533
+ n21loc
534
+ n21vocsm
535
+ n21datsf
536
+ inter
537
+ infusi
538
+ index
539
+ infan
540
+ ##fus
541
+ prepacc
542
+ vpar31gensm
543
+ vpar31vocsm
544
+ vpar31nompcpresactiveppl
545
+ ##scul
546
+ ##iter
547
+ ##itusv
548
+ ##nomsfpos
549
+ ##liginos
550
+ adj11accsc
551
+ adj11nomsmpos
552
+ adj11accsfpos
553
+ adj11genpm
554
+ adj11nomsfpos
555
+ v31presactiveind3s
556
+ v31presactiveinf0x
557
+ ##lociter
558
+ ##oritat
559
+ ##futpassiveind3p
560
+ ##sili
561
+ ##gensmfutpassiveppl
562
+ pron10accsf
563
+ pron10nomsf
564
+ pron10accsm
565
+ pron10nomsn
566
+ pron10nompf
567
+ ##perfactiveind3s
568
+ ##perfactiveind2s
569
+ ##perfactivesub3p
570
+ exiv
571
+ exsili
572
+ num12
573
+ num11abl
574
+ videlic
575
+ ##1presactiveind3s
576
+ ##sxpresactiveppl
577
+ ##accscpresactiveppl
578
+ adj32genpx
579
+ ann
580
+ castr
581
+ caed
582
+ caliginos
583
+ put
584
+ ##stin
585
+ ##tem
586
+ ##tere
587
+ ##tesim
588
+ pron61accsf
589
+ pron61datpx
590
+ pron61accpm
591
+ n33genpf
592
+ dige
593
+ dispos
594
+ secund
595
+ sexage
596
+ v11futactive
597
+ v11perfactiveind2s
598
+ ##alitat
599
+ pron41accsm
600
+ pron41datpx
601
+ vpar11accpf
602
+ vpar11accpm
603
+ vpar11gensmfutpassiveppl
604
+ vpar11accscpresactiveppl
605
+ n31locsm
606
+ n31locsfearly
607
+ v31perfactiveind3p
608
+ v31perfactiveind3s
609
+ v31perfactiveind2s
610
+ v31perfactivesub3p
611
+ ##futactiveppl
612
+ ##futactiveind1s
613
+ expetere
614
+ auct
615
+ aufug
616
+ autem
617
+ aliqu
618
+ sol
619
+ undi
620
+ univir
621
+ v61presactiveind3s
622
+ v61perfactiveind3s
623
+ v61futactiveind1s
624
+ ##pid
625
+ ##die
626
+ ##dic
627
+ ##ind2searly
628
+ ##datsxposinf
629
+ ##sub1s
630
+ expeto
631
+ expetivi
632
+ expetitusv
633
+ cleo
634
+ class
635
+ colum
636
+ codic
637
+ cred
638
+ creat
639
+ effug
640
+ effusi
641
+ nec
642
+ negli
643
+ sapi
644
+ sanct
645
+ suspi
646
+ sustin
647
+ tremef
648
+ trepid
649
+ turp
650
+ turb
651
+ vas
652
+ vascul
653
+ v73presactive
654
+ v71presactiveind3s
655
+ ##atio
656
+ profect
657
+ pron31nomsn
658
+ pron31nompm
659
+ vpar34nomsmperfpassiveppl
660
+ vpar34nompcpresactiveppl
661
+ inveni
662
+ invisibil
663
+ vpar31datsmperfpassiveppl
664
+ vpar31datsmfutpassiveppl
665
+ adj11nomsnpos
666
+ adj11nomsncomp
667
+ v31presactiveind1p
668
+ v31presactiveind2p
669
+ antepon
670
+ ##strinx
671
+ n33locsf
672
+ n33locpf
673
+ v11prespassiveinf0x
674
+ v11prespassivesub1s
675
+ adj13accsfpos
676
+ adj13datsxposinf
677
+ mortalitat
678
+ dominic
679
+ 3rd
680
+ armat
681
+ aegy
682
+ atque
683
+ cui
684
+ centesim
685
+ carnis
686
+ curs
687
+ circum
688
+ cruc
689
+ daem
690
+ erump
691
+ elab
692
+ equit
693
+ fili
694
+ fug
695
+ faci
696
+ felicitat
697
+ hodie
698
+ ips
699
+ irru
700
+ impress
701
+ iust
702
+ lesser
703
+ longi
704
+ latit
705
+ luminos
706
+ mai
707
+ mod
708
+ minor
709
+ nisi
710
+ natal
711
+ nunc
712
+ offen
713
+ obstrinx
714
+ operatio
715
+ parit
716
+ ration
717
+ speci
718
+ surg
719
+ tot
720
+ urb
721
+ velociter
722
+ vacu
723
+ v32perfactivesub3p
724
+ v41futpassiveind3p
725
+ xxxdx
726
+ adtul
727
+ ##smcard
728
+ praefer
729
+ pron51ablsc
730
+ consul
731
+ vpar32accsffutpassiveppl
732
+ vpar21nomsxpresactiveppl
733
+ v31futactiveind3p
734
+ v31prespassiveind3p
735
+ n21locpm
736
+ infusion
737
+ infantil
738
+ vpar31gensmperfpassiveppl
739
+ vpar31vocsmperfpassiveppl
740
+ adj11accsccomp
741
+ adj11genpmpos
742
+ num12datsmord
743
+ num11ablsmcard
744
+ videlicet
745
+ adj32genpxpos
746
+ digest
747
+ disposit
748
+ sexagesim
749
+ v11futactiveimp2s
750
+ vpar11accpffutactiveppl
751
+ vpar11accpmperfpassiveppl
752
+ auctoritat
753
+ undique
754
+ cleopatr
755
+ classis
756
+ columb
757
+ effugav
758
+ effusio
759
+ negligenter
760
+ suspic
761
+ tremefact
762
+ v73presactiveind2searly
763
+ profecto
764
+ adj13datsxposinfreq
765
+ aegypt
766
+ circumfus
767
+ daemon
768
+ offend
769
+ special