kiansheik commited on
Commit
79bb7c9
1 Parent(s): fb73f01

finer with more change

Browse files
Files changed (4) hide show
  1. config.json +1 -1
  2. model.safetensors +1 -1
  3. special_tokens_map.json +105 -105
  4. tokenizer_config.json +87 -87
config.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "_name_or_path": "models/t5-1.0/",
3
  "architectures": [
4
  "T5ForConditionalGeneration"
5
  ],
 
1
  {
2
+ "_name_or_path": "models/t5-1.2_space/",
3
  "architectures": [
4
  "T5ForConditionalGeneration"
5
  ],
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7407150199f25a66d3268c2b4d94f2f965616a84fc9451a83bd1b8faba868982
3
  size 242181160
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0fe61be34df708adcf77500af072bfbd4f46352cd355b889ed6b3246145db0bd
3
  size 242181160
special_tokens_map.json CHANGED
@@ -1,735 +1,735 @@
1
  {
2
  "additional_special_tokens": [
3
  {
4
- "content": "e'ym",
5
  "lstrip": false,
6
  "normalized": false,
7
  "rstrip": false,
8
  "single_word": false
9
  },
10
  {
11
- "content": "îepé",
12
  "lstrip": false,
13
  "normalized": false,
14
  "rstrip": false,
15
  "single_word": false
16
  },
17
  {
18
- "content": "[ROOT]",
19
  "lstrip": false,
20
  "normalized": false,
21
  "rstrip": false,
22
  "single_word": false
23
  },
24
  {
25
- "content": "[PLURIFORM_PREFIX:S]",
26
  "lstrip": false,
27
  "normalized": false,
28
  "rstrip": false,
29
  "single_word": false
30
  },
31
  {
32
- "content": "[OBJECT:1ps]",
33
  "lstrip": false,
34
  "normalized": false,
35
  "rstrip": false,
36
  "single_word": false
37
  },
38
  {
39
- "content": "[GERUND_SUFFIX:CLASS_1]",
40
  "lstrip": false,
41
  "normalized": false,
42
  "rstrip": false,
43
  "single_word": false
44
  },
45
  {
46
- "content": "[OBJECT:2ps:SUBJECT_1P]",
47
  "lstrip": false,
48
  "normalized": false,
49
  "rstrip": false,
50
  "single_word": false
51
  },
52
  {
53
- "content": "[NEGATION_PARTICLE:NA]",
54
  "lstrip": false,
55
  "normalized": false,
56
  "rstrip": false,
57
  "single_word": false
58
  },
59
  {
60
- "content": "îe",
61
  "lstrip": false,
62
  "normalized": false,
63
  "rstrip": false,
64
  "single_word": false
65
  },
66
  {
67
- "content": "́",
68
  "lstrip": false,
69
  "normalized": false,
70
  "rstrip": false,
71
  "single_word": false
72
  },
73
  {
74
- "content": "amo",
75
  "lstrip": false,
76
  "normalized": false,
77
  "rstrip": false,
78
  "single_word": false
79
  },
80
  {
81
- "content": "[GERUND_SUBJECT_PREFIX:1ppi]",
82
  "lstrip": false,
83
  "normalized": false,
84
  "rstrip": false,
85
  "single_word": false
86
  },
87
  {
88
- "content": "îa",
89
  "lstrip": false,
90
  "normalized": false,
91
  "rstrip": false,
92
  "single_word": false
93
  },
94
  {
95
- "content": "umẽ",
96
  "lstrip": false,
97
  "normalized": false,
98
  "rstrip": false,
99
  "single_word": false
100
  },
101
  {
102
- "content": "[GERUND_SUBJECT_PREFIX:1ps]",
103
  "lstrip": false,
104
  "normalized": false,
105
  "rstrip": false,
106
  "single_word": false
107
  },
108
  {
109
- "content": "o",
110
  "lstrip": false,
111
  "normalized": false,
112
  "rstrip": false,
113
  "single_word": false
114
  },
115
  {
116
- "content": "[SUBJECT_PREFIX:1ppi]",
117
  "lstrip": false,
118
  "normalized": false,
119
  "rstrip": false,
120
  "single_word": false
121
  },
122
  {
123
- "content": "[IMPERATIVE_PREFIX:2pp]",
124
  "lstrip": false,
125
  "normalized": false,
126
  "rstrip": false,
127
  "single_word": false
128
  },
129
  {
130
- "content": "xe",
131
  "lstrip": false,
132
  "normalized": false,
133
  "rstrip": false,
134
  "single_word": false
135
  },
136
  {
137
- "content": "[SUBJECT_PREFIX:1ps]",
138
  "lstrip": false,
139
  "normalized": false,
140
  "rstrip": false,
141
  "single_word": false
142
  },
143
  {
144
- "content": "[PLURIFORM_PREFIX:R]",
145
  "lstrip": false,
146
  "normalized": false,
147
  "rstrip": false,
148
  "single_word": false
149
  },
150
  {
151
- "content": "í",
152
  "lstrip": false,
153
  "normalized": false,
154
  "rstrip": false,
155
  "single_word": false
156
  },
157
  {
158
- "content": "n'",
159
  "lstrip": false,
160
  "normalized": false,
161
  "rstrip": false,
162
  "single_word": false
163
  },
164
  {
165
- "content": "[OBJECT:2pp:SUBJECT_1P]",
166
  "lstrip": false,
167
  "normalized": false,
168
  "rstrip": false,
169
  "single_word": false
170
  },
171
  {
172
- "content": "[PERMISSIVE_PREFIX:CONSONANT]",
173
  "lstrip": false,
174
  "normalized": false,
175
  "rstrip": false,
176
  "single_word": false
177
  },
178
  {
179
- "content": "[SUBJECT:1ps]",
180
  "lstrip": false,
181
  "normalized": false,
182
  "rstrip": false,
183
  "single_word": false
184
  },
185
  {
186
- "content": "î",
187
  "lstrip": false,
188
  "normalized": false,
189
  "rstrip": false,
190
  "single_word": false
191
  },
192
  {
193
- "content": "[SUBJECT:2ps]",
194
  "lstrip": false,
195
  "normalized": false,
196
  "rstrip": false,
197
  "single_word": false
198
  },
199
  {
200
- "content": "[OBJECT_MARKER:3p:PLURIFORM_PREFIX:MONOSYLLABIC]",
201
  "lstrip": false,
202
  "normalized": false,
203
  "rstrip": false,
204
  "single_word": false
205
  },
206
  {
207
- "content": "pe",
208
  "lstrip": false,
209
  "normalized": false,
210
  "rstrip": false,
211
  "single_word": false
212
  },
213
  {
214
- "content": "[NEGATION_PREFIX]",
215
  "lstrip": false,
216
  "normalized": false,
217
  "rstrip": false,
218
  "single_word": false
219
  },
220
  {
221
- "content": "[OBJECT:2pp]",
222
  "lstrip": false,
223
  "normalized": false,
224
  "rstrip": false,
225
  "single_word": false
226
  },
227
  {
228
- "content": "abo",
229
  "lstrip": false,
230
  "normalized": false,
231
  "rstrip": false,
232
  "single_word": false
233
  },
234
  {
235
- "content": "na",
236
  "lstrip": false,
237
  "normalized": false,
238
  "rstrip": false,
239
  "single_word": false
240
  },
241
  {
242
- "content": "[GERUND_SUFFIX:CLASS_1:R]",
243
  "lstrip": false,
244
  "normalized": false,
245
  "rstrip": false,
246
  "single_word": false
247
  },
248
  {
249
- "content": "[SUBJECT_PREFIX:3p]",
250
  "lstrip": false,
251
  "normalized": false,
252
  "rstrip": false,
253
  "single_word": false
254
  },
255
  {
256
- "content": "[OBJECT:1ppi]",
257
  "lstrip": false,
258
  "normalized": false,
259
  "rstrip": false,
260
  "single_word": false
261
  },
262
  {
263
- "content": "[NEGATION_PARTICLE:UME]",
264
  "lstrip": false,
265
  "normalized": false,
266
  "rstrip": false,
267
  "single_word": false
268
  },
269
  {
270
- "content": "îandé",
271
  "lstrip": false,
272
  "normalized": false,
273
  "rstrip": false,
274
  "single_word": false
275
  },
276
  {
277
- "content": "[GERUND_SUFFIX:CLASS_1:ORAL_VOWEL]",
278
  "lstrip": false,
279
  "normalized": false,
280
  "rstrip": false,
281
  "single_word": false
282
  },
283
  {
284
- "content": "[NEGATION_SUFFIX:CONSONANT_ENDING]",
285
  "lstrip": false,
286
  "normalized": false,
287
  "rstrip": false,
288
  "single_word": false
289
  },
290
  {
291
- "content": "[GERUND_SUBJECT_PREFIX:2pp]",
292
  "lstrip": false,
293
  "normalized": false,
294
  "rstrip": false,
295
  "single_word": false
296
  },
297
  {
298
- "content": "[CIRCUMSTANTIAL_SUFFIX:CONSONANT_ENDING]",
299
  "lstrip": false,
300
  "normalized": false,
301
  "rstrip": false,
302
  "single_word": false
303
  },
304
  {
305
- "content": "[GERUND_SUFFIX:CLASS_2:ORAL_VOWEL_ENDING]",
306
  "lstrip": false,
307
  "normalized": false,
308
  "rstrip": false,
309
  "single_word": false
310
  },
311
  {
312
- "content": "[GERUND_SUBJECT_PREFIX:2ps]",
313
  "lstrip": false,
314
  "normalized": false,
315
  "rstrip": false,
316
  "single_word": false
317
  },
318
  {
319
- "content": "gûi",
320
  "lstrip": false,
321
  "normalized": false,
322
  "rstrip": false,
323
  "single_word": false
324
  },
325
  {
326
- "content": "ixé",
327
  "lstrip": false,
328
  "normalized": false,
329
  "rstrip": false,
330
  "single_word": false
331
  },
332
  {
333
- "content": "namo",
334
  "lstrip": false,
335
  "normalized": false,
336
  "rstrip": false,
337
  "single_word": false
338
  },
339
  {
340
- "content": "[OBJECT:3p]",
341
  "lstrip": false,
342
  "normalized": false,
343
  "rstrip": false,
344
  "single_word": false
345
  },
346
  {
347
- "content": "ere",
348
  "lstrip": false,
349
  "normalized": false,
350
  "rstrip": false,
351
  "single_word": false
352
  },
353
  {
354
- "content": "[SUBJECT:3p:DIRECT]",
355
  "lstrip": false,
356
  "normalized": false,
357
  "rstrip": false,
358
  "single_word": false
359
  },
360
  {
361
- "content": "mo",
362
  "lstrip": false,
363
  "normalized": false,
364
  "rstrip": false,
365
  "single_word": false
366
  },
367
  {
368
- "content": "[GERUND_SUFFIX:CLASS_2:NASAL_VOWEL_ENDING]",
369
  "lstrip": false,
370
  "normalized": false,
371
  "rstrip": false,
372
  "single_word": false
373
  },
374
  {
375
- "content": "[SUBJECT:1ppe]",
376
  "lstrip": false,
377
  "normalized": false,
378
  "rstrip": false,
379
  "single_word": false
380
  },
381
  {
382
- "content": "[GERUND_SUBJECT_PREFIX:3p]",
383
  "lstrip": false,
384
  "normalized": false,
385
  "rstrip": false,
386
  "single_word": false
387
  },
388
  {
389
- "content": "[OBJECT_MARKER:3p:DEFAULT]",
390
  "lstrip": false,
391
  "normalized": false,
392
  "rstrip": false,
393
  "single_word": false
394
  },
395
  {
396
- "content": "[SUBJECT:1ppi]",
397
  "lstrip": false,
398
  "normalized": false,
399
  "rstrip": false,
400
  "single_word": false
401
  },
402
  {
403
- "content": "[GERUND_SUFFIX:CLASS_1:NASAL_VOWEL]",
404
  "lstrip": false,
405
  "normalized": false,
406
  "rstrip": false,
407
  "single_word": false
408
  },
409
  {
410
- "content": "peẽ",
411
  "lstrip": false,
412
  "normalized": false,
413
  "rstrip": false,
414
  "single_word": false
415
  },
416
  {
417
- "content": "s",
418
  "lstrip": false,
419
  "normalized": false,
420
  "rstrip": false,
421
  "single_word": false
422
  },
423
  {
424
- "content": "[SUBJECT:3p]",
425
  "lstrip": false,
426
  "normalized": false,
427
  "rstrip": false,
428
  "single_word": false
429
  },
430
  {
431
- "content": "û",
432
  "lstrip": false,
433
  "normalized": false,
434
  "rstrip": false,
435
  "single_word": false
436
  },
437
  {
438
- "content": "[SUBJECT:2ps:OBJECT_1P]",
439
  "lstrip": false,
440
  "normalized": false,
441
  "rstrip": false,
442
  "single_word": false
443
  },
444
  {
445
- "content": "îos",
446
  "lstrip": false,
447
  "normalized": false,
448
  "rstrip": false,
449
  "single_word": false
450
  },
451
  {
452
- "content": "nde",
453
  "lstrip": false,
454
  "normalized": false,
455
  "rstrip": false,
456
  "single_word": false
457
  },
458
  {
459
- "content": "endé",
460
  "lstrip": false,
461
  "normalized": false,
462
  "rstrip": false,
463
  "single_word": false
464
  },
465
  {
466
- "content": "[OBJECT:MUTUAL]",
467
  "lstrip": false,
468
  "normalized": false,
469
  "rstrip": false,
470
  "single_word": false
471
  },
472
  {
473
- "content": "[GERUND_SUFFIX:CLASS_1:CONSONANT]",
474
  "lstrip": false,
475
  "normalized": false,
476
  "rstrip": false,
477
  "single_word": false
478
  },
479
  {
480
- "content": "oré",
481
  "lstrip": false,
482
  "normalized": false,
483
  "rstrip": false,
484
  "single_word": false
485
  },
486
  {
487
- "content": "t",
488
  "lstrip": false,
489
  "normalized": false,
490
  "rstrip": false,
491
  "single_word": false
492
  },
493
  {
494
- "content": "bo",
495
  "lstrip": false,
496
  "normalized": false,
497
  "rstrip": false,
498
  "single_word": false
499
  },
500
  {
501
- "content": "[GERUND_SUFFIX:CLASS_1:IYU]",
502
  "lstrip": false,
503
  "normalized": false,
504
  "rstrip": false,
505
  "single_word": false
506
  },
507
  {
508
- "content": "r",
509
  "lstrip": false,
510
  "normalized": false,
511
  "rstrip": false,
512
  "single_word": false
513
  },
514
  {
515
- "content": "i",
516
  "lstrip": false,
517
  "normalized": false,
518
  "rstrip": false,
519
  "single_word": false
520
  },
521
  {
522
- "content": "ramo",
523
  "lstrip": false,
524
  "normalized": false,
525
  "rstrip": false,
526
  "single_word": false
527
  },
528
  {
529
- "content": "[OBJECT:1ppe]",
530
  "lstrip": false,
531
  "normalized": false,
532
  "rstrip": false,
533
  "single_word": false
534
  },
535
  {
536
- "content": "[OBJECT:3p:MONOSYLLABIC]",
537
  "lstrip": false,
538
  "normalized": false,
539
  "rstrip": false,
540
  "single_word": false
541
  },
542
  {
543
- "content": "ta",
544
  "lstrip": false,
545
  "normalized": false,
546
  "rstrip": false,
547
  "single_word": false
548
  },
549
  {
550
- "content": "[SUBJECT_PREFIX:2ps]",
551
  "lstrip": false,
552
  "normalized": false,
553
  "rstrip": false,
554
  "single_word": false
555
  },
556
  {
557
- "content": "a'e",
558
  "lstrip": false,
559
  "normalized": false,
560
  "rstrip": false,
561
  "single_word": false
562
  },
563
  {
564
- "content": "[OBJECT:DIRECT]",
565
  "lstrip": false,
566
  "normalized": false,
567
  "rstrip": false,
568
  "single_word": false
569
  },
570
  {
571
- "content": "peîepé",
572
  "lstrip": false,
573
  "normalized": false,
574
  "rstrip": false,
575
  "single_word": false
576
  },
577
  {
578
- "content": "a",
579
  "lstrip": false,
580
  "normalized": false,
581
  "rstrip": false,
582
  "single_word": false
583
  },
584
  {
585
- "content": "[GERUND_SUBJECT_PREFIX:1ppe]",
586
  "lstrip": false,
587
  "normalized": false,
588
  "rstrip": false,
589
  "single_word": false
590
  },
591
  {
592
- "content": "[GERUND_SUFFIX:CLASS_2:DEFAULT]",
593
  "lstrip": false,
594
  "normalized": false,
595
  "rstrip": false,
596
  "single_word": false
597
  },
598
  {
599
- "content": "[SUBJECT:2pp]",
600
  "lstrip": false,
601
  "normalized": false,
602
  "rstrip": false,
603
  "single_word": false
604
  },
605
  {
606
- "content": "[GERUND_SUFFIX:CLASS_1:NASAL_IYU]",
607
  "lstrip": false,
608
  "normalized": false,
609
  "rstrip": false,
610
  "single_word": false
611
  },
612
  {
613
- "content": "[OBJECT:2ps]",
614
  "lstrip": false,
615
  "normalized": false,
616
  "rstrip": false,
617
  "single_word": false
618
  },
619
  {
620
- "content": "[SUBJECT_PREFIX:1ppe]",
621
  "lstrip": false,
622
  "normalized": false,
623
  "rstrip": false,
624
  "single_word": false
625
  },
626
  {
627
- "content": "[NEGATION_SUFFIX]",
628
  "lstrip": false,
629
  "normalized": false,
630
  "rstrip": false,
631
  "single_word": false
632
  },
633
  {
634
- "content": "e",
635
  "lstrip": false,
636
  "normalized": false,
637
  "rstrip": false,
638
  "single_word": false
639
  },
640
  {
641
- "content": "[PERMISSIVE_PREFIX:VOWEL]",
642
  "lstrip": false,
643
  "normalized": false,
644
  "rstrip": false,
645
  "single_word": false
646
  },
647
  {
648
- "content": "[OBJECT:REFLEXIVE]",
649
  "lstrip": false,
650
  "normalized": false,
651
  "rstrip": false,
652
  "single_word": false
653
  },
654
  {
655
- "content": "pa",
656
  "lstrip": false,
657
  "normalized": false,
658
  "rstrip": false,
659
  "single_word": false
660
  },
661
  {
662
- "content": "[SUBJECT_PREFIX:2pp]",
663
  "lstrip": false,
664
  "normalized": false,
665
  "rstrip": false,
666
  "single_word": false
667
  },
668
  {
669
- "content": "[GERUND_SUFFIX:CLASS_1:B]",
670
  "lstrip": false,
671
  "normalized": false,
672
  "rstrip": false,
673
  "single_word": false
674
  },
675
  {
676
- "content": "[SUBJECT:2pp:OBJECT_1P]",
677
  "lstrip": false,
678
  "normalized": false,
679
  "rstrip": false,
680
  "single_word": false
681
  },
682
  {
683
- "content": "oro",
684
  "lstrip": false,
685
  "normalized": false,
686
  "rstrip": false,
687
  "single_word": false
688
  },
689
  {
690
- "content": "[NEGATION_SUFFIX:VOWEL_ENDING]",
691
  "lstrip": false,
692
  "normalized": false,
693
  "rstrip": false,
694
  "single_word": false
695
  },
696
  {
697
- "content": "[CIRCUMSTANTIAL_SUFFIX:VOWEL_ENDING]",
698
  "lstrip": false,
699
  "normalized": false,
700
  "rstrip": false,
701
  "single_word": false
702
  },
703
  {
704
- "content": "[CIRCUMSTANTIAL_SUFFIX:NULL_ENDING]",
705
  "lstrip": false,
706
  "normalized": false,
707
  "rstrip": false,
708
  "single_word": false
709
  },
710
  {
711
- "content": "[IMPERATIVE_PREFIX:2ps]",
712
  "lstrip": false,
713
  "normalized": false,
714
  "rstrip": false,
715
  "single_word": false
716
  },
717
  {
718
- "content": "[OBJECT_MARKER:3p:MONOSYLLABIC]",
719
  "lstrip": false,
720
  "normalized": false,
721
  "rstrip": false,
722
  "single_word": false
723
  },
724
  {
725
- "content": "opo",
726
  "lstrip": false,
727
  "normalized": false,
728
  "rstrip": false,
729
  "single_word": false
730
  },
731
  {
732
- "content": "îo",
733
  "lstrip": false,
734
  "normalized": false,
735
  "rstrip": false,
 
1
  {
2
  "additional_special_tokens": [
3
  {
4
+ "content": "[SUBJECT:3p:DIRECT]",
5
  "lstrip": false,
6
  "normalized": false,
7
  "rstrip": false,
8
  "single_word": false
9
  },
10
  {
11
+ "content": "[GERUND_SUBJECT_PREFIX:1ppi]",
12
  "lstrip": false,
13
  "normalized": false,
14
  "rstrip": false,
15
  "single_word": false
16
  },
17
  {
18
+ "content": "[OBJECT:DIRECT]",
19
  "lstrip": false,
20
  "normalized": false,
21
  "rstrip": false,
22
  "single_word": false
23
  },
24
  {
25
+ "content": "î",
26
  "lstrip": false,
27
  "normalized": false,
28
  "rstrip": false,
29
  "single_word": false
30
  },
31
  {
32
+ "content": "îepé",
33
  "lstrip": false,
34
  "normalized": false,
35
  "rstrip": false,
36
  "single_word": false
37
  },
38
  {
39
+ "content": "e",
40
  "lstrip": false,
41
  "normalized": false,
42
  "rstrip": false,
43
  "single_word": false
44
  },
45
  {
46
+ "content": "[OBJECT:2pp]",
47
  "lstrip": false,
48
  "normalized": false,
49
  "rstrip": false,
50
  "single_word": false
51
  },
52
  {
53
+ "content": "ta",
54
  "lstrip": false,
55
  "normalized": false,
56
  "rstrip": false,
57
  "single_word": false
58
  },
59
  {
60
+ "content": "n'",
61
  "lstrip": false,
62
  "normalized": false,
63
  "rstrip": false,
64
  "single_word": false
65
  },
66
  {
67
+ "content": "peẽ",
68
  "lstrip": false,
69
  "normalized": false,
70
  "rstrip": false,
71
  "single_word": false
72
  },
73
  {
74
+ "content": "[SUBJECT:2pp]",
75
  "lstrip": false,
76
  "normalized": false,
77
  "rstrip": false,
78
  "single_word": false
79
  },
80
  {
81
+ "content": "îe",
82
  "lstrip": false,
83
  "normalized": false,
84
  "rstrip": false,
85
  "single_word": false
86
  },
87
  {
88
+ "content": "[GERUND_SUBJECT_PREFIX:3p]",
89
  "lstrip": false,
90
  "normalized": false,
91
  "rstrip": false,
92
  "single_word": false
93
  },
94
  {
95
+ "content": "[GERUND_SUBJECT_PREFIX:2pp]",
96
  "lstrip": false,
97
  "normalized": false,
98
  "rstrip": false,
99
  "single_word": false
100
  },
101
  {
102
+ "content": "[NEGATION_PARTICLE:NA]",
103
  "lstrip": false,
104
  "normalized": false,
105
  "rstrip": false,
106
  "single_word": false
107
  },
108
  {
109
+ "content": "[IMPERATIVE_PREFIX:2ps]",
110
  "lstrip": false,
111
  "normalized": false,
112
  "rstrip": false,
113
  "single_word": false
114
  },
115
  {
116
+ "content": "îos",
117
  "lstrip": false,
118
  "normalized": false,
119
  "rstrip": false,
120
  "single_word": false
121
  },
122
  {
123
+ "content": "[GERUND_SUFFIX:CLASS_1:NASAL_IYU]",
124
  "lstrip": false,
125
  "normalized": false,
126
  "rstrip": false,
127
  "single_word": false
128
  },
129
  {
130
+ "content": "[PLURIFORM_PREFIX:S]",
131
  "lstrip": false,
132
  "normalized": false,
133
  "rstrip": false,
134
  "single_word": false
135
  },
136
  {
137
+ "content": "û",
138
  "lstrip": false,
139
  "normalized": false,
140
  "rstrip": false,
141
  "single_word": false
142
  },
143
  {
144
+ "content": "[OBJECT_MARKER:3p:PLURIFORM_PREFIX:MONOSYLLABIC]",
145
  "lstrip": false,
146
  "normalized": false,
147
  "rstrip": false,
148
  "single_word": false
149
  },
150
  {
151
+ "content": "[OBJECT:1ppi]",
152
  "lstrip": false,
153
  "normalized": false,
154
  "rstrip": false,
155
  "single_word": false
156
  },
157
  {
158
+ "content": "abo",
159
  "lstrip": false,
160
  "normalized": false,
161
  "rstrip": false,
162
  "single_word": false
163
  },
164
  {
165
+ "content": "[GERUND_SUFFIX:CLASS_1]",
166
  "lstrip": false,
167
  "normalized": false,
168
  "rstrip": false,
169
  "single_word": false
170
  },
171
  {
172
+ "content": "[GERUND_SUFFIX:CLASS_1:IYU]",
173
  "lstrip": false,
174
  "normalized": false,
175
  "rstrip": false,
176
  "single_word": false
177
  },
178
  {
179
+ "content": "îo",
180
  "lstrip": false,
181
  "normalized": false,
182
  "rstrip": false,
183
  "single_word": false
184
  },
185
  {
186
+ "content": "[NEGATION_SUFFIX]",
187
  "lstrip": false,
188
  "normalized": false,
189
  "rstrip": false,
190
  "single_word": false
191
  },
192
  {
193
+ "content": "i",
194
  "lstrip": false,
195
  "normalized": false,
196
  "rstrip": false,
197
  "single_word": false
198
  },
199
  {
200
+ "content": "[GERUND_SUBJECT_PREFIX:1ppe]",
201
  "lstrip": false,
202
  "normalized": false,
203
  "rstrip": false,
204
  "single_word": false
205
  },
206
  {
207
+ "content": "[SUBJECT:3p]",
208
  "lstrip": false,
209
  "normalized": false,
210
  "rstrip": false,
211
  "single_word": false
212
  },
213
  {
214
+ "content": "[IMPERATIVE_PREFIX:2pp]",
215
  "lstrip": false,
216
  "normalized": false,
217
  "rstrip": false,
218
  "single_word": false
219
  },
220
  {
221
+ "content": "́",
222
  "lstrip": false,
223
  "normalized": false,
224
  "rstrip": false,
225
  "single_word": false
226
  },
227
  {
228
+ "content": "xe",
229
  "lstrip": false,
230
  "normalized": false,
231
  "rstrip": false,
232
  "single_word": false
233
  },
234
  {
235
+ "content": "a'e",
236
  "lstrip": false,
237
  "normalized": false,
238
  "rstrip": false,
239
  "single_word": false
240
  },
241
  {
242
+ "content": "t",
243
  "lstrip": false,
244
  "normalized": false,
245
  "rstrip": false,
246
  "single_word": false
247
  },
248
  {
249
+ "content": "[SUBJECT:1ps]",
250
  "lstrip": false,
251
  "normalized": false,
252
  "rstrip": false,
253
  "single_word": false
254
  },
255
  {
256
+ "content": "[SUBJECT:1ppe]",
257
  "lstrip": false,
258
  "normalized": false,
259
  "rstrip": false,
260
  "single_word": false
261
  },
262
  {
263
+ "content": "a",
264
  "lstrip": false,
265
  "normalized": false,
266
  "rstrip": false,
267
  "single_word": false
268
  },
269
  {
270
+ "content": "[SUBJECT_PREFIX:1ppe]",
271
  "lstrip": false,
272
  "normalized": false,
273
  "rstrip": false,
274
  "single_word": false
275
  },
276
  {
277
+ "content": "amo",
278
  "lstrip": false,
279
  "normalized": false,
280
  "rstrip": false,
281
  "single_word": false
282
  },
283
  {
284
+ "content": "[OBJECT:2ps]",
285
  "lstrip": false,
286
  "normalized": false,
287
  "rstrip": false,
288
  "single_word": false
289
  },
290
  {
291
+ "content": "[OBJECT:1ppe]",
292
  "lstrip": false,
293
  "normalized": false,
294
  "rstrip": false,
295
  "single_word": false
296
  },
297
  {
298
+ "content": "[NEGATION_SUFFIX:CONSONANT_ENDING]",
299
  "lstrip": false,
300
  "normalized": false,
301
  "rstrip": false,
302
  "single_word": false
303
  },
304
  {
305
+ "content": "[OBJECT:MUTUAL]",
306
  "lstrip": false,
307
  "normalized": false,
308
  "rstrip": false,
309
  "single_word": false
310
  },
311
  {
312
+ "content": "[GERUND_SUFFIX:CLASS_2:ORAL_VOWEL_ENDING]",
313
  "lstrip": false,
314
  "normalized": false,
315
  "rstrip": false,
316
  "single_word": false
317
  },
318
  {
319
+ "content": "[NEGATION_PREFIX]",
320
  "lstrip": false,
321
  "normalized": false,
322
  "rstrip": false,
323
  "single_word": false
324
  },
325
  {
326
+ "content": "[CIRCUMSTANTIAL_SUFFIX:NULL_ENDING]",
327
  "lstrip": false,
328
  "normalized": false,
329
  "rstrip": false,
330
  "single_word": false
331
  },
332
  {
333
+ "content": "[SUBJECT:1ppi]",
334
  "lstrip": false,
335
  "normalized": false,
336
  "rstrip": false,
337
  "single_word": false
338
  },
339
  {
340
+ "content": "[PERMISSIVE_PREFIX:VOWEL]",
341
  "lstrip": false,
342
  "normalized": false,
343
  "rstrip": false,
344
  "single_word": false
345
  },
346
  {
347
+ "content": "pe",
348
  "lstrip": false,
349
  "normalized": false,
350
  "rstrip": false,
351
  "single_word": false
352
  },
353
  {
354
+ "content": "nde",
355
  "lstrip": false,
356
  "normalized": false,
357
  "rstrip": false,
358
  "single_word": false
359
  },
360
  {
361
+ "content": "opo",
362
  "lstrip": false,
363
  "normalized": false,
364
  "rstrip": false,
365
  "single_word": false
366
  },
367
  {
368
+ "content": "[OBJECT_MARKER:3p:DEFAULT]",
369
  "lstrip": false,
370
  "normalized": false,
371
  "rstrip": false,
372
  "single_word": false
373
  },
374
  {
375
+ "content": "[GERUND_SUBJECT_PREFIX:2ps]",
376
  "lstrip": false,
377
  "normalized": false,
378
  "rstrip": false,
379
  "single_word": false
380
  },
381
  {
382
+ "content": "[OBJECT:3p]",
383
  "lstrip": false,
384
  "normalized": false,
385
  "rstrip": false,
386
  "single_word": false
387
  },
388
  {
389
+ "content": "îandé",
390
  "lstrip": false,
391
  "normalized": false,
392
  "rstrip": false,
393
  "single_word": false
394
  },
395
  {
396
+ "content": "[OBJECT:2pp:SUBJECT_1P]",
397
  "lstrip": false,
398
  "normalized": false,
399
  "rstrip": false,
400
  "single_word": false
401
  },
402
  {
403
+ "content": "gûi",
404
  "lstrip": false,
405
  "normalized": false,
406
  "rstrip": false,
407
  "single_word": false
408
  },
409
  {
410
+ "content": "[CIRCUMSTANTIAL_SUFFIX:VOWEL_ENDING]",
411
  "lstrip": false,
412
  "normalized": false,
413
  "rstrip": false,
414
  "single_word": false
415
  },
416
  {
417
+ "content": "[OBJECT_MARKER:3p:MONOSYLLABIC]",
418
  "lstrip": false,
419
  "normalized": false,
420
  "rstrip": false,
421
  "single_word": false
422
  },
423
  {
424
+ "content": "peîepé",
425
  "lstrip": false,
426
  "normalized": false,
427
  "rstrip": false,
428
  "single_word": false
429
  },
430
  {
431
+ "content": "[GERUND_SUFFIX:CLASS_1:R]",
432
  "lstrip": false,
433
  "normalized": false,
434
  "rstrip": false,
435
  "single_word": false
436
  },
437
  {
438
+ "content": "endé",
439
  "lstrip": false,
440
  "normalized": false,
441
  "rstrip": false,
442
  "single_word": false
443
  },
444
  {
445
+ "content": "namo",
446
  "lstrip": false,
447
  "normalized": false,
448
  "rstrip": false,
449
  "single_word": false
450
  },
451
  {
452
+ "content": "[SUBJECT:2pp:OBJECT_1P]",
453
  "lstrip": false,
454
  "normalized": false,
455
  "rstrip": false,
456
  "single_word": false
457
  },
458
  {
459
+ "content": "mo",
460
  "lstrip": false,
461
  "normalized": false,
462
  "rstrip": false,
463
  "single_word": false
464
  },
465
  {
466
+ "content": "bo",
467
  "lstrip": false,
468
  "normalized": false,
469
  "rstrip": false,
470
  "single_word": false
471
  },
472
  {
473
+ "content": "[SUBJECT_PREFIX:2pp]",
474
  "lstrip": false,
475
  "normalized": false,
476
  "rstrip": false,
477
  "single_word": false
478
  },
479
  {
480
+ "content": "[CIRCUMSTANTIAL_SUFFIX:CONSONANT_ENDING]",
481
  "lstrip": false,
482
  "normalized": false,
483
  "rstrip": false,
484
  "single_word": false
485
  },
486
  {
487
+ "content": "[ROOT]",
488
  "lstrip": false,
489
  "normalized": false,
490
  "rstrip": false,
491
  "single_word": false
492
  },
493
  {
494
+ "content": "[NEGATION_PARTICLE:UME]",
495
  "lstrip": false,
496
  "normalized": false,
497
  "rstrip": false,
498
  "single_word": false
499
  },
500
  {
501
+ "content": "e'ym",
502
  "lstrip": false,
503
  "normalized": false,
504
  "rstrip": false,
505
  "single_word": false
506
  },
507
  {
508
+ "content": "[SUBJECT_PREFIX:3p]",
509
  "lstrip": false,
510
  "normalized": false,
511
  "rstrip": false,
512
  "single_word": false
513
  },
514
  {
515
+ "content": "r",
516
  "lstrip": false,
517
  "normalized": false,
518
  "rstrip": false,
519
  "single_word": false
520
  },
521
  {
522
+ "content": "[NEGATION_SUFFIX:VOWEL_ENDING]",
523
  "lstrip": false,
524
  "normalized": false,
525
  "rstrip": false,
526
  "single_word": false
527
  },
528
  {
529
+ "content": "[SUBJECT_PREFIX:1ps]",
530
  "lstrip": false,
531
  "normalized": false,
532
  "rstrip": false,
533
  "single_word": false
534
  },
535
  {
536
+ "content": "[GERUND_SUFFIX:CLASS_1:ORAL_VOWEL]",
537
  "lstrip": false,
538
  "normalized": false,
539
  "rstrip": false,
540
  "single_word": false
541
  },
542
  {
543
+ "content": "ixé",
544
  "lstrip": false,
545
  "normalized": false,
546
  "rstrip": false,
547
  "single_word": false
548
  },
549
  {
550
+ "content": "pa",
551
  "lstrip": false,
552
  "normalized": false,
553
  "rstrip": false,
554
  "single_word": false
555
  },
556
  {
557
+ "content": "ramo",
558
  "lstrip": false,
559
  "normalized": false,
560
  "rstrip": false,
561
  "single_word": false
562
  },
563
  {
564
+ "content": "ere",
565
  "lstrip": false,
566
  "normalized": false,
567
  "rstrip": false,
568
  "single_word": false
569
  },
570
  {
571
+ "content": "[OBJECT:REFLEXIVE]",
572
  "lstrip": false,
573
  "normalized": false,
574
  "rstrip": false,
575
  "single_word": false
576
  },
577
  {
578
+ "content": "[GERUND_SUFFIX:CLASS_1:NASAL_VOWEL]",
579
  "lstrip": false,
580
  "normalized": false,
581
  "rstrip": false,
582
  "single_word": false
583
  },
584
  {
585
+ "content": "na",
586
  "lstrip": false,
587
  "normalized": false,
588
  "rstrip": false,
589
  "single_word": false
590
  },
591
  {
592
+ "content": "[GERUND_SUFFIX:CLASS_1:B]",
593
  "lstrip": false,
594
  "normalized": false,
595
  "rstrip": false,
596
  "single_word": false
597
  },
598
  {
599
+ "content": "[OBJECT:3p:MONOSYLLABIC]",
600
  "lstrip": false,
601
  "normalized": false,
602
  "rstrip": false,
603
  "single_word": false
604
  },
605
  {
606
+ "content": "[GERUND_SUFFIX:CLASS_1:CONSONANT]",
607
  "lstrip": false,
608
  "normalized": false,
609
  "rstrip": false,
610
  "single_word": false
611
  },
612
  {
613
+ "content": "[OBJECT:2ps:SUBJECT_1P]",
614
  "lstrip": false,
615
  "normalized": false,
616
  "rstrip": false,
617
  "single_word": false
618
  },
619
  {
620
+ "content": "[GERUND_SUBJECT_PREFIX:1ps]",
621
  "lstrip": false,
622
  "normalized": false,
623
  "rstrip": false,
624
  "single_word": false
625
  },
626
  {
627
+ "content": "oro",
628
  "lstrip": false,
629
  "normalized": false,
630
  "rstrip": false,
631
  "single_word": false
632
  },
633
  {
634
+ "content": "[PERMISSIVE_PREFIX:CONSONANT]",
635
  "lstrip": false,
636
  "normalized": false,
637
  "rstrip": false,
638
  "single_word": false
639
  },
640
  {
641
+ "content": "í",
642
  "lstrip": false,
643
  "normalized": false,
644
  "rstrip": false,
645
  "single_word": false
646
  },
647
  {
648
+ "content": "oré",
649
  "lstrip": false,
650
  "normalized": false,
651
  "rstrip": false,
652
  "single_word": false
653
  },
654
  {
655
+ "content": "umẽ",
656
  "lstrip": false,
657
  "normalized": false,
658
  "rstrip": false,
659
  "single_word": false
660
  },
661
  {
662
+ "content": "[SUBJECT:2ps]",
663
  "lstrip": false,
664
  "normalized": false,
665
  "rstrip": false,
666
  "single_word": false
667
  },
668
  {
669
+ "content": "[PLURIFORM_PREFIX:R]",
670
  "lstrip": false,
671
  "normalized": false,
672
  "rstrip": false,
673
  "single_word": false
674
  },
675
  {
676
+ "content": "o",
677
  "lstrip": false,
678
  "normalized": false,
679
  "rstrip": false,
680
  "single_word": false
681
  },
682
  {
683
+ "content": "[SUBJECT:2ps:OBJECT_1P]",
684
  "lstrip": false,
685
  "normalized": false,
686
  "rstrip": false,
687
  "single_word": false
688
  },
689
  {
690
+ "content": "îa",
691
  "lstrip": false,
692
  "normalized": false,
693
  "rstrip": false,
694
  "single_word": false
695
  },
696
  {
697
+ "content": "[OBJECT:1ps]",
698
  "lstrip": false,
699
  "normalized": false,
700
  "rstrip": false,
701
  "single_word": false
702
  },
703
  {
704
+ "content": "[GERUND_SUFFIX:CLASS_2:DEFAULT]",
705
  "lstrip": false,
706
  "normalized": false,
707
  "rstrip": false,
708
  "single_word": false
709
  },
710
  {
711
+ "content": "[GERUND_SUFFIX:CLASS_2:NASAL_VOWEL_ENDING]",
712
  "lstrip": false,
713
  "normalized": false,
714
  "rstrip": false,
715
  "single_word": false
716
  },
717
  {
718
+ "content": "[SUBJECT_PREFIX:1ppi]",
719
  "lstrip": false,
720
  "normalized": false,
721
  "rstrip": false,
722
  "single_word": false
723
  },
724
  {
725
+ "content": "[SUBJECT_PREFIX:2ps]",
726
  "lstrip": false,
727
  "normalized": false,
728
  "rstrip": false,
729
  "single_word": false
730
  },
731
  {
732
+ "content": "s",
733
  "lstrip": false,
734
  "normalized": false,
735
  "rstrip": false,
tokenizer_config.json CHANGED
@@ -1683,111 +1683,111 @@
1683
  }
1684
  },
1685
  "additional_special_tokens": [
1686
- "e'ym",
 
 
 
1687
  "îepé",
1688
- "[ROOT]",
 
 
 
 
 
 
 
 
 
 
 
 
1689
  "[PLURIFORM_PREFIX:S]",
1690
- "[OBJECT:1ps]",
 
 
 
1691
  "[GERUND_SUFFIX:CLASS_1]",
1692
- "[OBJECT:2ps:SUBJECT_1P]",
1693
- "[NEGATION_PARTICLE:NA]",
1694
- "îe",
1695
- "́",
1696
- "amo",
1697
- "[GERUND_SUBJECT_PREFIX:1ppi]",
1698
- "îa",
1699
- "umẽ",
1700
- "[GERUND_SUBJECT_PREFIX:1ps]",
1701
- "o",
1702
- "[SUBJECT_PREFIX:1ppi]",
1703
  "[IMPERATIVE_PREFIX:2pp]",
 
1704
  "xe",
1705
- "[SUBJECT_PREFIX:1ps]",
1706
- "[PLURIFORM_PREFIX:R]",
1707
- "í",
1708
- "n'",
1709
- "[OBJECT:2pp:SUBJECT_1P]",
1710
- "[PERMISSIVE_PREFIX:CONSONANT]",
1711
  "[SUBJECT:1ps]",
1712
- "î",
1713
- "[SUBJECT:2ps]",
1714
- "[OBJECT_MARKER:3p:PLURIFORM_PREFIX:MONOSYLLABIC]",
1715
- "pe",
1716
- "[NEGATION_PREFIX]",
1717
- "[OBJECT:2pp]",
1718
- "abo",
1719
- "na",
1720
- "[GERUND_SUFFIX:CLASS_1:R]",
1721
- "[SUBJECT_PREFIX:3p]",
1722
- "[OBJECT:1ppi]",
1723
- "[NEGATION_PARTICLE:UME]",
1724
- "îandé",
1725
- "[GERUND_SUFFIX:CLASS_1:ORAL_VOWEL]",
1726
  "[NEGATION_SUFFIX:CONSONANT_ENDING]",
1727
- "[GERUND_SUBJECT_PREFIX:2pp]",
1728
- "[CIRCUMSTANTIAL_SUFFIX:CONSONANT_ENDING]",
1729
  "[GERUND_SUFFIX:CLASS_2:ORAL_VOWEL_ENDING]",
 
 
 
 
 
 
 
 
1730
  "[GERUND_SUBJECT_PREFIX:2ps]",
 
 
 
1731
  "gûi",
1732
- "ixé",
 
 
 
 
1733
  "namo",
1734
- "[OBJECT:3p]",
1735
- "ere",
1736
- "[SUBJECT:3p:DIRECT]",
1737
  "mo",
1738
- "[GERUND_SUFFIX:CLASS_2:NASAL_VOWEL_ENDING]",
1739
- "[SUBJECT:1ppe]",
1740
- "[GERUND_SUBJECT_PREFIX:3p]",
1741
- "[OBJECT_MARKER:3p:DEFAULT]",
1742
- "[SUBJECT:1ppi]",
1743
- "[GERUND_SUFFIX:CLASS_1:NASAL_VOWEL]",
1744
- "peẽ",
1745
- "s",
1746
- "[SUBJECT:3p]",
1747
- "û",
1748
- "[SUBJECT:2ps:OBJECT_1P]",
1749
- "îos",
1750
- "nde",
1751
- "endé",
1752
- "[OBJECT:MUTUAL]",
1753
- "[GERUND_SUFFIX:CLASS_1:CONSONANT]",
1754
- "oré",
1755
- "t",
1756
  "bo",
1757
- "[GERUND_SUFFIX:CLASS_1:IYU]",
 
 
 
 
 
1758
  "r",
1759
- "i",
 
 
 
 
1760
  "ramo",
1761
- "[OBJECT:1ppe]",
1762
- "[OBJECT:3p:MONOSYLLABIC]",
1763
- "ta",
1764
- "[SUBJECT_PREFIX:2ps]",
1765
- "a'e",
1766
- "[OBJECT:DIRECT]",
1767
- "peîepé",
1768
- "a",
1769
- "[GERUND_SUBJECT_PREFIX:1ppe]",
1770
- "[GERUND_SUFFIX:CLASS_2:DEFAULT]",
1771
- "[SUBJECT:2pp]",
1772
- "[GERUND_SUFFIX:CLASS_1:NASAL_IYU]",
1773
- "[OBJECT:2ps]",
1774
- "[SUBJECT_PREFIX:1ppe]",
1775
- "[NEGATION_SUFFIX]",
1776
- "e",
1777
- "[PERMISSIVE_PREFIX:VOWEL]",
1778
  "[OBJECT:REFLEXIVE]",
1779
- "pa",
1780
- "[SUBJECT_PREFIX:2pp]",
1781
  "[GERUND_SUFFIX:CLASS_1:B]",
1782
- "[SUBJECT:2pp:OBJECT_1P]",
 
 
 
1783
  "oro",
1784
- "[NEGATION_SUFFIX:VOWEL_ENDING]",
1785
- "[CIRCUMSTANTIAL_SUFFIX:VOWEL_ENDING]",
1786
- "[CIRCUMSTANTIAL_SUFFIX:NULL_ENDING]",
1787
- "[IMPERATIVE_PREFIX:2ps]",
1788
- "[OBJECT_MARKER:3p:MONOSYLLABIC]",
1789
- "opo",
1790
- "îo",
 
 
 
 
 
 
 
 
1791
  "[SPACE]"
1792
  ],
1793
  "clean_up_tokenization_spaces": true,
 
1683
  }
1684
  },
1685
  "additional_special_tokens": [
1686
+ "[SUBJECT:3p:DIRECT]",
1687
+ "[GERUND_SUBJECT_PREFIX:1ppi]",
1688
+ "[OBJECT:DIRECT]",
1689
+ "î",
1690
  "îepé",
1691
+ "e",
1692
+ "[OBJECT:2pp]",
1693
+ "ta",
1694
+ "n'",
1695
+ "peẽ",
1696
+ "[SUBJECT:2pp]",
1697
+ "îe",
1698
+ "[GERUND_SUBJECT_PREFIX:3p]",
1699
+ "[GERUND_SUBJECT_PREFIX:2pp]",
1700
+ "[NEGATION_PARTICLE:NA]",
1701
+ "[IMPERATIVE_PREFIX:2ps]",
1702
+ "îos",
1703
+ "[GERUND_SUFFIX:CLASS_1:NASAL_IYU]",
1704
  "[PLURIFORM_PREFIX:S]",
1705
+ "û",
1706
+ "[OBJECT_MARKER:3p:PLURIFORM_PREFIX:MONOSYLLABIC]",
1707
+ "[OBJECT:1ppi]",
1708
+ "abo",
1709
  "[GERUND_SUFFIX:CLASS_1]",
1710
+ "[GERUND_SUFFIX:CLASS_1:IYU]",
1711
+ "îo",
1712
+ "[NEGATION_SUFFIX]",
1713
+ "i",
1714
+ "[GERUND_SUBJECT_PREFIX:1ppe]",
1715
+ "[SUBJECT:3p]",
 
 
 
 
 
1716
  "[IMPERATIVE_PREFIX:2pp]",
1717
+ "́",
1718
  "xe",
1719
+ "a'e",
1720
+ "t",
 
 
 
 
1721
  "[SUBJECT:1ps]",
1722
+ "[SUBJECT:1ppe]",
1723
+ "a",
1724
+ "[SUBJECT_PREFIX:1ppe]",
1725
+ "amo",
1726
+ "[OBJECT:2ps]",
1727
+ "[OBJECT:1ppe]",
 
 
 
 
 
 
 
 
1728
  "[NEGATION_SUFFIX:CONSONANT_ENDING]",
1729
+ "[OBJECT:MUTUAL]",
 
1730
  "[GERUND_SUFFIX:CLASS_2:ORAL_VOWEL_ENDING]",
1731
+ "[NEGATION_PREFIX]",
1732
+ "[CIRCUMSTANTIAL_SUFFIX:NULL_ENDING]",
1733
+ "[SUBJECT:1ppi]",
1734
+ "[PERMISSIVE_PREFIX:VOWEL]",
1735
+ "pe",
1736
+ "nde",
1737
+ "opo",
1738
+ "[OBJECT_MARKER:3p:DEFAULT]",
1739
  "[GERUND_SUBJECT_PREFIX:2ps]",
1740
+ "[OBJECT:3p]",
1741
+ "îandé",
1742
+ "[OBJECT:2pp:SUBJECT_1P]",
1743
  "gûi",
1744
+ "[CIRCUMSTANTIAL_SUFFIX:VOWEL_ENDING]",
1745
+ "[OBJECT_MARKER:3p:MONOSYLLABIC]",
1746
+ "peîepé",
1747
+ "[GERUND_SUFFIX:CLASS_1:R]",
1748
+ "endé",
1749
  "namo",
1750
+ "[SUBJECT:2pp:OBJECT_1P]",
 
 
1751
  "mo",
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1752
  "bo",
1753
+ "[SUBJECT_PREFIX:2pp]",
1754
+ "[CIRCUMSTANTIAL_SUFFIX:CONSONANT_ENDING]",
1755
+ "[ROOT]",
1756
+ "[NEGATION_PARTICLE:UME]",
1757
+ "e'ym",
1758
+ "[SUBJECT_PREFIX:3p]",
1759
  "r",
1760
+ "[NEGATION_SUFFIX:VOWEL_ENDING]",
1761
+ "[SUBJECT_PREFIX:1ps]",
1762
+ "[GERUND_SUFFIX:CLASS_1:ORAL_VOWEL]",
1763
+ "ixé",
1764
+ "pa",
1765
  "ramo",
1766
+ "ere",
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1767
  "[OBJECT:REFLEXIVE]",
1768
+ "[GERUND_SUFFIX:CLASS_1:NASAL_VOWEL]",
1769
+ "na",
1770
  "[GERUND_SUFFIX:CLASS_1:B]",
1771
+ "[OBJECT:3p:MONOSYLLABIC]",
1772
+ "[GERUND_SUFFIX:CLASS_1:CONSONANT]",
1773
+ "[OBJECT:2ps:SUBJECT_1P]",
1774
+ "[GERUND_SUBJECT_PREFIX:1ps]",
1775
  "oro",
1776
+ "[PERMISSIVE_PREFIX:CONSONANT]",
1777
+ "í",
1778
+ "oré",
1779
+ "umẽ",
1780
+ "[SUBJECT:2ps]",
1781
+ "[PLURIFORM_PREFIX:R]",
1782
+ "o",
1783
+ "[SUBJECT:2ps:OBJECT_1P]",
1784
+ "îa",
1785
+ "[OBJECT:1ps]",
1786
+ "[GERUND_SUFFIX:CLASS_2:DEFAULT]",
1787
+ "[GERUND_SUFFIX:CLASS_2:NASAL_VOWEL_ENDING]",
1788
+ "[SUBJECT_PREFIX:1ppi]",
1789
+ "[SUBJECT_PREFIX:2ps]",
1790
+ "s",
1791
  "[SPACE]"
1792
  ],
1793
  "clean_up_tokenization_spaces": true,