bilguun committed on
Commit
ccf73fc
1 Parent(s): 0595a97

Upload tokenizer

Browse files
Files changed (3) hide show
  1. spiece.model +2 -2
  2. tokenizer.json +0 -0
  3. tokenizer_config.json +100 -100
spiece.model CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:829ed13b97a7ef734aaf095db01da9557aa389fffa99c9a85d483ada98a4bbe6
3
- size 413481
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8674db3129dcc5bae3065822cdbbde6b79939ace7a837cc91ded51c6bc51bba2
3
+ size 321146
tokenizer.json CHANGED
The diff for this file is too large to render. See raw diff
 
tokenizer_config.json CHANGED
@@ -33,7 +33,7 @@
33
  "single_word": false,
34
  "special": true
35
  },
36
- "8000": {
37
  "content": "<extra_id_99>",
38
  "lstrip": false,
39
  "normalized": false,
@@ -41,7 +41,7 @@
41
  "single_word": false,
42
  "special": true
43
  },
44
- "8001": {
45
  "content": "<extra_id_98>",
46
  "lstrip": false,
47
  "normalized": false,
@@ -49,7 +49,7 @@
49
  "single_word": false,
50
  "special": true
51
  },
52
- "8002": {
53
  "content": "<extra_id_97>",
54
  "lstrip": false,
55
  "normalized": false,
@@ -57,7 +57,7 @@
57
  "single_word": false,
58
  "special": true
59
  },
60
- "8003": {
61
  "content": "<extra_id_96>",
62
  "lstrip": false,
63
  "normalized": false,
@@ -65,7 +65,7 @@
65
  "single_word": false,
66
  "special": true
67
  },
68
- "8004": {
69
  "content": "<extra_id_95>",
70
  "lstrip": false,
71
  "normalized": false,
@@ -73,7 +73,7 @@
73
  "single_word": false,
74
  "special": true
75
  },
76
- "8005": {
77
  "content": "<extra_id_94>",
78
  "lstrip": false,
79
  "normalized": false,
@@ -81,7 +81,7 @@
81
  "single_word": false,
82
  "special": true
83
  },
84
- "8006": {
85
  "content": "<extra_id_93>",
86
  "lstrip": false,
87
  "normalized": false,
@@ -89,7 +89,7 @@
89
  "single_word": false,
90
  "special": true
91
  },
92
- "8007": {
93
  "content": "<extra_id_92>",
94
  "lstrip": false,
95
  "normalized": false,
@@ -97,7 +97,7 @@
97
  "single_word": false,
98
  "special": true
99
  },
100
- "8008": {
101
  "content": "<extra_id_91>",
102
  "lstrip": false,
103
  "normalized": false,
@@ -105,7 +105,7 @@
105
  "single_word": false,
106
  "special": true
107
  },
108
- "8009": {
109
  "content": "<extra_id_90>",
110
  "lstrip": false,
111
  "normalized": false,
@@ -113,7 +113,7 @@
113
  "single_word": false,
114
  "special": true
115
  },
116
- "8010": {
117
  "content": "<extra_id_89>",
118
  "lstrip": false,
119
  "normalized": false,
@@ -121,7 +121,7 @@
121
  "single_word": false,
122
  "special": true
123
  },
124
- "8011": {
125
  "content": "<extra_id_88>",
126
  "lstrip": false,
127
  "normalized": false,
@@ -129,7 +129,7 @@
129
  "single_word": false,
130
  "special": true
131
  },
132
- "8012": {
133
  "content": "<extra_id_87>",
134
  "lstrip": false,
135
  "normalized": false,
@@ -137,7 +137,7 @@
137
  "single_word": false,
138
  "special": true
139
  },
140
- "8013": {
141
  "content": "<extra_id_86>",
142
  "lstrip": false,
143
  "normalized": false,
@@ -145,7 +145,7 @@
145
  "single_word": false,
146
  "special": true
147
  },
148
- "8014": {
149
  "content": "<extra_id_85>",
150
  "lstrip": false,
151
  "normalized": false,
@@ -153,7 +153,7 @@
153
  "single_word": false,
154
  "special": true
155
  },
156
- "8015": {
157
  "content": "<extra_id_84>",
158
  "lstrip": false,
159
  "normalized": false,
@@ -161,7 +161,7 @@
161
  "single_word": false,
162
  "special": true
163
  },
164
- "8016": {
165
  "content": "<extra_id_83>",
166
  "lstrip": false,
167
  "normalized": false,
@@ -169,7 +169,7 @@
169
  "single_word": false,
170
  "special": true
171
  },
172
- "8017": {
173
  "content": "<extra_id_82>",
174
  "lstrip": false,
175
  "normalized": false,
@@ -177,7 +177,7 @@
177
  "single_word": false,
178
  "special": true
179
  },
180
- "8018": {
181
  "content": "<extra_id_81>",
182
  "lstrip": false,
183
  "normalized": false,
@@ -185,7 +185,7 @@
185
  "single_word": false,
186
  "special": true
187
  },
188
- "8019": {
189
  "content": "<extra_id_80>",
190
  "lstrip": false,
191
  "normalized": false,
@@ -193,7 +193,7 @@
193
  "single_word": false,
194
  "special": true
195
  },
196
- "8020": {
197
  "content": "<extra_id_79>",
198
  "lstrip": false,
199
  "normalized": false,
@@ -201,7 +201,7 @@
201
  "single_word": false,
202
  "special": true
203
  },
204
- "8021": {
205
  "content": "<extra_id_78>",
206
  "lstrip": false,
207
  "normalized": false,
@@ -209,7 +209,7 @@
209
  "single_word": false,
210
  "special": true
211
  },
212
- "8022": {
213
  "content": "<extra_id_77>",
214
  "lstrip": false,
215
  "normalized": false,
@@ -217,7 +217,7 @@
217
  "single_word": false,
218
  "special": true
219
  },
220
- "8023": {
221
  "content": "<extra_id_76>",
222
  "lstrip": false,
223
  "normalized": false,
@@ -225,7 +225,7 @@
225
  "single_word": false,
226
  "special": true
227
  },
228
- "8024": {
229
  "content": "<extra_id_75>",
230
  "lstrip": false,
231
  "normalized": false,
@@ -233,7 +233,7 @@
233
  "single_word": false,
234
  "special": true
235
  },
236
- "8025": {
237
  "content": "<extra_id_74>",
238
  "lstrip": false,
239
  "normalized": false,
@@ -241,7 +241,7 @@
241
  "single_word": false,
242
  "special": true
243
  },
244
- "8026": {
245
  "content": "<extra_id_73>",
246
  "lstrip": false,
247
  "normalized": false,
@@ -249,7 +249,7 @@
249
  "single_word": false,
250
  "special": true
251
  },
252
- "8027": {
253
  "content": "<extra_id_72>",
254
  "lstrip": false,
255
  "normalized": false,
@@ -257,7 +257,7 @@
257
  "single_word": false,
258
  "special": true
259
  },
260
- "8028": {
261
  "content": "<extra_id_71>",
262
  "lstrip": false,
263
  "normalized": false,
@@ -265,7 +265,7 @@
265
  "single_word": false,
266
  "special": true
267
  },
268
- "8029": {
269
  "content": "<extra_id_70>",
270
  "lstrip": false,
271
  "normalized": false,
@@ -273,7 +273,7 @@
273
  "single_word": false,
274
  "special": true
275
  },
276
- "8030": {
277
  "content": "<extra_id_69>",
278
  "lstrip": false,
279
  "normalized": false,
@@ -281,7 +281,7 @@
281
  "single_word": false,
282
  "special": true
283
  },
284
- "8031": {
285
  "content": "<extra_id_68>",
286
  "lstrip": false,
287
  "normalized": false,
@@ -289,7 +289,7 @@
289
  "single_word": false,
290
  "special": true
291
  },
292
- "8032": {
293
  "content": "<extra_id_67>",
294
  "lstrip": false,
295
  "normalized": false,
@@ -297,7 +297,7 @@
297
  "single_word": false,
298
  "special": true
299
  },
300
- "8033": {
301
  "content": "<extra_id_66>",
302
  "lstrip": false,
303
  "normalized": false,
@@ -305,7 +305,7 @@
305
  "single_word": false,
306
  "special": true
307
  },
308
- "8034": {
309
  "content": "<extra_id_65>",
310
  "lstrip": false,
311
  "normalized": false,
@@ -313,7 +313,7 @@
313
  "single_word": false,
314
  "special": true
315
  },
316
- "8035": {
317
  "content": "<extra_id_64>",
318
  "lstrip": false,
319
  "normalized": false,
@@ -321,7 +321,7 @@
321
  "single_word": false,
322
  "special": true
323
  },
324
- "8036": {
325
  "content": "<extra_id_63>",
326
  "lstrip": false,
327
  "normalized": false,
@@ -329,7 +329,7 @@
329
  "single_word": false,
330
  "special": true
331
  },
332
- "8037": {
333
  "content": "<extra_id_62>",
334
  "lstrip": false,
335
  "normalized": false,
@@ -337,7 +337,7 @@
337
  "single_word": false,
338
  "special": true
339
  },
340
- "8038": {
341
  "content": "<extra_id_61>",
342
  "lstrip": false,
343
  "normalized": false,
@@ -345,7 +345,7 @@
345
  "single_word": false,
346
  "special": true
347
  },
348
- "8039": {
349
  "content": "<extra_id_60>",
350
  "lstrip": false,
351
  "normalized": false,
@@ -353,7 +353,7 @@
353
  "single_word": false,
354
  "special": true
355
  },
356
- "8040": {
357
  "content": "<extra_id_59>",
358
  "lstrip": false,
359
  "normalized": false,
@@ -361,7 +361,7 @@
361
  "single_word": false,
362
  "special": true
363
  },
364
- "8041": {
365
  "content": "<extra_id_58>",
366
  "lstrip": false,
367
  "normalized": false,
@@ -369,7 +369,7 @@
369
  "single_word": false,
370
  "special": true
371
  },
372
- "8042": {
373
  "content": "<extra_id_57>",
374
  "lstrip": false,
375
  "normalized": false,
@@ -377,7 +377,7 @@
377
  "single_word": false,
378
  "special": true
379
  },
380
- "8043": {
381
  "content": "<extra_id_56>",
382
  "lstrip": false,
383
  "normalized": false,
@@ -385,7 +385,7 @@
385
  "single_word": false,
386
  "special": true
387
  },
388
- "8044": {
389
  "content": "<extra_id_55>",
390
  "lstrip": false,
391
  "normalized": false,
@@ -393,7 +393,7 @@
393
  "single_word": false,
394
  "special": true
395
  },
396
- "8045": {
397
  "content": "<extra_id_54>",
398
  "lstrip": false,
399
  "normalized": false,
@@ -401,7 +401,7 @@
401
  "single_word": false,
402
  "special": true
403
  },
404
- "8046": {
405
  "content": "<extra_id_53>",
406
  "lstrip": false,
407
  "normalized": false,
@@ -409,7 +409,7 @@
409
  "single_word": false,
410
  "special": true
411
  },
412
- "8047": {
413
  "content": "<extra_id_52>",
414
  "lstrip": false,
415
  "normalized": false,
@@ -417,7 +417,7 @@
417
  "single_word": false,
418
  "special": true
419
  },
420
- "8048": {
421
  "content": "<extra_id_51>",
422
  "lstrip": false,
423
  "normalized": false,
@@ -425,7 +425,7 @@
425
  "single_word": false,
426
  "special": true
427
  },
428
- "8049": {
429
  "content": "<extra_id_50>",
430
  "lstrip": false,
431
  "normalized": false,
@@ -433,7 +433,7 @@
433
  "single_word": false,
434
  "special": true
435
  },
436
- "8050": {
437
  "content": "<extra_id_49>",
438
  "lstrip": false,
439
  "normalized": false,
@@ -441,7 +441,7 @@
441
  "single_word": false,
442
  "special": true
443
  },
444
- "8051": {
445
  "content": "<extra_id_48>",
446
  "lstrip": false,
447
  "normalized": false,
@@ -449,7 +449,7 @@
449
  "single_word": false,
450
  "special": true
451
  },
452
- "8052": {
453
  "content": "<extra_id_47>",
454
  "lstrip": false,
455
  "normalized": false,
@@ -457,7 +457,7 @@
457
  "single_word": false,
458
  "special": true
459
  },
460
- "8053": {
461
  "content": "<extra_id_46>",
462
  "lstrip": false,
463
  "normalized": false,
@@ -465,7 +465,7 @@
465
  "single_word": false,
466
  "special": true
467
  },
468
- "8054": {
469
  "content": "<extra_id_45>",
470
  "lstrip": false,
471
  "normalized": false,
@@ -473,7 +473,7 @@
473
  "single_word": false,
474
  "special": true
475
  },
476
- "8055": {
477
  "content": "<extra_id_44>",
478
  "lstrip": false,
479
  "normalized": false,
@@ -481,7 +481,7 @@
481
  "single_word": false,
482
  "special": true
483
  },
484
- "8056": {
485
  "content": "<extra_id_43>",
486
  "lstrip": false,
487
  "normalized": false,
@@ -489,7 +489,7 @@
489
  "single_word": false,
490
  "special": true
491
  },
492
- "8057": {
493
  "content": "<extra_id_42>",
494
  "lstrip": false,
495
  "normalized": false,
@@ -497,7 +497,7 @@
497
  "single_word": false,
498
  "special": true
499
  },
500
- "8058": {
501
  "content": "<extra_id_41>",
502
  "lstrip": false,
503
  "normalized": false,
@@ -505,7 +505,7 @@
505
  "single_word": false,
506
  "special": true
507
  },
508
- "8059": {
509
  "content": "<extra_id_40>",
510
  "lstrip": false,
511
  "normalized": false,
@@ -513,7 +513,7 @@
513
  "single_word": false,
514
  "special": true
515
  },
516
- "8060": {
517
  "content": "<extra_id_39>",
518
  "lstrip": false,
519
  "normalized": false,
@@ -521,7 +521,7 @@
521
  "single_word": false,
522
  "special": true
523
  },
524
- "8061": {
525
  "content": "<extra_id_38>",
526
  "lstrip": false,
527
  "normalized": false,
@@ -529,7 +529,7 @@
529
  "single_word": false,
530
  "special": true
531
  },
532
- "8062": {
533
  "content": "<extra_id_37>",
534
  "lstrip": false,
535
  "normalized": false,
@@ -537,7 +537,7 @@
537
  "single_word": false,
538
  "special": true
539
  },
540
- "8063": {
541
  "content": "<extra_id_36>",
542
  "lstrip": false,
543
  "normalized": false,
@@ -545,7 +545,7 @@
545
  "single_word": false,
546
  "special": true
547
  },
548
- "8064": {
549
  "content": "<extra_id_35>",
550
  "lstrip": false,
551
  "normalized": false,
@@ -553,7 +553,7 @@
553
  "single_word": false,
554
  "special": true
555
  },
556
- "8065": {
557
  "content": "<extra_id_34>",
558
  "lstrip": false,
559
  "normalized": false,
@@ -561,7 +561,7 @@
561
  "single_word": false,
562
  "special": true
563
  },
564
- "8066": {
565
  "content": "<extra_id_33>",
566
  "lstrip": false,
567
  "normalized": false,
@@ -569,7 +569,7 @@
569
  "single_word": false,
570
  "special": true
571
  },
572
- "8067": {
573
  "content": "<extra_id_32>",
574
  "lstrip": false,
575
  "normalized": false,
@@ -577,7 +577,7 @@
577
  "single_word": false,
578
  "special": true
579
  },
580
- "8068": {
581
  "content": "<extra_id_31>",
582
  "lstrip": false,
583
  "normalized": false,
@@ -585,7 +585,7 @@
585
  "single_word": false,
586
  "special": true
587
  },
588
- "8069": {
589
  "content": "<extra_id_30>",
590
  "lstrip": false,
591
  "normalized": false,
@@ -593,7 +593,7 @@
593
  "single_word": false,
594
  "special": true
595
  },
596
- "8070": {
597
  "content": "<extra_id_29>",
598
  "lstrip": false,
599
  "normalized": false,
@@ -601,7 +601,7 @@
601
  "single_word": false,
602
  "special": true
603
  },
604
- "8071": {
605
  "content": "<extra_id_28>",
606
  "lstrip": false,
607
  "normalized": false,
@@ -609,7 +609,7 @@
609
  "single_word": false,
610
  "special": true
611
  },
612
- "8072": {
613
  "content": "<extra_id_27>",
614
  "lstrip": false,
615
  "normalized": false,
@@ -617,7 +617,7 @@
617
  "single_word": false,
618
  "special": true
619
  },
620
- "8073": {
621
  "content": "<extra_id_26>",
622
  "lstrip": false,
623
  "normalized": false,
@@ -625,7 +625,7 @@
625
  "single_word": false,
626
  "special": true
627
  },
628
- "8074": {
629
  "content": "<extra_id_25>",
630
  "lstrip": false,
631
  "normalized": false,
@@ -633,7 +633,7 @@
633
  "single_word": false,
634
  "special": true
635
  },
636
- "8075": {
637
  "content": "<extra_id_24>",
638
  "lstrip": false,
639
  "normalized": false,
@@ -641,7 +641,7 @@
641
  "single_word": false,
642
  "special": true
643
  },
644
- "8076": {
645
  "content": "<extra_id_23>",
646
  "lstrip": false,
647
  "normalized": false,
@@ -649,7 +649,7 @@
649
  "single_word": false,
650
  "special": true
651
  },
652
- "8077": {
653
  "content": "<extra_id_22>",
654
  "lstrip": false,
655
  "normalized": false,
@@ -657,7 +657,7 @@
657
  "single_word": false,
658
  "special": true
659
  },
660
- "8078": {
661
  "content": "<extra_id_21>",
662
  "lstrip": false,
663
  "normalized": false,
@@ -665,7 +665,7 @@
665
  "single_word": false,
666
  "special": true
667
  },
668
- "8079": {
669
  "content": "<extra_id_20>",
670
  "lstrip": false,
671
  "normalized": false,
@@ -673,7 +673,7 @@
673
  "single_word": false,
674
  "special": true
675
  },
676
- "8080": {
677
  "content": "<extra_id_19>",
678
  "lstrip": false,
679
  "normalized": false,
@@ -681,7 +681,7 @@
681
  "single_word": false,
682
  "special": true
683
  },
684
- "8081": {
685
  "content": "<extra_id_18>",
686
  "lstrip": false,
687
  "normalized": false,
@@ -689,7 +689,7 @@
689
  "single_word": false,
690
  "special": true
691
  },
692
- "8082": {
693
  "content": "<extra_id_17>",
694
  "lstrip": false,
695
  "normalized": false,
@@ -697,7 +697,7 @@
697
  "single_word": false,
698
  "special": true
699
  },
700
- "8083": {
701
  "content": "<extra_id_16>",
702
  "lstrip": false,
703
  "normalized": false,
@@ -705,7 +705,7 @@
705
  "single_word": false,
706
  "special": true
707
  },
708
- "8084": {
709
  "content": "<extra_id_15>",
710
  "lstrip": false,
711
  "normalized": false,
@@ -713,7 +713,7 @@
713
  "single_word": false,
714
  "special": true
715
  },
716
- "8085": {
717
  "content": "<extra_id_14>",
718
  "lstrip": false,
719
  "normalized": false,
@@ -721,7 +721,7 @@
721
  "single_word": false,
722
  "special": true
723
  },
724
- "8086": {
725
  "content": "<extra_id_13>",
726
  "lstrip": false,
727
  "normalized": false,
@@ -729,7 +729,7 @@
729
  "single_word": false,
730
  "special": true
731
  },
732
- "8087": {
733
  "content": "<extra_id_12>",
734
  "lstrip": false,
735
  "normalized": false,
@@ -737,7 +737,7 @@
737
  "single_word": false,
738
  "special": true
739
  },
740
- "8088": {
741
  "content": "<extra_id_11>",
742
  "lstrip": false,
743
  "normalized": false,
@@ -745,7 +745,7 @@
745
  "single_word": false,
746
  "special": true
747
  },
748
- "8089": {
749
  "content": "<extra_id_10>",
750
  "lstrip": false,
751
  "normalized": false,
@@ -753,7 +753,7 @@
753
  "single_word": false,
754
  "special": true
755
  },
756
- "8090": {
757
  "content": "<extra_id_9>",
758
  "lstrip": false,
759
  "normalized": false,
@@ -761,7 +761,7 @@
761
  "single_word": false,
762
  "special": true
763
  },
764
- "8091": {
765
  "content": "<extra_id_8>",
766
  "lstrip": false,
767
  "normalized": false,
@@ -769,7 +769,7 @@
769
  "single_word": false,
770
  "special": true
771
  },
772
- "8092": {
773
  "content": "<extra_id_7>",
774
  "lstrip": false,
775
  "normalized": false,
@@ -777,7 +777,7 @@
777
  "single_word": false,
778
  "special": true
779
  },
780
- "8093": {
781
  "content": "<extra_id_6>",
782
  "lstrip": false,
783
  "normalized": false,
@@ -785,7 +785,7 @@
785
  "single_word": false,
786
  "special": true
787
  },
788
- "8094": {
789
  "content": "<extra_id_5>",
790
  "lstrip": false,
791
  "normalized": false,
@@ -793,7 +793,7 @@
793
  "single_word": false,
794
  "special": true
795
  },
796
- "8095": {
797
  "content": "<extra_id_4>",
798
  "lstrip": false,
799
  "normalized": false,
@@ -801,7 +801,7 @@
801
  "single_word": false,
802
  "special": true
803
  },
804
- "8096": {
805
  "content": "<extra_id_3>",
806
  "lstrip": false,
807
  "normalized": false,
@@ -809,7 +809,7 @@
809
  "single_word": false,
810
  "special": true
811
  },
812
- "8097": {
813
  "content": "<extra_id_2>",
814
  "lstrip": false,
815
  "normalized": false,
@@ -817,7 +817,7 @@
817
  "single_word": false,
818
  "special": true
819
  },
820
- "8098": {
821
  "content": "<extra_id_1>",
822
  "lstrip": false,
823
  "normalized": false,
@@ -825,7 +825,7 @@
825
  "single_word": false,
826
  "special": true
827
  },
828
- "8099": {
829
  "content": "<extra_id_0>",
830
  "lstrip": false,
831
  "normalized": false,
 
33
  "single_word": false,
34
  "special": true
35
  },
36
+ "4000": {
37
  "content": "<extra_id_99>",
38
  "lstrip": false,
39
  "normalized": false,
 
41
  "single_word": false,
42
  "special": true
43
  },
44
+ "4001": {
45
  "content": "<extra_id_98>",
46
  "lstrip": false,
47
  "normalized": false,
 
49
  "single_word": false,
50
  "special": true
51
  },
52
+ "4002": {
53
  "content": "<extra_id_97>",
54
  "lstrip": false,
55
  "normalized": false,
 
57
  "single_word": false,
58
  "special": true
59
  },
60
+ "4003": {
61
  "content": "<extra_id_96>",
62
  "lstrip": false,
63
  "normalized": false,
 
65
  "single_word": false,
66
  "special": true
67
  },
68
+ "4004": {
69
  "content": "<extra_id_95>",
70
  "lstrip": false,
71
  "normalized": false,
 
73
  "single_word": false,
74
  "special": true
75
  },
76
+ "4005": {
77
  "content": "<extra_id_94>",
78
  "lstrip": false,
79
  "normalized": false,
 
81
  "single_word": false,
82
  "special": true
83
  },
84
+ "4006": {
85
  "content": "<extra_id_93>",
86
  "lstrip": false,
87
  "normalized": false,
 
89
  "single_word": false,
90
  "special": true
91
  },
92
+ "4007": {
93
  "content": "<extra_id_92>",
94
  "lstrip": false,
95
  "normalized": false,
 
97
  "single_word": false,
98
  "special": true
99
  },
100
+ "4008": {
101
  "content": "<extra_id_91>",
102
  "lstrip": false,
103
  "normalized": false,
 
105
  "single_word": false,
106
  "special": true
107
  },
108
+ "4009": {
109
  "content": "<extra_id_90>",
110
  "lstrip": false,
111
  "normalized": false,
 
113
  "single_word": false,
114
  "special": true
115
  },
116
+ "4010": {
117
  "content": "<extra_id_89>",
118
  "lstrip": false,
119
  "normalized": false,
 
121
  "single_word": false,
122
  "special": true
123
  },
124
+ "4011": {
125
  "content": "<extra_id_88>",
126
  "lstrip": false,
127
  "normalized": false,
 
129
  "single_word": false,
130
  "special": true
131
  },
132
+ "4012": {
133
  "content": "<extra_id_87>",
134
  "lstrip": false,
135
  "normalized": false,
 
137
  "single_word": false,
138
  "special": true
139
  },
140
+ "4013": {
141
  "content": "<extra_id_86>",
142
  "lstrip": false,
143
  "normalized": false,
 
145
  "single_word": false,
146
  "special": true
147
  },
148
+ "4014": {
149
  "content": "<extra_id_85>",
150
  "lstrip": false,
151
  "normalized": false,
 
153
  "single_word": false,
154
  "special": true
155
  },
156
+ "4015": {
157
  "content": "<extra_id_84>",
158
  "lstrip": false,
159
  "normalized": false,
 
161
  "single_word": false,
162
  "special": true
163
  },
164
+ "4016": {
165
  "content": "<extra_id_83>",
166
  "lstrip": false,
167
  "normalized": false,
 
169
  "single_word": false,
170
  "special": true
171
  },
172
+ "4017": {
173
  "content": "<extra_id_82>",
174
  "lstrip": false,
175
  "normalized": false,
 
177
  "single_word": false,
178
  "special": true
179
  },
180
+ "4018": {
181
  "content": "<extra_id_81>",
182
  "lstrip": false,
183
  "normalized": false,
 
185
  "single_word": false,
186
  "special": true
187
  },
188
+ "4019": {
189
  "content": "<extra_id_80>",
190
  "lstrip": false,
191
  "normalized": false,
 
193
  "single_word": false,
194
  "special": true
195
  },
196
+ "4020": {
197
  "content": "<extra_id_79>",
198
  "lstrip": false,
199
  "normalized": false,
 
201
  "single_word": false,
202
  "special": true
203
  },
204
+ "4021": {
205
  "content": "<extra_id_78>",
206
  "lstrip": false,
207
  "normalized": false,
 
209
  "single_word": false,
210
  "special": true
211
  },
212
+ "4022": {
213
  "content": "<extra_id_77>",
214
  "lstrip": false,
215
  "normalized": false,
 
217
  "single_word": false,
218
  "special": true
219
  },
220
+ "4023": {
221
  "content": "<extra_id_76>",
222
  "lstrip": false,
223
  "normalized": false,
 
225
  "single_word": false,
226
  "special": true
227
  },
228
+ "4024": {
229
  "content": "<extra_id_75>",
230
  "lstrip": false,
231
  "normalized": false,
 
233
  "single_word": false,
234
  "special": true
235
  },
236
+ "4025": {
237
  "content": "<extra_id_74>",
238
  "lstrip": false,
239
  "normalized": false,
 
241
  "single_word": false,
242
  "special": true
243
  },
244
+ "4026": {
245
  "content": "<extra_id_73>",
246
  "lstrip": false,
247
  "normalized": false,
 
249
  "single_word": false,
250
  "special": true
251
  },
252
+ "4027": {
253
  "content": "<extra_id_72>",
254
  "lstrip": false,
255
  "normalized": false,
 
257
  "single_word": false,
258
  "special": true
259
  },
260
+ "4028": {
261
  "content": "<extra_id_71>",
262
  "lstrip": false,
263
  "normalized": false,
 
265
  "single_word": false,
266
  "special": true
267
  },
268
+ "4029": {
269
  "content": "<extra_id_70>",
270
  "lstrip": false,
271
  "normalized": false,
 
273
  "single_word": false,
274
  "special": true
275
  },
276
+ "4030": {
277
  "content": "<extra_id_69>",
278
  "lstrip": false,
279
  "normalized": false,
 
281
  "single_word": false,
282
  "special": true
283
  },
284
+ "4031": {
285
  "content": "<extra_id_68>",
286
  "lstrip": false,
287
  "normalized": false,
 
289
  "single_word": false,
290
  "special": true
291
  },
292
+ "4032": {
293
  "content": "<extra_id_67>",
294
  "lstrip": false,
295
  "normalized": false,
 
297
  "single_word": false,
298
  "special": true
299
  },
300
+ "4033": {
301
  "content": "<extra_id_66>",
302
  "lstrip": false,
303
  "normalized": false,
 
305
  "single_word": false,
306
  "special": true
307
  },
308
+ "4034": {
309
  "content": "<extra_id_65>",
310
  "lstrip": false,
311
  "normalized": false,
 
313
  "single_word": false,
314
  "special": true
315
  },
316
+ "4035": {
317
  "content": "<extra_id_64>",
318
  "lstrip": false,
319
  "normalized": false,
 
321
  "single_word": false,
322
  "special": true
323
  },
324
+ "4036": {
325
  "content": "<extra_id_63>",
326
  "lstrip": false,
327
  "normalized": false,
 
329
  "single_word": false,
330
  "special": true
331
  },
332
+ "4037": {
333
  "content": "<extra_id_62>",
334
  "lstrip": false,
335
  "normalized": false,
 
337
  "single_word": false,
338
  "special": true
339
  },
340
+ "4038": {
341
  "content": "<extra_id_61>",
342
  "lstrip": false,
343
  "normalized": false,
 
345
  "single_word": false,
346
  "special": true
347
  },
348
+ "4039": {
349
  "content": "<extra_id_60>",
350
  "lstrip": false,
351
  "normalized": false,
 
353
  "single_word": false,
354
  "special": true
355
  },
356
+ "4040": {
357
  "content": "<extra_id_59>",
358
  "lstrip": false,
359
  "normalized": false,
 
361
  "single_word": false,
362
  "special": true
363
  },
364
+ "4041": {
365
  "content": "<extra_id_58>",
366
  "lstrip": false,
367
  "normalized": false,
 
369
  "single_word": false,
370
  "special": true
371
  },
372
+ "4042": {
373
  "content": "<extra_id_57>",
374
  "lstrip": false,
375
  "normalized": false,
 
377
  "single_word": false,
378
  "special": true
379
  },
380
+ "4043": {
381
  "content": "<extra_id_56>",
382
  "lstrip": false,
383
  "normalized": false,
 
385
  "single_word": false,
386
  "special": true
387
  },
388
+ "4044": {
389
  "content": "<extra_id_55>",
390
  "lstrip": false,
391
  "normalized": false,
 
393
  "single_word": false,
394
  "special": true
395
  },
396
+ "4045": {
397
  "content": "<extra_id_54>",
398
  "lstrip": false,
399
  "normalized": false,
 
401
  "single_word": false,
402
  "special": true
403
  },
404
+ "4046": {
405
  "content": "<extra_id_53>",
406
  "lstrip": false,
407
  "normalized": false,
 
409
  "single_word": false,
410
  "special": true
411
  },
412
+ "4047": {
413
  "content": "<extra_id_52>",
414
  "lstrip": false,
415
  "normalized": false,
 
417
  "single_word": false,
418
  "special": true
419
  },
420
+ "4048": {
421
  "content": "<extra_id_51>",
422
  "lstrip": false,
423
  "normalized": false,
 
425
  "single_word": false,
426
  "special": true
427
  },
428
+ "4049": {
429
  "content": "<extra_id_50>",
430
  "lstrip": false,
431
  "normalized": false,
 
433
  "single_word": false,
434
  "special": true
435
  },
436
+ "4050": {
437
  "content": "<extra_id_49>",
438
  "lstrip": false,
439
  "normalized": false,
 
441
  "single_word": false,
442
  "special": true
443
  },
444
+ "4051": {
445
  "content": "<extra_id_48>",
446
  "lstrip": false,
447
  "normalized": false,
 
449
  "single_word": false,
450
  "special": true
451
  },
452
+ "4052": {
453
  "content": "<extra_id_47>",
454
  "lstrip": false,
455
  "normalized": false,
 
457
  "single_word": false,
458
  "special": true
459
  },
460
+ "4053": {
461
  "content": "<extra_id_46>",
462
  "lstrip": false,
463
  "normalized": false,
 
465
  "single_word": false,
466
  "special": true
467
  },
468
+ "4054": {
469
  "content": "<extra_id_45>",
470
  "lstrip": false,
471
  "normalized": false,
 
473
  "single_word": false,
474
  "special": true
475
  },
476
+ "4055": {
477
  "content": "<extra_id_44>",
478
  "lstrip": false,
479
  "normalized": false,
 
481
  "single_word": false,
482
  "special": true
483
  },
484
+ "4056": {
485
  "content": "<extra_id_43>",
486
  "lstrip": false,
487
  "normalized": false,
 
489
  "single_word": false,
490
  "special": true
491
  },
492
+ "4057": {
493
  "content": "<extra_id_42>",
494
  "lstrip": false,
495
  "normalized": false,
 
497
  "single_word": false,
498
  "special": true
499
  },
500
+ "4058": {
501
  "content": "<extra_id_41>",
502
  "lstrip": false,
503
  "normalized": false,
 
505
  "single_word": false,
506
  "special": true
507
  },
508
+ "4059": {
509
  "content": "<extra_id_40>",
510
  "lstrip": false,
511
  "normalized": false,
 
513
  "single_word": false,
514
  "special": true
515
  },
516
+ "4060": {
517
  "content": "<extra_id_39>",
518
  "lstrip": false,
519
  "normalized": false,
 
521
  "single_word": false,
522
  "special": true
523
  },
524
+ "4061": {
525
  "content": "<extra_id_38>",
526
  "lstrip": false,
527
  "normalized": false,
 
529
  "single_word": false,
530
  "special": true
531
  },
532
+ "4062": {
533
  "content": "<extra_id_37>",
534
  "lstrip": false,
535
  "normalized": false,
 
537
  "single_word": false,
538
  "special": true
539
  },
540
+ "4063": {
541
  "content": "<extra_id_36>",
542
  "lstrip": false,
543
  "normalized": false,
 
545
  "single_word": false,
546
  "special": true
547
  },
548
+ "4064": {
549
  "content": "<extra_id_35>",
550
  "lstrip": false,
551
  "normalized": false,
 
553
  "single_word": false,
554
  "special": true
555
  },
556
+ "4065": {
557
  "content": "<extra_id_34>",
558
  "lstrip": false,
559
  "normalized": false,
 
561
  "single_word": false,
562
  "special": true
563
  },
564
+ "4066": {
565
  "content": "<extra_id_33>",
566
  "lstrip": false,
567
  "normalized": false,
 
569
  "single_word": false,
570
  "special": true
571
  },
572
+ "4067": {
573
  "content": "<extra_id_32>",
574
  "lstrip": false,
575
  "normalized": false,
 
577
  "single_word": false,
578
  "special": true
579
  },
580
+ "4068": {
581
  "content": "<extra_id_31>",
582
  "lstrip": false,
583
  "normalized": false,
 
585
  "single_word": false,
586
  "special": true
587
  },
588
+ "4069": {
589
  "content": "<extra_id_30>",
590
  "lstrip": false,
591
  "normalized": false,
 
593
  "single_word": false,
594
  "special": true
595
  },
596
+ "4070": {
597
  "content": "<extra_id_29>",
598
  "lstrip": false,
599
  "normalized": false,
 
601
  "single_word": false,
602
  "special": true
603
  },
604
+ "4071": {
605
  "content": "<extra_id_28>",
606
  "lstrip": false,
607
  "normalized": false,
 
609
  "single_word": false,
610
  "special": true
611
  },
612
+ "4072": {
613
  "content": "<extra_id_27>",
614
  "lstrip": false,
615
  "normalized": false,
 
617
  "single_word": false,
618
  "special": true
619
  },
620
+ "4073": {
621
  "content": "<extra_id_26>",
622
  "lstrip": false,
623
  "normalized": false,
 
625
  "single_word": false,
626
  "special": true
627
  },
628
+ "4074": {
629
  "content": "<extra_id_25>",
630
  "lstrip": false,
631
  "normalized": false,
 
633
  "single_word": false,
634
  "special": true
635
  },
636
+ "4075": {
637
  "content": "<extra_id_24>",
638
  "lstrip": false,
639
  "normalized": false,
 
641
  "single_word": false,
642
  "special": true
643
  },
644
+ "4076": {
645
  "content": "<extra_id_23>",
646
  "lstrip": false,
647
  "normalized": false,
 
649
  "single_word": false,
650
  "special": true
651
  },
652
+ "4077": {
653
  "content": "<extra_id_22>",
654
  "lstrip": false,
655
  "normalized": false,
 
657
  "single_word": false,
658
  "special": true
659
  },
660
+ "4078": {
661
  "content": "<extra_id_21>",
662
  "lstrip": false,
663
  "normalized": false,
 
665
  "single_word": false,
666
  "special": true
667
  },
668
+ "4079": {
669
  "content": "<extra_id_20>",
670
  "lstrip": false,
671
  "normalized": false,
 
673
  "single_word": false,
674
  "special": true
675
  },
676
+ "4080": {
677
  "content": "<extra_id_19>",
678
  "lstrip": false,
679
  "normalized": false,
 
681
  "single_word": false,
682
  "special": true
683
  },
684
+ "4081": {
685
  "content": "<extra_id_18>",
686
  "lstrip": false,
687
  "normalized": false,
 
689
  "single_word": false,
690
  "special": true
691
  },
692
+ "4082": {
693
  "content": "<extra_id_17>",
694
  "lstrip": false,
695
  "normalized": false,
 
697
  "single_word": false,
698
  "special": true
699
  },
700
+ "4083": {
701
  "content": "<extra_id_16>",
702
  "lstrip": false,
703
  "normalized": false,
 
705
  "single_word": false,
706
  "special": true
707
  },
708
+ "4084": {
709
  "content": "<extra_id_15>",
710
  "lstrip": false,
711
  "normalized": false,
 
713
  "single_word": false,
714
  "special": true
715
  },
716
+ "4085": {
717
  "content": "<extra_id_14>",
718
  "lstrip": false,
719
  "normalized": false,
 
721
  "single_word": false,
722
  "special": true
723
  },
724
+ "4086": {
725
  "content": "<extra_id_13>",
726
  "lstrip": false,
727
  "normalized": false,
 
729
  "single_word": false,
730
  "special": true
731
  },
732
+ "4087": {
733
  "content": "<extra_id_12>",
734
  "lstrip": false,
735
  "normalized": false,
 
737
  "single_word": false,
738
  "special": true
739
  },
740
+ "4088": {
741
  "content": "<extra_id_11>",
742
  "lstrip": false,
743
  "normalized": false,
 
745
  "single_word": false,
746
  "special": true
747
  },
748
+ "4089": {
749
  "content": "<extra_id_10>",
750
  "lstrip": false,
751
  "normalized": false,
 
753
  "single_word": false,
754
  "special": true
755
  },
756
+ "4090": {
757
  "content": "<extra_id_9>",
758
  "lstrip": false,
759
  "normalized": false,
 
761
  "single_word": false,
762
  "special": true
763
  },
764
+ "4091": {
765
  "content": "<extra_id_8>",
766
  "lstrip": false,
767
  "normalized": false,
 
769
  "single_word": false,
770
  "special": true
771
  },
772
+ "4092": {
773
  "content": "<extra_id_7>",
774
  "lstrip": false,
775
  "normalized": false,
 
777
  "single_word": false,
778
  "special": true
779
  },
780
+ "4093": {
781
  "content": "<extra_id_6>",
782
  "lstrip": false,
783
  "normalized": false,
 
785
  "single_word": false,
786
  "special": true
787
  },
788
+ "4094": {
789
  "content": "<extra_id_5>",
790
  "lstrip": false,
791
  "normalized": false,
 
793
  "single_word": false,
794
  "special": true
795
  },
796
+ "4095": {
797
  "content": "<extra_id_4>",
798
  "lstrip": false,
799
  "normalized": false,
 
801
  "single_word": false,
802
  "special": true
803
  },
804
+ "4096": {
805
  "content": "<extra_id_3>",
806
  "lstrip": false,
807
  "normalized": false,
 
809
  "single_word": false,
810
  "special": true
811
  },
812
+ "4097": {
813
  "content": "<extra_id_2>",
814
  "lstrip": false,
815
  "normalized": false,
 
817
  "single_word": false,
818
  "special": true
819
  },
820
+ "4098": {
821
  "content": "<extra_id_1>",
822
  "lstrip": false,
823
  "normalized": false,
 
825
  "single_word": false,
826
  "special": true
827
  },
828
+ "4099": {
829
  "content": "<extra_id_0>",
830
  "lstrip": false,
831
  "normalized": false,