AmitMY commited on
Commit
b1f5033
1 Parent(s): 201f656

Upload folder using huggingface_hub

Browse files
Files changed (8) hide show
  1. args.yaml +20 -16
  2. config +67 -451
  3. metrics +0 -0
  4. params.best +2 -2
  5. vocab.src.0.json +0 -0
  6. vocab.trg.0.json +511 -511
  7. vocab.trg.3.json +410 -426
  8. vocab.trg.4.json +623 -623
args.yaml CHANGED
@@ -24,8 +24,8 @@ dist: false
24
  dry_run: false
25
  dtype: float32
26
  embed_dropout:
27
- - 0.0
28
- - 0.0
29
  encoder: transformer
30
  end_of_prepending_tag: null
31
  env: null
@@ -37,12 +37,12 @@ ignore_extra_params: false
37
  initial_learning_rate: 0.0002
38
  keep_initializations: false
39
  keep_last_params: -1
40
- label_smoothing: 0.1
41
- label_smoothing_impl: mxnet
42
- learning_rate_reduce_factor: 0.9
43
  learning_rate_reduce_num_not_improved: 8
44
  learning_rate_scheduler_type: plateau-reduce
45
- learning_rate_warmup: 0
46
  length_task: null
47
  length_task_layers: 1
48
  length_task_weight: 1.0
@@ -65,7 +65,7 @@ min_updates: null
65
  momentum: 0.0
66
  neural_vocab_selection: null
67
  neural_vocab_selection_block_loss: false
68
- no_bucketing: false
69
  no_logfile: false
70
  no_reload_on_learning_rate_reduce: false
71
  num_embed:
@@ -83,11 +83,11 @@ optimizer_betas:
83
  - 0.9
84
  - 0.999
85
  optimizer_eps: 1.0e-08
86
- output: /shares/volk.cl.uzh/amoryo/checkpoints/signwriting-translation/spoken-to-signed/target-factors/model
87
  overwrite_output: false
88
  pad_vocab_to_multiple_of: 8
89
  params: null
90
- prepared_data: /shares/volk.cl.uzh/amoryo/checkpoints/signwriting-translation/spoken-to-signed/target-factors/train_data
91
  quiet: false
92
  quiet_secondary_workers: false
93
  seed: 1
@@ -117,7 +117,7 @@ target_factors_share_embedding:
117
  - false
118
  target_factors_use_target_vocab: []
119
  target_factors_weight:
120
- - 1.0
121
  target_vocab: null
122
  tf32: true
123
  transformer_activation_type:
@@ -127,11 +127,15 @@ transformer_attention_heads:
127
  - 8
128
  - 8
129
  transformer_block_prepended_cross_attention: false
130
- transformer_dropout_act: &id001
131
- - 0.1
132
- - 0.1
133
- transformer_dropout_attention: *id001
134
- transformer_dropout_prepost: *id001
 
 
 
 
135
  transformer_feed_forward_num_hidden:
136
  - 2048
137
  - 2048
@@ -157,7 +161,7 @@ validation_target_factors:
157
  - /home/amoryo/sign-language/signwriting-translation/parallel/spoken-to-signed/test/target_3.txt
158
  - /home/amoryo/sign-language/signwriting-translation/parallel/spoken-to-signed/test/target_4.txt
159
  weight_decay: 0.0
160
- weight_tying_type: none
161
  word_min_count:
162
  - 1
163
  - 1
 
24
  dry_run: false
25
  dtype: float32
26
  embed_dropout:
27
+ - 0.5
28
+ - 0.5
29
  encoder: transformer
30
  end_of_prepending_tag: null
31
  env: null
 
37
  initial_learning_rate: 0.0002
38
  keep_initializations: false
39
  keep_last_params: -1
40
+ label_smoothing: 0.2
41
+ label_smoothing_impl: torch
42
+ learning_rate_reduce_factor: 0.7
43
  learning_rate_reduce_num_not_improved: 8
44
  learning_rate_scheduler_type: plateau-reduce
45
+ learning_rate_warmup: 1000
46
  length_task: null
47
  length_task_layers: 1
48
  length_task_weight: 1.0
 
65
  momentum: 0.0
66
  neural_vocab_selection: null
67
  neural_vocab_selection_block_loss: false
68
+ no_bucketing: true
69
  no_logfile: false
70
  no_reload_on_learning_rate_reduce: false
71
  num_embed:
 
83
  - 0.9
84
  - 0.999
85
  optimizer_eps: 1.0e-08
86
+ output: /shares/volk.cl.uzh/amoryo/checkpoints/signwriting-translation/spoken-to-signed/target-factors-v2/model
87
  overwrite_output: false
88
  pad_vocab_to_multiple_of: 8
89
  params: null
90
+ prepared_data: /shares/volk.cl.uzh/amoryo/checkpoints/signwriting-translation/spoken-to-signed/target-factors-v2/train_data
91
  quiet: false
92
  quiet_secondary_workers: false
93
  seed: 1
 
117
  - false
118
  target_factors_use_target_vocab: []
119
  target_factors_weight:
120
+ - 0.2
121
  target_vocab: null
122
  tf32: true
123
  transformer_activation_type:
 
127
  - 8
128
  - 8
129
  transformer_block_prepended_cross_attention: false
130
+ transformer_dropout_act:
131
+ - 0.2
132
+ - 0.2
133
+ transformer_dropout_attention:
134
+ - 0.2
135
+ - 0.2
136
+ transformer_dropout_prepost:
137
+ - 0.2
138
+ - 0.2
139
  transformer_feed_forward_num_hidden:
140
  - 2048
141
  - 2048
 
161
  - /home/amoryo/sign-language/signwriting-translation/parallel/spoken-to-signed/test/target_3.txt
162
  - /home/amoryo/sign-language/signwriting-translation/parallel/spoken-to-signed/test/target_4.txt
163
  weight_decay: 0.0
164
+ weight_tying_type: trg_softmax
165
  word_min_count:
166
  - 1
167
  - 1
config CHANGED
@@ -2,17 +2,17 @@
2
  config_data: !DataConfig
3
  data_statistics: !DataStatistics
4
  average_len_target_per_bucket:
5
- - 6.040778074691487
6
- - 10.416473840619558
7
- - 18.327804728395527
8
- - 25.791204037491006
9
- - 32.56783587028452
10
- - 41.453461051870526
11
- - 51.20251734710334
12
- - 59.77397260273977
13
- - 68.1539108494533
14
- - 75.68548175374133
15
- - 82.77498996386987
16
  - 18.47619047619048
17
  - 8.058823529411766
18
  - 5.647058823529413
@@ -67,70 +67,6 @@ config_data: !DataConfig
67
  - null
68
  - null
69
  - null
70
- - null
71
- - null
72
- - null
73
- - null
74
- - null
75
- - null
76
- - null
77
- - null
78
- - null
79
- - null
80
- - null
81
- - null
82
- - null
83
- - null
84
- - null
85
- - null
86
- - null
87
- - null
88
- - null
89
- - null
90
- - null
91
- - null
92
- - null
93
- - null
94
- - null
95
- - null
96
- - null
97
- - null
98
- - null
99
- - null
100
- - null
101
- - null
102
- - null
103
- - null
104
- - null
105
- - null
106
- - null
107
- - null
108
- - null
109
- - null
110
- - null
111
- - null
112
- - null
113
- - null
114
- - null
115
- - null
116
- - null
117
- - null
118
- - null
119
- - null
120
- - null
121
- - null
122
- - null
123
- - null
124
- - null
125
- - null
126
- - null
127
- - null
128
- - null
129
- - null
130
- - null
131
- - null
132
- - null
133
- - null
134
  buckets:
135
  - !!python/tuple
136
  - 8
@@ -325,235 +261,43 @@ config_data: !DataConfig
325
  - 512
326
  - 512
327
  - !!python/tuple
328
- - 520
329
- - 520
330
- - !!python/tuple
331
- - 528
332
- - 528
333
- - !!python/tuple
334
- - 536
335
- - 536
336
- - !!python/tuple
337
- - 544
338
- - 544
339
- - !!python/tuple
340
- - 552
341
- - 552
342
- - !!python/tuple
343
- - 560
344
- - 560
345
- - !!python/tuple
346
- - 568
347
- - 568
348
- - !!python/tuple
349
- - 576
350
- - 576
351
- - !!python/tuple
352
- - 584
353
- - 584
354
- - !!python/tuple
355
- - 592
356
- - 592
357
- - !!python/tuple
358
- - 600
359
- - 600
360
- - !!python/tuple
361
- - 608
362
- - 608
363
- - !!python/tuple
364
- - 616
365
- - 616
366
- - !!python/tuple
367
- - 624
368
- - 624
369
- - !!python/tuple
370
- - 632
371
- - 632
372
- - !!python/tuple
373
- - 640
374
- - 640
375
- - !!python/tuple
376
- - 648
377
- - 648
378
- - !!python/tuple
379
- - 656
380
- - 656
381
- - !!python/tuple
382
- - 664
383
- - 664
384
- - !!python/tuple
385
- - 672
386
- - 672
387
- - !!python/tuple
388
- - 680
389
- - 680
390
- - !!python/tuple
391
- - 688
392
- - 688
393
- - !!python/tuple
394
- - 696
395
- - 696
396
- - !!python/tuple
397
- - 704
398
- - 704
399
- - !!python/tuple
400
- - 712
401
- - 712
402
- - !!python/tuple
403
- - 720
404
- - 720
405
- - !!python/tuple
406
- - 728
407
- - 728
408
- - !!python/tuple
409
- - 736
410
- - 736
411
- - !!python/tuple
412
- - 744
413
- - 744
414
- - !!python/tuple
415
- - 752
416
- - 752
417
- - !!python/tuple
418
- - 760
419
- - 760
420
- - !!python/tuple
421
- - 768
422
- - 768
423
- - !!python/tuple
424
- - 776
425
- - 776
426
- - !!python/tuple
427
- - 784
428
- - 784
429
- - !!python/tuple
430
- - 792
431
- - 792
432
- - !!python/tuple
433
- - 800
434
- - 800
435
- - !!python/tuple
436
- - 808
437
- - 808
438
- - !!python/tuple
439
- - 816
440
- - 816
441
- - !!python/tuple
442
- - 824
443
- - 824
444
- - !!python/tuple
445
- - 832
446
- - 832
447
- - !!python/tuple
448
- - 840
449
- - 840
450
- - !!python/tuple
451
- - 848
452
- - 848
453
- - !!python/tuple
454
- - 856
455
- - 856
456
- - !!python/tuple
457
- - 864
458
- - 864
459
- - !!python/tuple
460
- - 872
461
- - 872
462
- - !!python/tuple
463
- - 880
464
- - 880
465
- - !!python/tuple
466
- - 888
467
- - 888
468
- - !!python/tuple
469
- - 896
470
- - 896
471
- - !!python/tuple
472
- - 904
473
- - 904
474
- - !!python/tuple
475
- - 912
476
- - 912
477
- - !!python/tuple
478
- - 920
479
- - 920
480
- - !!python/tuple
481
- - 928
482
- - 928
483
- - !!python/tuple
484
- - 936
485
- - 936
486
- - !!python/tuple
487
- - 944
488
- - 944
489
- - !!python/tuple
490
- - 952
491
- - 952
492
- - !!python/tuple
493
- - 960
494
- - 960
495
- - !!python/tuple
496
- - 968
497
- - 968
498
- - !!python/tuple
499
- - 976
500
- - 976
501
- - !!python/tuple
502
- - 984
503
- - 984
504
- - !!python/tuple
505
- - 992
506
- - 992
507
- - !!python/tuple
508
- - 1000
509
- - 1000
510
- - !!python/tuple
511
- - 1008
512
- - 1008
513
- - !!python/tuple
514
- - 1016
515
- - 1016
516
- - !!python/tuple
517
- - 1024
518
- - 1024
519
- - !!python/tuple
520
- - 1025
521
- - 1025
522
- length_ratio_mean: 1.474495632217424
523
  length_ratio_stats_per_bucket:
524
  - !!python/tuple
525
- - 1.171734791437263
526
- - 0.32090434080799957
527
  - !!python/tuple
528
- - 1.7775684905617388
529
- - 0.6755588117515812
530
  - !!python/tuple
531
- - 2.6955079688959103
532
- - 1.0817522224393123
533
  - !!python/tuple
534
- - 3.2268563970102235
535
- - 1.8158811093408354
536
  - !!python/tuple
537
- - 3.500774012901702
538
- - 2.6322306923249954
539
  - !!python/tuple
540
- - 3.644524011869326
541
- - 2.535690409212411
542
  - !!python/tuple
543
- - 3.9292123470643947
544
- - 2.929607461215888
545
  - !!python/tuple
546
- - 3.615506743731907
547
- - 2.7129084144914977
548
  - !!python/tuple
549
- - 3.6799270986509405
550
- - 2.7267508355326386
551
  - !!python/tuple
552
- - 3.8125038570611314
553
- - 2.930899091057965
554
  - !!python/tuple
555
- - 3.535487200424593
556
- - 2.256728773617209
557
  - !!python/tuple
558
  - 0.19909941868381043
559
  - 0.2555613448334357
@@ -628,87 +372,23 @@ config_data: !DataConfig
628
  - *id001
629
  - *id001
630
  - *id001
631
- - *id001
632
- - *id001
633
- - *id001
634
- - *id001
635
- - *id001
636
- - *id001
637
- - *id001
638
- - *id001
639
- - *id001
640
- - *id001
641
- - *id001
642
- - *id001
643
- - *id001
644
- - *id001
645
- - *id001
646
- - *id001
647
- - *id001
648
- - *id001
649
- - *id001
650
- - *id001
651
- - *id001
652
- - *id001
653
- - *id001
654
- - *id001
655
- - *id001
656
- - *id001
657
- - *id001
658
- - *id001
659
- - *id001
660
- - *id001
661
- - *id001
662
- - *id001
663
- - *id001
664
- - *id001
665
- - *id001
666
- - *id001
667
- - *id001
668
- - *id001
669
- - *id001
670
- - *id001
671
- - *id001
672
- - *id001
673
- - *id001
674
- - *id001
675
- - *id001
676
- - *id001
677
- - *id001
678
- - *id001
679
- - *id001
680
- - *id001
681
- - *id001
682
- - *id001
683
- - *id001
684
- - *id001
685
- - *id001
686
- - *id001
687
- - *id001
688
- - *id001
689
- - *id001
690
- - *id001
691
- - *id001
692
- - *id001
693
- - *id001
694
- - *id001
695
- length_ratio_std: 0.8564867301273484
696
  max_observed_len_source: 299
697
  max_observed_len_target: 87
698
  num_discarded: 0
699
- num_sents: 1802816
700
  num_sents_per_bucket:
701
- - 1163076
702
- - 525949
703
- - 52153
704
- - 13870
705
- - 7555
706
- - 5533
707
- - 6197
708
- - 7446
709
- - 8323
710
- - 7618
711
- - 4982
712
  - 42
713
  - 17
714
  - 17
@@ -763,79 +443,15 @@ config_data: !DataConfig
763
  - 0
764
  - 0
765
  - 0
766
- - 0
767
- - 0
768
- - 0
769
- - 0
770
- - 0
771
- - 0
772
- - 0
773
- - 0
774
- - 0
775
- - 0
776
- - 0
777
- - 0
778
- - 0
779
- - 0
780
- - 0
781
- - 0
782
- - 0
783
- - 0
784
- - 0
785
- - 0
786
- - 0
787
- - 0
788
- - 0
789
- - 0
790
- - 0
791
- - 0
792
- - 0
793
- - 0
794
- - 0
795
- - 0
796
- - 0
797
- - 0
798
- - 0
799
- - 0
800
- - 0
801
- - 0
802
- - 0
803
- - 0
804
- - 0
805
- - 0
806
- - 0
807
- - 0
808
- - 0
809
- - 0
810
- - 0
811
- - 0
812
- - 0
813
- - 0
814
- - 0
815
- - 0
816
- - 0
817
- - 0
818
- - 0
819
- - 0
820
- - 0
821
- - 0
822
- - 0
823
- - 0
824
- - 0
825
- - 0
826
- - 0
827
- - 0
828
- - 0
829
- - 0
830
- num_tokens_source: 11289426
831
- num_tokens_target: 16613258
832
  num_unks_source: 0
833
  num_unks_target: 0
834
  size_vocab_source: 46256
835
  size_vocab_target: 656
836
  eop_id: -1
837
- max_seq_len_source: 1025
838
- max_seq_len_target: 1025
839
  num_source_factors: 1
840
  num_target_factors: 5
841
  config_decoder: !TransformerConfig
@@ -844,12 +460,12 @@ config_decoder: !TransformerConfig
844
  block_prepended_cross_attention: false
845
  decoder_type: transformer
846
  depth_key_value: 512
847
- dropout_act: 0.1
848
- dropout_attention: 0.1
849
- dropout_prepost: 0.1
850
  feed_forward_num_hidden: 2048
851
- max_seq_len_source: 1025
852
- max_seq_len_target: 1025
853
  model_size: 512
854
  num_layers: 6
855
  positional_embedding_type: fixed
@@ -859,14 +475,14 @@ config_decoder: !TransformerConfig
859
  use_lhuc: false
860
  config_embed_source: !EmbeddingConfig
861
  allow_sparse_grad: false
862
- dropout: 0.0
863
  factor_configs: null
864
  num_embed: 512
865
  num_factors: 1
866
  vocab_size: 46256
867
  config_embed_target: !EmbeddingConfig
868
  allow_sparse_grad: false
869
- dropout: 0.0
870
  factor_configs:
871
  - !FactorConfig
872
  combine: sum
@@ -882,7 +498,7 @@ config_embed_target: !EmbeddingConfig
882
  combine: sum
883
  num_embed: 512
884
  share_embedding: false
885
- vocab_size: 432
886
  - !FactorConfig
887
  combine: sum
888
  num_embed: 512
@@ -897,12 +513,12 @@ config_encoder: !TransformerConfig
897
  block_prepended_cross_attention: false
898
  decoder_type: transformer
899
  depth_key_value: 512
900
- dropout_act: 0.1
901
- dropout_attention: 0.1
902
- dropout_prepost: 0.1
903
  feed_forward_num_hidden: 2048
904
- max_seq_len_source: 1025
905
- max_seq_len_target: 1025
906
  model_size: 512
907
  num_layers: 6
908
  positional_embedding_type: fixed
@@ -917,4 +533,4 @@ neural_vocab_selection: null
917
  neural_vocab_selection_block_loss: false
918
  vocab_source_size: 46256
919
  vocab_target_size: 656
920
- weight_tying_type: none
 
2
  config_data: !DataConfig
3
  data_statistics: !DataStatistics
4
  average_len_target_per_bucket:
5
+ - 6.043404555083469
6
+ - 10.519883768009015
7
+ - 18.59887856456265
8
+ - 26.278671761476776
9
+ - 33.190033876079
10
+ - 41.83887781695534
11
+ - 51.24769950218732
12
+ - 59.783405313440575
13
+ - 68.16214942257864
14
+ - 75.68928386092358
15
+ - 82.77250900360164
16
  - 18.47619047619048
17
  - 8.058823529411766
18
  - 5.647058823529413
 
67
  - null
68
  - null
69
  - null
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
70
  buckets:
71
  - !!python/tuple
72
  - 8
 
261
  - 512
262
  - 512
263
  - !!python/tuple
264
+ - 513
265
+ - 513
266
+ length_ratio_mean: 1.488763422684226
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
267
  length_ratio_stats_per_bucket:
268
  - !!python/tuple
269
+ - 1.172606268110977
270
+ - 0.3198943487302755
271
  - !!python/tuple
272
+ - 1.7758876999918463
273
+ - 0.6634649712813119
274
  - !!python/tuple
275
+ - 2.667916151313991
276
+ - 1.011426597835219
277
  - !!python/tuple
278
+ - 3.173004208160318
279
+ - 1.618051536035044
280
  - !!python/tuple
281
+ - 3.3799284759654693
282
+ - 2.4421821481902017
283
  - !!python/tuple
284
+ - 3.5445340678088186
285
+ - 2.377062423666999
286
  - !!python/tuple
287
+ - 3.870005889139779
288
+ - 2.8520973384152954
289
  - !!python/tuple
290
+ - 3.6032825677516436
291
+ - 2.6820622916732426
292
  - !!python/tuple
293
+ - 3.672787931128752
294
+ - 2.7023842818124146
295
  - !!python/tuple
296
+ - 3.807871945448423
297
+ - 2.9154974163883414
298
  - !!python/tuple
299
+ - 3.5339756014008112
300
+ - 2.253656007685683
301
  - !!python/tuple
302
  - 0.19909941868381043
303
  - 0.2555613448334357
 
372
  - *id001
373
  - *id001
374
  - *id001
375
+ length_ratio_std: 0.8554135166970332
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
376
  max_observed_len_source: 299
377
  max_observed_len_target: 87
378
  num_discarded: 0
379
+ num_sents: 1874353
380
  num_sents_per_bucket:
381
+ - 1183908
382
+ - 558194
383
+ - 62420
384
+ - 18581
385
+ - 9151
386
+ - 6523
387
+ - 6629
388
+ - 7641
389
+ - 8486
390
+ - 7708
391
+ - 4998
392
  - 42
393
  - 17
394
  - 17
 
443
  - 0
444
  - 0
445
  - 0
446
+ num_tokens_source: 11815202
447
+ num_tokens_target: 17626167
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
448
  num_unks_source: 0
449
  num_unks_target: 0
450
  size_vocab_source: 46256
451
  size_vocab_target: 656
452
  eop_id: -1
453
+ max_seq_len_source: 513
454
+ max_seq_len_target: 513
455
  num_source_factors: 1
456
  num_target_factors: 5
457
  config_decoder: !TransformerConfig
 
460
  block_prepended_cross_attention: false
461
  decoder_type: transformer
462
  depth_key_value: 512
463
+ dropout_act: 0.2
464
+ dropout_attention: 0.2
465
+ dropout_prepost: 0.2
466
  feed_forward_num_hidden: 2048
467
+ max_seq_len_source: 513
468
+ max_seq_len_target: 513
469
  model_size: 512
470
  num_layers: 6
471
  positional_embedding_type: fixed
 
475
  use_lhuc: false
476
  config_embed_source: !EmbeddingConfig
477
  allow_sparse_grad: false
478
+ dropout: 0.5
479
  factor_configs: null
480
  num_embed: 512
481
  num_factors: 1
482
  vocab_size: 46256
483
  config_embed_target: !EmbeddingConfig
484
  allow_sparse_grad: false
485
+ dropout: 0.5
486
  factor_configs:
487
  - !FactorConfig
488
  combine: sum
 
498
  combine: sum
499
  num_embed: 512
500
  share_embedding: false
501
+ vocab_size: 416
502
  - !FactorConfig
503
  combine: sum
504
  num_embed: 512
 
513
  block_prepended_cross_attention: false
514
  decoder_type: transformer
515
  depth_key_value: 512
516
+ dropout_act: 0.2
517
+ dropout_attention: 0.2
518
+ dropout_prepost: 0.2
519
  feed_forward_num_hidden: 2048
520
+ max_seq_len_source: 513
521
+ max_seq_len_target: 513
522
  model_size: 512
523
  num_layers: 6
524
  positional_embedding_type: fixed
 
533
  neural_vocab_selection_block_loss: false
534
  vocab_source_size: 46256
535
  vocab_target_size: 656
536
+ weight_tying_type: trg_softmax
metrics CHANGED
The diff for this file is too large to render. See raw diff
 
params.best CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3ac93c9756112673592b1ab863938af87dcffb3b3d4c34e512359d5e8ce45ca1
3
- size 283070459
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c57f2a6fd2b40d982a122389c2fdd52c8d3bf1b2527fbd673cb75302803153fa
3
+ size 279564030
vocab.src.0.json CHANGED
The diff for this file is too large to render. See raw diff
 
vocab.trg.0.json CHANGED
@@ -5,485 +5,485 @@
5
  "</s>": 3,
6
  "M": 4,
7
  "S205": 5,
8
- "S15a": 6,
9
  "S100": 7,
10
- "S14c": 8,
11
  "S265": 9,
12
- "S15d": 10,
13
- "S203": 11,
14
  "S22a": 12,
15
  "S36d": 13,
16
  "S2ff": 14,
17
  "S35d": 15,
18
  "S266": 16,
19
- "S20e": 17,
20
- "S22b": 18,
21
  "S10e": 19,
22
  "S1f7": 20,
23
- "S300": 21,
24
- "S1dc": 22,
25
- "S1f5": 23,
26
- "S221": 24,
27
- "S2fb": 25,
28
- "S115": 26,
29
- "S206": 27,
30
- "S2f9": 28,
31
- "S185": 29,
32
- "S176": 30,
33
- "S211": 31,
34
- "S1ce": 32,
35
- "S26a": 33,
36
- "S16d": 34,
37
- "S30a": 35,
38
- "S22f": 36,
39
- "S301": 37,
40
- "S347": 38,
41
- "S34c": 39,
42
- "S192": 40,
43
- "S288": 41,
44
- "S144": 42,
45
- "S378": 43,
46
- "S377": 44,
47
- "S33b": 45,
48
- "S2ea": 46,
49
- "S388": 47,
50
- "S19a": 48,
51
- "S1ea": 49,
52
- "S350": 50,
53
- "S11e": 51,
54
- "S2a2": 52,
55
- "S2df": 53,
56
- "S14a": 54,
57
- "S361": 55,
58
- "S2b7": 56,
59
- "S225": 57,
60
- "S348": 58,
61
- "S150": 59,
62
- "S387": 60,
63
- "S344": 61,
64
- "S271": 62,
65
- "S11a": 63,
66
- "S147": 64,
67
- "S321": 65,
68
- "S365": 66,
69
- "S180": 67,
70
- "S2d6": 68,
71
- "S101": 69,
72
- "S10a": 70,
73
- "S30c": 71,
74
- "S289": 72,
75
- "S346": 73,
76
- "S26c": 74,
77
- "S2f7": 75,
78
- "S119": 76,
79
- "S1f0": 77,
80
- "S35c": 78,
81
- "S140": 79,
82
- "S314": 80,
83
- "S106": 81,
84
  "S1ed": 82,
85
- "S182": 83,
86
- "S216": 84,
87
- "S33e": 85,
88
- "S22e": 86,
89
- "S1c5": 87,
90
- "S153": 88,
91
- "S2fc": 89,
92
- "L": 90,
93
- "S236": 91,
94
- "S2e7": 92,
95
- "S21b": 93,
96
- "S379": 94,
97
- "S222": 95,
98
- "S214": 96,
99
- "S345": 97,
100
- "S177": 98,
101
- "S18d": 99,
102
- "S1d4": 100,
103
- "S181": 101,
104
- "S2e5": 102,
105
- "S187": 103,
106
- "S2c6": 104,
107
- "S231": 105,
108
- "S118": 106,
109
- "S110": 107,
110
  "S1f4": 108,
111
- "S269": 109,
112
  "S20b": 110,
113
  "S142": 111,
114
- "S208": 112,
115
- "S2eb": 113,
116
- "S230": 114,
117
- "S2e2": 115,
118
  "S267": 116,
119
  "S30e": 117,
120
- "S324": 118,
121
- "S30d": 119,
122
- "S2c3": 120,
123
- "S207": 121,
124
- "S157": 122,
125
- "S376": 123,
126
- "R": 124,
127
- "S14e": 125,
128
- "S28a": 126,
129
- "S331": 127,
130
- "S154": 128,
131
- "S315": 129,
132
- "S17d": 130,
133
- "S340": 131,
134
- "S1bb": 132,
135
- "S36a": 133,
136
- "S1eb": 134,
137
- "S37a": 135,
138
- "S303": 136,
139
- "S30f": 137,
140
- "S218": 138,
141
- "S22c": 139,
142
- "S255": 140,
143
- "S2d5": 141,
144
- "S186": 142,
145
- "S2f8": 143,
146
- "S31a": 144,
147
- "S26b": 145,
148
- "S2fd": 146,
149
- "S1fb": 147,
150
- "S1ec": 148,
151
- "S2e3": 149,
152
- "S152": 150,
153
- "S16c": 151,
154
- "S10b": 152,
155
- "S37b": 153,
156
- "S1f8": 154,
157
- "S20f": 155,
158
- "S226": 156,
159
- "S1d2": 157,
160
- "S2d2": 158,
161
- "S32a": 159,
162
- "S1de": 160,
163
- "S316": 161,
164
- "S34d": 162,
165
- "S21d": 163,
166
- "S1a0": 164,
167
- "S358": 165,
168
- "S34a": 166,
169
- "S2e1": 167,
170
- "S330": 168,
171
- "S389": 169,
172
- "S36e": 170,
173
- "S272": 171,
174
- "S1a5": 172,
175
- "S1e1": 173,
176
- "S309": 174,
177
- "S12d": 175,
178
- "S2f0": 176,
179
- "S26f": 177,
180
- "S2a5": 178,
181
- "S335": 179,
182
- "S16f": 180,
183
- "S37d": 181,
184
- "S20a": 182,
185
- "S2e8": 183,
186
- "S2a4": 184,
187
- "S332": 185,
188
- "S2ef": 186,
189
- "S341": 187,
190
- "S2e0": 188,
191
- "S1d3": 189,
192
- "S219": 190,
193
- "S37c": 191,
194
- "S245": 192,
195
- "S234": 193,
196
- "S1f2": 194,
197
- "S1ee": 195,
198
- "S319": 196,
199
- "S2b8": 197,
200
- "S28b": 198,
201
- "S30b": 199,
202
- "S171": 200,
203
- "S18c": 201,
204
- "S310": 202,
205
- "S2d7": 203,
206
- "S23b": 204,
207
- "S1f1": 205,
208
- "S2a6": 206,
209
- "S17e": 207,
210
- "S33f": 208,
211
- "S21c": 209,
212
- "S256": 210,
213
- "S10c": 211,
214
- "S1ef": 212,
215
- "S2e6": 213,
216
- "S2a3": 214,
217
- "S299": 215,
218
- "S17f": 216,
219
- "S1d1": 217,
220
- "S342": 218,
221
- "S13f": 219,
222
- "S160": 220,
223
- "S210": 221,
224
- "S357": 222,
225
- "S18e": 223,
226
- "S281": 224,
227
- "S237": 225,
228
- "S343": 226,
229
- "S20c": 227,
230
- "S227": 228,
231
- "S228": 229,
232
- "S36b": 230,
233
- "S238": 231,
234
- "S155": 232,
235
- "S371": 233,
236
- "S2c5": 234,
237
- "S175": 235,
238
- "S26d": 236,
239
- "S36f": 237,
240
- "S251": 238,
241
- "S292": 239,
242
- "S248": 240,
243
- "S128": 241,
244
- "S217": 242,
245
- "S349": 243,
246
- "S2d8": 244,
247
- "S2c7": 245,
248
- "S2c4": 246,
249
  "S158": 247,
250
- "S1da": 248,
251
- "S307": 249,
252
- "S23c": 250,
253
- "S293": 251,
254
- "S17c": 252,
255
- "S353": 253,
256
- "S16e": 254,
257
- "S268": 255,
258
  "S287": 256,
259
- "S2ad": 257,
260
- "S2e9": 258,
261
- "S294": 259,
262
- "S24e": 260,
263
- "S2b9": 261,
264
- "S2ed": 262,
265
- "S259": 263,
266
- "S31e": 264,
267
- "S368": 265,
268
- "S1fa": 266,
269
- "S28c": 267,
270
- "S239": 268,
271
- "S31b": 269,
272
- "S19c": 270,
273
- "S333": 271,
274
  "S212": 272,
275
- "S32b": 273,
276
- "S198": 274,
277
- "S213": 275,
278
- "S29a": 276,
279
- "S33d": 277,
280
- "S356": 278,
281
- "S34f": 279,
282
- "S215": 280,
283
- "S23d": 281,
284
- "S233": 282,
285
- "S2ec": 283,
286
- "S1d0": 284,
287
- "S173": 285,
288
- "S22d": 286,
289
- "S1c1": 287,
290
- "S35a": 288,
291
- "S2dc": 289,
292
- "S178": 290,
293
- "S2dd": 291,
294
- "S2fa": 292,
295
- "S2e4": 293,
296
- "S370": 294,
297
- "S232": 295,
298
- "S129": 296,
299
- "S167": 297,
300
- "S21e": 298,
301
- "S1cf": 299,
302
- "S38a": 300,
303
- "S201": 301,
304
- "S13d": 302,
305
- "S1e4": 303,
306
- "S145": 304,
307
- "S14b": 305,
308
- "S235": 306,
309
- "S33c": 307,
310
- "S156": 308,
311
- "S17b": 309,
312
- "S229": 310,
313
- "S249": 311,
314
- "S284": 312,
315
- "S27a": 313,
316
- "S1f9": 314,
317
- "S2da": 315,
318
- "S1e8": 316,
319
- "S23f": 317,
320
- "S363": 318,
321
- "S2d9": 319,
322
- "S24b": 320,
323
- "S32c": 321,
324
- "S1c3": 322,
325
- "S273": 323,
326
- "S295": 324,
327
- "S151": 325,
328
- "S29f": 326,
329
- "S2bd": 327,
330
- "S35b": 328,
331
- "S179": 329,
332
- "S244": 330,
333
- "S270": 331,
334
- "S1df": 332,
335
- "S336": 333,
336
- "S2be": 334,
337
- "S351": 335,
338
- "S34e": 336,
339
- "S2d3": 337,
340
- "S296": 338,
341
- "S174": 339,
342
- "S23a": 340,
343
- "S116": 341,
344
- "S15f": 342,
345
- "S305": 343,
346
- "S1d5": 344,
347
- "S2ee": 345,
348
- "S122": 346,
349
- "S337": 347,
350
- "S35f": 348,
351
- "S1d8": 349,
352
- "S121": 350,
353
- "S1cd": 351,
354
- "S298": 352,
355
- "S25a": 353,
356
- "S14f": 354,
357
- "S243": 355,
358
- "S369": 356,
359
- "S132": 357,
360
- "S105": 358,
361
- "S1ca": 359,
362
- "S241": 360,
363
- "S1e0": 361,
364
- "S172": 362,
365
- "S37e": 363,
366
- "S313": 364,
367
- "S2c1": 365,
368
- "S141": 366,
369
- "S257": 367,
370
- "S14d": 368,
371
- "S28d": 369,
372
- "S112": 370,
373
- "S19d": 371,
374
- "S240": 372,
375
- "S339": 373,
376
- "S311": 374,
377
- "S29b": 375,
378
- "S21a": 376,
379
- "S21f": 377,
380
- "S18b": 378,
381
- "S359": 379,
382
- "S1e2": 380,
383
- "S15b": 381,
384
- "S28e": 382,
385
- "S10f": 383,
386
- "S1c6": 384,
387
- "S276": 385,
388
- "S2bb": 386,
389
- "S133": 387,
390
- "S127": 388,
391
- "S2f1": 389,
392
- "S27e": 390,
393
- "S15c": 391,
394
- "S2db": 392,
395
- "S283": 393,
396
- "S277": 394,
397
- "S224": 395,
398
- "S25e": 396,
399
- "S374": 397,
400
- "S297": 398,
401
- "S290": 399,
402
- "S386": 400,
403
- "S1e6": 401,
404
- "S220": 402,
405
- "S166": 403,
406
- "S24d": 404,
407
- "S209": 405,
408
- "S17a": 406,
409
- "S170": 407,
410
- "S275": 408,
411
- "S2d4": 409,
412
- "S362": 410,
413
- "S28f": 411,
414
- "S253": 412,
415
- "S204": 413,
416
- "S12b": 414,
417
- "S302": 415,
418
- "S304": 416,
419
- "S109": 417,
420
- "S2a0": 418,
421
- "S367": 419,
422
- "S1c0": 420,
423
- "S1ba": 421,
424
- "S25d": 422,
425
- "S246": 423,
426
- "S1a3": 424,
427
- "S20d": 425,
428
- "S1fd": 426,
429
- "S11d": 427,
430
- "S2ba": 428,
431
- "S2bf": 429,
432
- "S1e5": 430,
433
- "S1a7": 431,
434
- "S124": 432,
435
- "S1fc": 433,
436
- "S312": 434,
437
- "S274": 435,
438
- "S27b": 436,
439
- "S1bc": 437,
440
- "S24a": 438,
441
- "S38b": 439,
442
- "S113": 440,
443
- "S242": 441,
444
- "S291": 442,
445
- "S29c": 443,
446
- "S33a": 444,
447
- "S262": 445,
448
- "S194": 446,
449
- "S1a8": 447,
450
- "S223": 448,
451
- "S35e": 449,
452
- "S146": 450,
453
- "S375": 451,
454
- "S1f6": 452,
455
- "S2a1": 453,
456
- "S34b": 454,
457
- "S1e7": 455,
458
- "S250": 456,
459
- "S1d9": 457,
460
- "S10d": 458,
461
- "S1a1": 459,
462
- "S138": 460,
463
- "S2de": 461,
464
- "S308": 462,
465
- "S2f5": 463,
466
- "S282": 464,
467
- "S103": 465,
468
  "S15e": 466,
469
- "S1ff": 467,
470
- "S354": 468,
471
- "S31f": 469,
472
  "S2f4": 470,
473
- "S36c": 471,
474
- "S183": 472,
475
- "S360": 473,
476
- "S12a": 474,
477
- "S352": 475,
478
- "S279": 476,
479
- "S338": 477,
480
- "S31c": 478,
481
- "S328": 479,
482
- "S2c8": 480,
483
- "S1c2": 481,
484
- "S2c2": 482,
485
- "S1d6": 483,
486
- "S1e3": 484,
487
  "S25b": 485,
488
  "S364": 486,
489
  "S134": 487,
@@ -498,8 +498,8 @@
498
  "S327": 496,
499
  "S384": 497,
500
  "S1c9": 498,
501
- "S11b": 499,
502
- "S26e": 500,
503
  "S2f2": 501,
504
  "S323": 502,
505
  "S1a6": 503,
@@ -510,33 +510,33 @@
510
  "S286": 508,
511
  "S254": 509,
512
  "S372": 510,
513
- "S2aa": 511,
514
- "S168": 512,
515
  "S385": 513,
516
  "S1b0": 514,
517
  "S2f6": 515,
518
  "S162": 516,
519
  "S247": 517,
520
  "S1a4": 518,
521
- "S107": 519,
522
- "S2b1": 520,
523
- "S2f3": 521,
524
- "S19b": 522,
525
- "S102": 523,
526
- "S258": 524,
527
- "S29d": 525,
528
- "S2bc": 526,
529
- "S24f": 527,
530
  "S1c4": 528,
531
  "S1ae": 529,
532
  "S135": 530,
533
- "S1b8": 531,
534
- "S2d0": 532,
535
  "S355": 533,
536
- "S1db": 534,
537
- "S169": 535,
538
- "S285": 536,
539
- "S159": 537,
540
  "S163": 538,
541
  "S11f": 539,
542
  "S329": 540,
@@ -549,12 +549,12 @@
549
  "S2a8": 547,
550
  "S190": 548,
551
  "S334": 549,
552
- "S131": 550,
553
- "S2c0": 551,
554
  "S114": 552,
555
  "S373": 553,
556
- "S12c": 554,
557
- "S1b3": 555,
558
  "S200": 556,
559
  "S2ae": 557,
560
  "S18f": 558,
@@ -563,20 +563,20 @@
563
  "S11c": 561,
564
  "S196": 562,
565
  "S202": 563,
566
- "S25f": 564,
567
- "S2a7": 565,
568
  "S326": 566,
569
  "S32e": 567,
570
  "S2cd": 568,
571
  "S1fe": 569,
572
- "S280": 570,
573
- "S1d7": 571,
574
  "S12e": 572,
575
  "S18a": 573,
576
  "S322": 574,
577
  "S2af": 575,
578
- "S1bf": 576,
579
- "S2cc": 577,
580
  "S318": 578,
581
  "S19f": 579,
582
  "S193": 580,
@@ -587,9 +587,9 @@
587
  "S13e": 585,
588
  "S1a2": 586,
589
  "S366": 587,
590
- "S117": 588,
591
- "S27d": 589,
592
- "S25c": 590,
593
  "S197": 591,
594
  "S2c9": 592,
595
  "S2ca": 593,
@@ -599,16 +599,16 @@
599
  "S2b2": 597,
600
  "S104": 598,
601
  "S2ab": 599,
602
- "S1af": 600,
603
- "S2ce": 601,
604
- "S263": 602,
605
- "S264": 603,
606
- "S1cc": 604,
607
- "S1cb": 605,
608
- "S195": 606,
609
- "S13c": 607,
610
- "S381": 608,
611
- "S1b7": 609,
612
  "S1b2": 610,
613
  "S1aa": 611,
614
  "S191": 612,
@@ -624,16 +624,16 @@
624
  "S383": 622,
625
  "S1ab": 623,
626
  "S2b5": 624,
627
- "S2a9": 625,
628
- "S1b1": 626,
629
- "S382": 627,
630
- "S2cf": 628,
631
- "S380": 629,
632
- "S125": 630,
633
- "S143": 631,
634
- "S23e": 632,
635
- "S19e": 633,
636
- "S126": 634,
637
  "S2b0": 635,
638
  "S136": 636,
639
  "S137": 637,
 
5
  "</s>": 3,
6
  "M": 4,
7
  "S205": 5,
8
+ "S14c": 6,
9
  "S100": 7,
10
+ "S15a": 8,
11
  "S265": 9,
12
+ "S203": 10,
13
+ "S15d": 11,
14
  "S22a": 12,
15
  "S36d": 13,
16
  "S2ff": 14,
17
  "S35d": 15,
18
  "S266": 16,
19
+ "S1dc": 17,
20
+ "S20e": 18,
21
  "S10e": 19,
22
  "S1f7": 20,
23
+ "S176": 21,
24
+ "S1f5": 22,
25
+ "S115": 23,
26
+ "S22b": 24,
27
+ "S300": 25,
28
+ "S2f9": 26,
29
+ "S221": 27,
30
+ "S2fb": 28,
31
+ "S206": 29,
32
+ "S1ce": 30,
33
+ "S185": 31,
34
+ "S16d": 32,
35
+ "S211": 33,
36
+ "S26a": 34,
37
+ "S144": 35,
38
+ "S192": 36,
39
+ "S22f": 37,
40
+ "S30a": 38,
41
+ "S11e": 39,
42
+ "S301": 40,
43
+ "S14a": 41,
44
+ "S347": 42,
45
+ "S34c": 43,
46
+ "S288": 44,
47
+ "S378": 45,
48
+ "S19a": 46,
49
+ "S377": 47,
50
+ "S2a2": 48,
51
+ "S33b": 49,
52
+ "S1ea": 50,
53
+ "S388": 51,
54
+ "S2ea": 52,
55
+ "S350": 53,
56
+ "S11a": 54,
57
+ "S101": 55,
58
+ "S2df": 56,
59
+ "S119": 57,
60
+ "S147": 58,
61
+ "S361": 59,
62
+ "S2b7": 60,
63
+ "S150": 61,
64
+ "S225": 62,
65
+ "S348": 63,
66
+ "S387": 64,
67
+ "S344": 65,
68
+ "S10a": 66,
69
+ "S271": 67,
70
+ "S140": 68,
71
+ "S321": 69,
72
+ "S365": 70,
73
+ "S1f0": 71,
74
+ "S180": 72,
75
+ "S2d6": 73,
76
+ "S30c": 74,
77
+ "S289": 75,
78
+ "S346": 76,
79
+ "S106": 77,
80
+ "S26c": 78,
81
+ "S2f7": 79,
82
+ "S35c": 80,
83
+ "S314": 81,
84
  "S1ed": 82,
85
+ "S187": 83,
86
+ "S18d": 84,
87
+ "S216": 85,
88
+ "S182": 86,
89
+ "S33e": 87,
90
+ "S22e": 88,
91
+ "S1c5": 89,
92
+ "S153": 90,
93
+ "S2fc": 91,
94
+ "S222": 92,
95
+ "L": 93,
96
+ "S2e7": 94,
97
+ "S236": 95,
98
+ "S21b": 96,
99
+ "S379": 97,
100
+ "S214": 98,
101
+ "S345": 99,
102
+ "S177": 100,
103
+ "S1d4": 101,
104
+ "S181": 102,
105
+ "S110": 103,
106
+ "S2e5": 104,
107
+ "S2c6": 105,
108
+ "S231": 106,
109
+ "S118": 107,
110
  "S1f4": 108,
111
+ "S208": 109,
112
  "S20b": 110,
113
  "S142": 111,
114
+ "S269": 112,
115
+ "S2e2": 113,
116
+ "S2eb": 114,
117
+ "S230": 115,
118
  "S267": 116,
119
  "S30e": 117,
120
+ "S2c3": 118,
121
+ "S324": 119,
122
+ "S207": 120,
123
+ "S30d": 121,
124
+ "S186": 122,
125
+ "S1bb": 123,
126
+ "S157": 124,
127
+ "S1eb": 125,
128
+ "S14e": 126,
129
+ "S376": 127,
130
+ "R": 128,
131
+ "S28a": 129,
132
+ "S331": 130,
133
+ "S154": 131,
134
+ "S17d": 132,
135
+ "S315": 133,
136
+ "S340": 134,
137
+ "S36a": 135,
138
+ "S1ec": 136,
139
+ "S37a": 137,
140
+ "S1fb": 138,
141
+ "S303": 139,
142
+ "S30f": 140,
143
+ "S218": 141,
144
+ "S22c": 142,
145
+ "S255": 143,
146
+ "S1de": 144,
147
+ "S2d5": 145,
148
+ "S2e3": 146,
149
+ "S2f8": 147,
150
+ "S2fd": 148,
151
+ "S31a": 149,
152
+ "S26b": 150,
153
+ "S1f8": 151,
154
+ "S1d2": 152,
155
+ "S152": 153,
156
+ "S16c": 154,
157
+ "S10b": 155,
158
+ "S37b": 156,
159
+ "S226": 157,
160
+ "S20f": 158,
161
+ "S1a5": 159,
162
+ "S1a0": 160,
163
+ "S1f2": 161,
164
+ "S2d2": 162,
165
+ "S32a": 163,
166
+ "S316": 164,
167
+ "S34d": 165,
168
+ "S21d": 166,
169
+ "S358": 167,
170
+ "S18e": 168,
171
+ "S2e1": 169,
172
+ "S34a": 170,
173
+ "S1d3": 171,
174
+ "S245": 172,
175
+ "S330": 173,
176
+ "S389": 174,
177
+ "S36e": 175,
178
+ "S272": 176,
179
+ "S12d": 177,
180
+ "S1e1": 178,
181
+ "S309": 179,
182
+ "S20a": 180,
183
+ "S2f0": 181,
184
+ "S2a5": 182,
185
+ "S26f": 183,
186
+ "S18c": 184,
187
+ "S335": 185,
188
+ "S16f": 186,
189
+ "S37d": 187,
190
+ "S2e8": 188,
191
+ "S2a4": 189,
192
+ "S332": 190,
193
+ "S2ef": 191,
194
+ "S2e0": 192,
195
+ "S219": 193,
196
+ "S341": 194,
197
+ "S37c": 195,
198
+ "S234": 196,
199
+ "S1ee": 197,
200
+ "S1da": 198,
201
+ "S2b8": 199,
202
+ "S319": 200,
203
+ "S21c": 201,
204
+ "S28b": 202,
205
+ "S1f1": 203,
206
+ "S175": 204,
207
+ "S13f": 205,
208
+ "S171": 206,
209
+ "S30b": 207,
210
+ "S2d7": 208,
211
+ "S310": 209,
212
+ "S23b": 210,
213
+ "S17e": 211,
214
+ "S2a6": 212,
215
+ "S256": 213,
216
+ "S33f": 214,
217
+ "S1ef": 215,
218
+ "S10c": 216,
219
+ "S2e6": 217,
220
+ "S299": 218,
221
+ "S2a3": 219,
222
+ "S17f": 220,
223
+ "S1d1": 221,
224
+ "S238": 222,
225
+ "S342": 223,
226
+ "S160": 224,
227
+ "S210": 225,
228
+ "S357": 226,
229
+ "S198": 227,
230
+ "S281": 228,
231
+ "S237": 229,
232
+ "S343": 230,
233
+ "S227": 231,
234
+ "S20c": 232,
235
+ "S228": 233,
236
+ "S36b": 234,
237
+ "S155": 235,
238
+ "S371": 236,
239
+ "S2c5": 237,
240
+ "S26d": 238,
241
+ "S201": 239,
242
+ "S36f": 240,
243
+ "S251": 241,
244
+ "S292": 242,
245
+ "S248": 243,
246
+ "S128": 244,
247
+ "S217": 245,
248
+ "S2d8": 246,
249
  "S158": 247,
250
+ "S349": 248,
251
+ "S2c7": 249,
252
+ "S2c4": 250,
253
+ "S23c": 251,
254
+ "S293": 252,
255
+ "S307": 253,
256
+ "S167": 254,
257
+ "S17c": 255,
258
  "S287": 256,
259
+ "S268": 257,
260
+ "S353": 258,
261
+ "S16e": 259,
262
+ "S2ad": 260,
263
+ "S2e9": 261,
264
+ "S24e": 262,
265
+ "S294": 263,
266
+ "S2b9": 264,
267
+ "S2ed": 265,
268
+ "S259": 266,
269
+ "S31e": 267,
270
+ "S368": 268,
271
+ "S28c": 269,
272
+ "S1fa": 270,
273
+ "S239": 271,
274
  "S212": 272,
275
+ "S31b": 273,
276
+ "S19c": 274,
277
+ "S333": 275,
278
+ "S32b": 276,
279
+ "S1cf": 277,
280
+ "S213": 278,
281
+ "S29a": 279,
282
+ "S33d": 280,
283
+ "S34f": 281,
284
+ "S356": 282,
285
+ "S23d": 283,
286
+ "S215": 284,
287
+ "S2ec": 285,
288
+ "S233": 286,
289
+ "S1d0": 287,
290
+ "S173": 288,
291
+ "S22d": 289,
292
+ "S15f": 290,
293
+ "S1c1": 291,
294
+ "S35a": 292,
295
+ "S2dc": 293,
296
+ "S178": 294,
297
+ "S2dd": 295,
298
+ "S2fa": 296,
299
+ "S232": 297,
300
+ "S1d5": 298,
301
+ "S1ca": 299,
302
+ "S141": 300,
303
+ "S2e4": 301,
304
+ "S129": 302,
305
+ "S370": 303,
306
+ "S21e": 304,
307
+ "S1d8": 305,
308
+ "S105": 306,
309
+ "S1cd": 307,
310
+ "S38a": 308,
311
+ "S13d": 309,
312
+ "S1e4": 310,
313
+ "S145": 311,
314
+ "S14b": 312,
315
+ "S235": 313,
316
+ "S156": 314,
317
+ "S284": 315,
318
+ "S33c": 316,
319
+ "S116": 317,
320
+ "S17b": 318,
321
+ "S229": 319,
322
+ "S249": 320,
323
+ "S27a": 321,
324
+ "S1f9": 322,
325
+ "S2da": 323,
326
+ "S23f": 324,
327
+ "S1e8": 325,
328
+ "S24b": 326,
329
+ "S2d9": 327,
330
+ "S363": 328,
331
+ "S32c": 329,
332
+ "S1c3": 330,
333
+ "S273": 331,
334
+ "S295": 332,
335
+ "S2f1": 333,
336
+ "S29f": 334,
337
+ "S151": 335,
338
+ "S2bd": 336,
339
+ "S1c6": 337,
340
+ "S35b": 338,
341
+ "S179": 339,
342
+ "S1e0": 340,
343
+ "S1df": 341,
344
+ "S244": 342,
345
+ "S270": 343,
346
+ "S336": 344,
347
+ "S2be": 345,
348
+ "S351": 346,
349
+ "S2d3": 347,
350
+ "S34e": 348,
351
+ "S174": 349,
352
+ "S296": 350,
353
+ "S23a": 351,
354
+ "S305": 352,
355
+ "S2ee": 353,
356
+ "S122": 354,
357
+ "S337": 355,
358
+ "S35f": 356,
359
+ "S121": 357,
360
+ "S298": 358,
361
+ "S25a": 359,
362
+ "S14f": 360,
363
+ "S243": 361,
364
+ "S369": 362,
365
+ "S132": 363,
366
+ "S241": 364,
367
+ "S1fd": 365,
368
+ "S172": 366,
369
+ "S37e": 367,
370
+ "S10f": 368,
371
+ "S2c1": 369,
372
+ "S257": 370,
373
+ "S313": 371,
374
+ "S14d": 372,
375
+ "S28d": 373,
376
+ "S112": 374,
377
+ "S19d": 375,
378
+ "S240": 376,
379
+ "S339": 377,
380
+ "S29b": 378,
381
+ "S311": 379,
382
+ "S11d": 380,
383
+ "S21a": 381,
384
+ "S21f": 382,
385
+ "S1fc": 383,
386
+ "S18b": 384,
387
+ "S15b": 385,
388
+ "S28e": 386,
389
+ "S359": 387,
390
+ "S1e2": 388,
391
+ "S2bb": 389,
392
+ "S276": 390,
393
+ "S127": 391,
394
+ "S133": 392,
395
+ "S27e": 393,
396
+ "S15c": 394,
397
+ "S2db": 395,
398
+ "S283": 396,
399
+ "S277": 397,
400
+ "S224": 398,
401
+ "S25e": 399,
402
+ "S374": 400,
403
+ "S290": 401,
404
+ "S297": 402,
405
+ "S1e6": 403,
406
+ "S386": 404,
407
+ "S220": 405,
408
+ "S166": 406,
409
+ "S24d": 407,
410
+ "S209": 408,
411
+ "S275": 409,
412
+ "S17a": 410,
413
+ "S170": 411,
414
+ "S2d4": 412,
415
+ "S362": 413,
416
+ "S1e5": 414,
417
+ "S28f": 415,
418
+ "S253": 416,
419
+ "S12b": 417,
420
+ "S204": 418,
421
+ "S302": 419,
422
+ "S2a0": 420,
423
+ "S304": 421,
424
+ "S109": 422,
425
+ "S1d9": 423,
426
+ "S367": 424,
427
+ "S1c0": 425,
428
+ "S1ba": 426,
429
+ "S25d": 427,
430
+ "S246": 428,
431
+ "S1a3": 429,
432
+ "S20d": 430,
433
+ "S2bf": 431,
434
+ "S2ba": 432,
435
+ "S124": 433,
436
+ "S1a7": 434,
437
+ "S1a1": 435,
438
+ "S1d6": 436,
439
+ "S312": 437,
440
+ "S274": 438,
441
+ "S1bc": 439,
442
+ "S27b": 440,
443
+ "S24a": 441,
444
+ "S38b": 442,
445
+ "S113": 443,
446
+ "S242": 444,
447
+ "S223": 445,
448
+ "S291": 446,
449
+ "S29c": 447,
450
+ "S33a": 448,
451
+ "S262": 449,
452
+ "S194": 450,
453
+ "S1a8": 451,
454
+ "S35e": 452,
455
+ "S146": 453,
456
+ "S375": 454,
457
+ "S2a1": 455,
458
+ "S1f6": 456,
459
+ "S34b": 457,
460
+ "S1e7": 458,
461
+ "S250": 459,
462
+ "S10d": 460,
463
+ "S138": 461,
464
+ "S2de": 462,
465
+ "S308": 463,
466
+ "S2f5": 464,
467
+ "S282": 465,
468
  "S15e": 466,
469
+ "S103": 467,
470
+ "S1ff": 468,
471
+ "S354": 469,
472
  "S2f4": 470,
473
+ "S31f": 471,
474
+ "S36c": 472,
475
+ "S183": 473,
476
+ "S360": 474,
477
+ "S12a": 475,
478
+ "S352": 476,
479
+ "S279": 477,
480
+ "S328": 478,
481
+ "S338": 479,
482
+ "S31c": 480,
483
+ "S2c8": 481,
484
+ "S1e3": 482,
485
+ "S2c2": 483,
486
+ "S1c2": 484,
487
  "S25b": 485,
488
  "S364": 486,
489
  "S134": 487,
 
498
  "S327": 496,
499
  "S384": 497,
500
  "S1c9": 498,
501
+ "S26e": 499,
502
+ "S11b": 500,
503
  "S2f2": 501,
504
  "S323": 502,
505
  "S1a6": 503,
 
510
  "S286": 508,
511
  "S254": 509,
512
  "S372": 510,
513
+ "S168": 511,
514
+ "S2aa": 512,
515
  "S385": 513,
516
  "S1b0": 514,
517
  "S2f6": 515,
518
  "S162": 516,
519
  "S247": 517,
520
  "S1a4": 518,
521
+ "S24f": 519,
522
+ "S107": 520,
523
+ "S2b1": 521,
524
+ "S2f3": 522,
525
+ "S258": 523,
526
+ "S29d": 524,
527
+ "S19b": 525,
528
+ "S102": 526,
529
+ "S2bc": 527,
530
  "S1c4": 528,
531
  "S1ae": 529,
532
  "S135": 530,
533
+ "S2d0": 531,
534
+ "S1b8": 532,
535
  "S355": 533,
536
+ "S159": 534,
537
+ "S1db": 535,
538
+ "S169": 536,
539
+ "S285": 537,
540
  "S163": 538,
541
  "S11f": 539,
542
  "S329": 540,
 
549
  "S2a8": 547,
550
  "S190": 548,
551
  "S334": 549,
552
+ "S2c0": 550,
553
+ "S131": 551,
554
  "S114": 552,
555
  "S373": 553,
556
+ "S1b3": 554,
557
+ "S12c": 555,
558
  "S200": 556,
559
  "S2ae": 557,
560
  "S18f": 558,
 
563
  "S11c": 561,
564
  "S196": 562,
565
  "S202": 563,
566
+ "S2a7": 564,
567
+ "S25f": 565,
568
  "S326": 566,
569
  "S32e": 567,
570
  "S2cd": 568,
571
  "S1fe": 569,
572
+ "S1d7": 570,
573
+ "S280": 571,
574
  "S12e": 572,
575
  "S18a": 573,
576
  "S322": 574,
577
  "S2af": 575,
578
+ "S2cc": 576,
579
+ "S1bf": 577,
580
  "S318": 578,
581
  "S19f": 579,
582
  "S193": 580,
 
587
  "S13e": 585,
588
  "S1a2": 586,
589
  "S366": 587,
590
+ "S25c": 588,
591
+ "S117": 589,
592
+ "S27d": 590,
593
  "S197": 591,
594
  "S2c9": 592,
595
  "S2ca": 593,
 
599
  "S2b2": 597,
600
  "S104": 598,
601
  "S2ab": 599,
602
+ "S1b7": 600,
603
+ "S1af": 601,
604
+ "S2ce": 602,
605
+ "S263": 603,
606
+ "S264": 604,
607
+ "S1cc": 605,
608
+ "S1cb": 606,
609
+ "S195": 607,
610
+ "S13c": 608,
611
+ "S381": 609,
612
  "S1b2": 610,
613
  "S1aa": 611,
614
  "S191": 612,
 
624
  "S383": 622,
625
  "S1ab": 623,
626
  "S2b5": 624,
627
+ "S1b1": 625,
628
+ "S2a9": 626,
629
+ "S23e": 627,
630
+ "S382": 628,
631
+ "S2cf": 629,
632
+ "S380": 630,
633
+ "S125": 631,
634
+ "S143": 632,
635
+ "S126": 633,
636
+ "S19e": 634,
637
  "S2b0": 635,
638
  "S136": 636,
639
  "S137": 637,
vocab.trg.3.json CHANGED
@@ -3,432 +3,416 @@
3
  "<unk>": 1,
4
  "<s>": 2,
5
  "</s>": 3,
6
- "p482": 4,
7
- "p500": 5,
8
- "p493": 6,
9
- "p479": 7,
10
- "p492": 8,
11
  "p489": 9,
12
  "p490": 10,
13
- "p518": 11,
14
- "p494": 12,
15
- "p488": 13,
16
- "p495": 14,
17
- "p491": 15,
18
- "p521": 16,
19
- "p487": 17,
20
- "p496": 18,
21
- "p497": 19,
22
- "p481": 20,
23
- "p486": 21,
24
- "p485": 22,
25
- "p501": 23,
26
- "p511": 24,
27
- "p498": 25,
28
- "p512": 26,
29
- "p483": 27,
30
- "p480": 28,
31
- "p464": 29,
32
- "p477": 30,
33
- "p515": 31,
34
- "p502": 32,
35
- "p476": 33,
36
- "p508": 34,
37
- "p510": 35,
38
- "p520": 36,
39
- "p519": 37,
40
- "p513": 38,
41
- "p509": 39,
42
- "p503": 40,
43
- "p522": 41,
44
- "p514": 42,
45
- "p505": 43,
46
- "p507": 44,
47
- "p478": 45,
48
- "p484": 46,
49
- "p504": 47,
50
- "p524": 48,
51
- "p523": 49,
52
- "p506": 50,
53
- "p499": 51,
54
- "p463": 52,
55
- "p527": 53,
56
- "p472": 54,
57
- "p474": 55,
58
- "p525": 56,
59
- "p526": 57,
60
- "p516": 58,
61
- "p528": 59,
62
- "p475": 60,
63
- "p517": 61,
64
- "p473": 62,
65
- "p467": 63,
66
- "p468": 64,
67
- "p471": 65,
68
- "p529": 66,
69
- "p470": 67,
70
- "p469": 68,
71
- "p530": 69,
72
- "p533": 70,
73
- "p531": 71,
74
- "p466": 72,
75
- "p534": 73,
76
- "p532": 74,
77
- "p535": 75,
78
- "p537": 76,
79
- "p465": 77,
80
- "p536": 78,
81
- "p540": 79,
82
- "p538": 80,
83
- "p539": 81,
84
- "p541": 82,
85
- "p542": 83,
86
- "p461": 84,
87
- "p543": 85,
88
- "p462": 86,
89
- "p544": 87,
90
- "p460": 88,
91
- "p453": 89,
92
- "p459": 90,
93
- "p545": 91,
94
- "p452": 92,
95
- "p547": 93,
96
- "p548": 94,
97
- "p546": 95,
98
- "p458": 96,
99
- "p454": 97,
100
- "p549": 98,
101
- "p455": 99,
102
- "p457": 100,
103
- "p456": 101,
104
- "p550": 102,
105
- "p451": 103,
106
- "p551": 104,
107
- "p552": 105,
108
- "p553": 106,
109
- "p554": 107,
110
- "p555": 108,
111
- "p556": 109,
112
- "p450": 110,
113
- "p557": 111,
114
- "p438": 112,
115
- "p449": 113,
116
- "p437": 114,
117
- "p558": 115,
118
- "p560": 116,
119
- "p559": 117,
120
- "p448": 118,
121
- "p562": 119,
122
- "p447": 120,
123
- "p561": 121,
124
- "p563": 122,
125
- "p446": 123,
126
- "p439": 124,
127
- "p444": 125,
128
- "p445": 126,
129
- "p440": 127,
130
- "p442": 128,
131
- "p564": 129,
132
- "p443": 130,
133
- "p565": 131,
134
- "p436": 132,
135
- "p441": 133,
136
- "p566": 134,
137
- "p567": 135,
138
- "p570": 136,
139
- "p569": 137,
140
- "p571": 138,
141
- "p568": 139,
142
- "p423": 140,
143
- "p577": 141,
144
- "p573": 142,
145
- "p578": 143,
146
- "p572": 144,
147
- "p576": 145,
148
- "p422": 146,
149
- "p424": 147,
150
- "p435": 148,
151
- "p574": 149,
152
- "p575": 150,
153
- "p433": 151,
154
- "p434": 152,
155
- "p425": 153,
156
- "p430": 154,
157
- "p579": 155,
158
- "p432": 156,
159
- "p431": 157,
160
- "p580": 158,
161
- "p582": 159,
162
- "p429": 160,
163
- "p581": 161,
164
- "p426": 162,
165
- "p428": 163,
166
- "p427": 164,
167
- "p421": 165,
168
- "p409": 166,
169
- "p583": 167,
170
- "p588": 168,
171
- "p584": 169,
172
- "p591": 170,
173
- "p408": 171,
174
- "p587": 172,
175
- "p592": 173,
176
- "p420": 174,
177
- "p593": 175,
178
- "p585": 176,
179
- "p586": 177,
180
- "p419": 178,
181
- "p417": 179,
182
- "p407": 180,
183
- "p590": 181,
184
- "p410": 182,
185
- "p589": 183,
186
- "p411": 184,
187
- "p416": 185,
188
- "p418": 186,
189
- "p412": 187,
190
- "p414": 188,
191
- "p413": 189,
192
- "p415": 190,
193
- "p594": 191,
194
- "p406": 192,
195
- "p596": 193,
196
- "p595": 194,
197
- "p405": 195,
198
- "p404": 196,
199
- "p597": 197,
200
- "p599": 198,
201
- "p606": 199,
202
- "p600": 200,
203
- "p607": 201,
204
- "p605": 202,
205
- "p598": 203,
206
- "p403": 204,
207
- "p601": 205,
208
- "p604": 206,
209
- "p602": 207,
210
- "p395": 208,
211
- "p402": 209,
212
- "p393": 210,
213
- "p394": 211,
214
- "p608": 212,
215
- "p401": 213,
216
- "p603": 214,
217
- "p624": 215,
218
- "p400": 216,
219
- "p396": 217,
220
- "p610": 218,
221
- "p613": 219,
222
- "p399": 220,
223
- "p609": 221,
224
- "p398": 222,
225
- "p614": 223,
226
- "p611": 224,
227
- "p397": 225,
228
- "p623": 226,
229
- "p612": 227,
230
- "p376": 228,
231
- "p389": 229,
232
- "p619": 230,
233
- "p391": 231,
234
- "p392": 232,
235
- "p618": 233,
236
- "p622": 234,
237
- "p620": 235,
238
- "p388": 236,
239
- "p387": 237,
240
- "p617": 238,
241
- "p386": 239,
242
- "p621": 240,
243
- "p390": 241,
244
- "p616": 242,
245
- "p615": 243,
246
- "p377": 244,
247
- "p382": 245,
248
- "p385": 246,
249
- "p384": 247,
250
- "p381": 248,
251
- "p383": 249,
252
- "p380": 250,
253
- "p379": 251,
254
- "p378": 252,
255
- "p625": 253,
256
- "p626": 254,
257
- "p375": 255,
258
- "p627": 256,
259
- "p631": 257,
260
- "p629": 258,
261
- "p628": 259,
262
- "p630": 260,
263
- "p633": 261,
264
- "p632": 262,
265
- "p634": 263,
266
- "p635": 264,
267
- "p636": 265,
268
- "p373": 266,
269
- "p640": 267,
270
- "p637": 268,
271
- "p638": 269,
272
- "p374": 270,
273
- "p371": 271,
274
- "p639": 272,
275
- "p372": 273,
276
- "p641": 274,
277
- "p643": 275,
278
- "p370": 276,
279
- "p368": 277,
280
- "p645": 278,
281
- "p365": 279,
282
- "p362": 280,
283
- "p369": 281,
284
- "p644": 282,
285
- "p646": 283,
286
- "p642": 284,
287
- "p366": 285,
288
- "p360": 286,
289
- "p648": 287,
290
- "p363": 288,
291
- "p650": 289,
292
- "p367": 290,
293
- "p649": 291,
294
- "p364": 292,
295
- "p651": 293,
296
- "p354": 294,
297
- "p654": 295,
298
- "p655": 296,
299
- "p652": 297,
300
- "p361": 298,
301
- "p647": 299,
302
- "p653": 300,
303
- "p664": 301,
304
- "p355": 302,
305
- "p351": 303,
306
- "p346": 304,
307
- "p665": 305,
308
- "p657": 306,
309
- "p353": 307,
310
- "p348": 308,
311
- "p356": 309,
312
- "p337": 310,
313
- "p667": 311,
314
- "p342": 312,
315
- "p357": 313,
316
- "p673": 314,
317
- "p661": 315,
318
- "p349": 316,
319
- "p359": 317,
320
- "p660": 318,
321
- "p656": 319,
322
- "p659": 320,
323
- "p663": 321,
324
- "p352": 322,
325
- "p358": 323,
326
- "p343": 324,
327
- "p350": 325,
328
- "p347": 326,
329
- "p662": 327,
330
- "p338": 328,
331
- "p658": 329,
332
- "p669": 330,
333
- "p671": 331,
334
- "p344": 332,
335
- "p679": 333,
336
- "p666": 334,
337
- "p670": 335,
338
- "p341": 336,
339
- "p335": 337,
340
- "p345": 338,
341
- "p339": 339,
342
- "p688": 340,
343
- "p700": 341,
344
- "p684": 342,
345
- "p680": 343,
346
- "p340": 344,
347
- "p683": 345,
348
- "p333": 346,
349
- "p326": 347,
350
- "p685": 348,
351
- "p331": 349,
352
- "p676": 350,
353
- "p687": 351,
354
- "p675": 352,
355
- "p682": 353,
356
- "p334": 354,
357
- "p320": 355,
358
- "p697": 356,
359
- "p672": 357,
360
- "p692": 358,
361
- "p689": 359,
362
- "p336": 360,
363
- "p693": 361,
364
- "p690": 362,
365
- "p715": 363,
366
- "p711": 364,
367
- "p703": 365,
368
- "p691": 366,
369
- "p668": 367,
370
- "p698": 368,
371
- "p323": 369,
372
- "p309": 370,
373
- "p705": 371,
374
- "p330": 372,
375
- "p317": 373,
376
- "p303": 374,
377
- "p311": 375,
378
- "p714": 376,
379
- "p713": 377,
380
- "p327": 378,
381
- "p325": 379,
382
- "p329": 380,
383
- "p718": 381,
384
- "p681": 382,
385
- "p677": 383,
386
- "p674": 384,
387
- "p321": 385,
388
- "p313": 386,
389
- "p708": 387,
390
- "p696": 388,
391
- "p706": 389,
392
- "p314": 390,
393
- "p288": 391,
394
- "p678": 392,
395
- "p318": 393,
396
- "p702": 394,
397
- "p719": 395,
398
- "p707": 396,
399
- "p725": 397,
400
- "p699": 398,
401
- "p332": 399,
402
- "p704": 400,
403
- "p324": 401,
404
- "p307": 402,
405
- "p315": 403,
406
- "p308": 404,
407
- "p304": 405,
408
- "p695": 406,
409
- "p319": 407,
410
- "p310": 408,
411
- "p316": 409,
412
- "p312": 410,
413
- "p298": 411,
414
- "p295": 412,
415
- "p710": 413,
416
- "p283": 414,
417
- "p282": 415,
418
- "p281": 416,
419
- "p280": 417,
420
- "p278": 418,
421
- "p717": 419,
422
- "p322": 420,
423
- "p300": 421,
424
- "p724": 422,
425
- "p701": 423,
426
- "p686": 424,
427
- "p301": 425,
428
- "p291": 426,
429
- "<pad427>": 427,
430
- "<pad428>": 428,
431
- "<pad429>": 429,
432
- "<pad430>": 430,
433
- "<pad431>": 431
434
  }
 
3
  "<unk>": 1,
4
  "<s>": 2,
5
  "</s>": 3,
6
+ "p500": 4,
7
+ "p482": 5,
8
+ "p492": 6,
9
+ "p493": 7,
10
+ "p479": 8,
11
  "p489": 9,
12
  "p490": 10,
13
+ "p488": 11,
14
+ "p491": 12,
15
+ "p494": 13,
16
+ "p487": 14,
17
+ "p495": 15,
18
+ "p486": 16,
19
+ "p485": 17,
20
+ "p481": 18,
21
+ "p496": 19,
22
+ "p501": 20,
23
+ "p477": 21,
24
+ "p497": 22,
25
+ "p498": 23,
26
+ "p483": 24,
27
+ "p480": 25,
28
+ "p476": 26,
29
+ "p464": 27,
30
+ "p502": 28,
31
+ "p478": 29,
32
+ "p505": 30,
33
+ "p484": 31,
34
+ "p503": 32,
35
+ "p504": 33,
36
+ "p499": 34,
37
+ "p511": 35,
38
+ "p510": 36,
39
+ "p507": 37,
40
+ "p509": 38,
41
+ "p512": 39,
42
+ "p506": 40,
43
+ "p463": 41,
44
+ "p474": 42,
45
+ "p472": 43,
46
+ "p508": 44,
47
+ "p475": 45,
48
+ "p513": 46,
49
+ "p473": 47,
50
+ "p515": 48,
51
+ "p467": 49,
52
+ "p514": 50,
53
+ "p468": 51,
54
+ "p519": 52,
55
+ "p471": 53,
56
+ "p520": 54,
57
+ "p518": 55,
58
+ "p521": 56,
59
+ "p470": 57,
60
+ "p469": 58,
61
+ "p516": 59,
62
+ "p517": 60,
63
+ "p522": 61,
64
+ "p466": 62,
65
+ "p523": 63,
66
+ "p524": 64,
67
+ "p465": 65,
68
+ "p525": 66,
69
+ "p526": 67,
70
+ "p527": 68,
71
+ "p461": 69,
72
+ "p462": 70,
73
+ "p528": 71,
74
+ "p460": 72,
75
+ "p453": 73,
76
+ "p459": 74,
77
+ "p452": 75,
78
+ "p529": 76,
79
+ "p458": 77,
80
+ "p530": 78,
81
+ "p454": 79,
82
+ "p531": 80,
83
+ "p455": 81,
84
+ "p457": 82,
85
+ "p456": 83,
86
+ "p532": 84,
87
+ "p451": 85,
88
+ "p533": 86,
89
+ "p534": 87,
90
+ "p535": 88,
91
+ "p540": 89,
92
+ "p541": 90,
93
+ "p538": 91,
94
+ "p536": 92,
95
+ "p537": 93,
96
+ "p539": 94,
97
+ "p450": 95,
98
+ "p542": 96,
99
+ "p449": 97,
100
+ "p438": 98,
101
+ "p437": 99,
102
+ "p448": 100,
103
+ "p447": 101,
104
+ "p446": 102,
105
+ "p439": 103,
106
+ "p543": 104,
107
+ "p445": 105,
108
+ "p444": 106,
109
+ "p440": 107,
110
+ "p544": 108,
111
+ "p547": 109,
112
+ "p545": 110,
113
+ "p442": 111,
114
+ "p546": 112,
115
+ "p443": 113,
116
+ "p548": 114,
117
+ "p436": 115,
118
+ "p441": 116,
119
+ "p555": 117,
120
+ "p549": 118,
121
+ "p553": 119,
122
+ "p551": 120,
123
+ "p556": 121,
124
+ "p552": 122,
125
+ "p550": 123,
126
+ "p423": 124,
127
+ "p557": 125,
128
+ "p554": 126,
129
+ "p435": 127,
130
+ "p422": 128,
131
+ "p424": 129,
132
+ "p433": 130,
133
+ "p434": 131,
134
+ "p558": 132,
135
+ "p425": 133,
136
+ "p430": 134,
137
+ "p560": 135,
138
+ "p432": 136,
139
+ "p559": 137,
140
+ "p431": 138,
141
+ "p561": 139,
142
+ "p429": 140,
143
+ "p562": 141,
144
+ "p426": 142,
145
+ "p428": 143,
146
+ "p427": 144,
147
+ "p563": 145,
148
+ "p421": 146,
149
+ "p564": 147,
150
+ "p409": 148,
151
+ "p571": 149,
152
+ "p569": 150,
153
+ "p565": 151,
154
+ "p567": 152,
155
+ "p570": 153,
156
+ "p566": 154,
157
+ "p408": 155,
158
+ "p568": 156,
159
+ "p420": 157,
160
+ "p572": 158,
161
+ "p419": 159,
162
+ "p407": 160,
163
+ "p417": 161,
164
+ "p410": 162,
165
+ "p573": 163,
166
+ "p411": 164,
167
+ "p416": 165,
168
+ "p574": 166,
169
+ "p418": 167,
170
+ "p412": 168,
171
+ "p577": 169,
172
+ "p414": 170,
173
+ "p575": 171,
174
+ "p413": 172,
175
+ "p415": 173,
176
+ "p406": 174,
177
+ "p576": 175,
178
+ "p578": 176,
179
+ "p580": 177,
180
+ "p582": 178,
181
+ "p579": 179,
182
+ "p581": 180,
183
+ "p583": 181,
184
+ "p588": 182,
185
+ "p587": 183,
186
+ "p584": 184,
187
+ "p405": 185,
188
+ "p404": 186,
189
+ "p585": 187,
190
+ "p586": 188,
191
+ "p403": 189,
192
+ "p395": 190,
193
+ "p402": 191,
194
+ "p393": 192,
195
+ "p589": 193,
196
+ "p394": 194,
197
+ "p401": 195,
198
+ "p590": 196,
199
+ "p400": 197,
200
+ "p591": 198,
201
+ "p396": 199,
202
+ "p399": 200,
203
+ "p592": 201,
204
+ "p398": 202,
205
+ "p397": 203,
206
+ "p593": 204,
207
+ "p594": 205,
208
+ "p376": 206,
209
+ "p389": 207,
210
+ "p391": 208,
211
+ "p392": 209,
212
+ "p595": 210,
213
+ "p388": 211,
214
+ "p387": 212,
215
+ "p596": 213,
216
+ "p386": 214,
217
+ "p390": 215,
218
+ "p599": 216,
219
+ "p597": 217,
220
+ "p377": 218,
221
+ "p382": 219,
222
+ "p385": 220,
223
+ "p600": 221,
224
+ "p598": 222,
225
+ "p384": 223,
226
+ "p381": 224,
227
+ "p383": 225,
228
+ "p601": 226,
229
+ "p380": 227,
230
+ "p379": 228,
231
+ "p378": 229,
232
+ "p602": 230,
233
+ "p606": 231,
234
+ "p603": 232,
235
+ "p604": 233,
236
+ "p605": 234,
237
+ "p607": 235,
238
+ "p608": 236,
239
+ "p609": 237,
240
+ "p610": 238,
241
+ "p375": 239,
242
+ "p611": 240,
243
+ "p612": 241,
244
+ "p613": 242,
245
+ "p614": 243,
246
+ "p615": 244,
247
+ "p619": 245,
248
+ "p618": 246,
249
+ "p616": 247,
250
+ "p617": 248,
251
+ "p373": 249,
252
+ "p620": 250,
253
+ "p621": 251,
254
+ "p374": 252,
255
+ "p371": 253,
256
+ "p625": 254,
257
+ "p372": 255,
258
+ "p623": 256,
259
+ "p622": 257,
260
+ "p370": 258,
261
+ "p629": 259,
262
+ "p624": 260,
263
+ "p368": 261,
264
+ "p626": 262,
265
+ "p365": 263,
266
+ "p362": 264,
267
+ "p631": 265,
268
+ "p369": 266,
269
+ "p628": 267,
270
+ "p627": 268,
271
+ "p366": 269,
272
+ "p360": 270,
273
+ "p634": 271,
274
+ "p363": 272,
275
+ "p632": 273,
276
+ "p630": 274,
277
+ "p633": 275,
278
+ "p367": 276,
279
+ "p364": 277,
280
+ "p637": 278,
281
+ "p354": 279,
282
+ "p361": 280,
283
+ "p635": 281,
284
+ "p355": 282,
285
+ "p351": 283,
286
+ "p640": 284,
287
+ "p346": 285,
288
+ "p639": 286,
289
+ "p636": 287,
290
+ "p638": 288,
291
+ "p641": 289,
292
+ "p353": 290,
293
+ "p348": 291,
294
+ "p356": 292,
295
+ "p643": 293,
296
+ "p337": 294,
297
+ "p649": 295,
298
+ "p342": 296,
299
+ "p357": 297,
300
+ "p655": 298,
301
+ "p653": 299,
302
+ "p349": 300,
303
+ "p359": 301,
304
+ "p648": 302,
305
+ "p646": 303,
306
+ "p642": 304,
307
+ "p358": 305,
308
+ "p352": 306,
309
+ "p650": 307,
310
+ "p343": 308,
311
+ "p645": 309,
312
+ "p350": 310,
313
+ "p347": 311,
314
+ "p651": 312,
315
+ "p338": 313,
316
+ "p665": 314,
317
+ "p652": 315,
318
+ "p344": 316,
319
+ "p647": 317,
320
+ "p341": 318,
321
+ "p654": 319,
322
+ "p335": 320,
323
+ "p345": 321,
324
+ "p339": 322,
325
+ "p340": 323,
326
+ "p660": 324,
327
+ "p679": 325,
328
+ "p663": 326,
329
+ "p333": 327,
330
+ "p659": 328,
331
+ "p326": 329,
332
+ "p331": 330,
333
+ "p644": 331,
334
+ "p662": 332,
335
+ "p688": 333,
336
+ "p658": 334,
337
+ "p664": 335,
338
+ "p334": 336,
339
+ "p320": 337,
340
+ "p700": 338,
341
+ "p666": 339,
342
+ "p673": 340,
343
+ "p684": 341,
344
+ "p336": 342,
345
+ "p671": 343,
346
+ "p657": 344,
347
+ "p669": 345,
348
+ "p667": 346,
349
+ "p670": 347,
350
+ "p698": 348,
351
+ "p323": 349,
352
+ "p309": 350,
353
+ "p692": 351,
354
+ "p330": 352,
355
+ "p317": 353,
356
+ "p303": 354,
357
+ "p311": 355,
358
+ "p661": 356,
359
+ "p656": 357,
360
+ "p327": 358,
361
+ "p325": 359,
362
+ "p668": 360,
363
+ "p329": 361,
364
+ "p321": 362,
365
+ "p313": 363,
366
+ "p696": 364,
367
+ "p314": 365,
368
+ "p288": 366,
369
+ "p675": 367,
370
+ "p318": 368,
371
+ "p690": 369,
372
+ "p672": 370,
373
+ "p680": 371,
374
+ "p691": 372,
375
+ "p682": 373,
376
+ "p332": 374,
377
+ "p704": 375,
378
+ "p689": 376,
379
+ "p683": 377,
380
+ "p676": 378,
381
+ "p324": 379,
382
+ "p307": 380,
383
+ "p693": 381,
384
+ "p674": 382,
385
+ "p315": 383,
386
+ "p308": 384,
387
+ "p304": 385,
388
+ "p319": 386,
389
+ "p697": 387,
390
+ "p685": 388,
391
+ "p310": 389,
392
+ "p316": 390,
393
+ "p312": 391,
394
+ "p298": 392,
395
+ "p295": 393,
396
+ "p705": 394,
397
+ "p703": 395,
398
+ "p702": 396,
399
+ "p699": 397,
400
+ "p678": 398,
401
+ "p283": 399,
402
+ "p282": 400,
403
+ "p281": 401,
404
+ "p280": 402,
405
+ "p278": 403,
406
+ "p717": 404,
407
+ "p322": 405,
408
+ "p300": 406,
409
+ "p710": 407,
410
+ "p701": 408,
411
+ "p695": 409,
412
+ "p681": 410,
413
+ "p301": 411,
414
+ "p291": 412,
415
+ "<pad413>": 413,
416
+ "<pad414>": 414,
417
+ "<pad415>": 415
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
418
  }
vocab.trg.4.json CHANGED
@@ -3,532 +3,532 @@
3
  "<unk>": 1,
4
  "<s>": 2,
5
  "</s>": 3,
6
- "p483": 4,
7
- "p482": 5,
8
- "p500": 6,
9
  "p496": 7,
10
- "p518": 8,
11
- "p477": 9,
12
- "p485": 10,
13
- "p488": 11,
14
- "p487": 12,
15
- "p493": 13,
16
  "p481": 14,
17
- "p503": 15,
18
- "p517": 16,
19
- "p476": 17,
20
- "p490": 18,
21
- "p515": 19,
22
- "p520": 20,
23
- "p484": 21,
24
- "p523": 22,
25
- "p495": 23,
26
- "p525": 24,
27
- "p489": 25,
28
- "p524": 26,
29
- "p498": 27,
30
- "p486": 28,
31
- "p494": 29,
32
- "p497": 30,
33
- "p526": 31,
34
- "p519": 32,
35
- "p491": 33,
36
- "p521": 34,
37
- "p522": 35,
38
- "p505": 36,
39
- "p504": 37,
40
- "p527": 38,
41
- "p499": 39,
42
- "p492": 40,
43
- "p528": 41,
44
- "p506": 42,
45
- "p531": 43,
46
- "p530": 44,
47
- "p501": 45,
48
- "p478": 46,
49
- "p480": 47,
50
- "p529": 48,
51
- "p502": 49,
52
- "p510": 50,
53
- "p508": 51,
54
- "p532": 52,
55
- "p479": 53,
56
- "p511": 54,
57
- "p475": 55,
58
- "p516": 56,
59
- "p507": 57,
60
- "p509": 58,
61
- "p514": 59,
62
- "p512": 60,
63
- "p533": 61,
64
- "p513": 62,
65
- "p534": 63,
66
- "p474": 64,
67
- "p535": 65,
68
- "p473": 66,
69
- "p536": 67,
70
- "p537": 68,
71
- "p538": 69,
72
- "p472": 70,
73
- "p471": 71,
74
- "p470": 72,
75
- "p469": 73,
76
- "p539": 74,
77
- "p468": 75,
78
- "p540": 76,
79
- "p541": 77,
80
- "p542": 78,
81
- "p543": 79,
82
- "p544": 80,
83
- "p467": 81,
84
- "p545": 82,
85
- "p466": 83,
86
- "p546": 84,
87
- "p550": 85,
88
- "p548": 86,
89
- "p547": 87,
90
- "p549": 88,
91
- "p465": 89,
92
- "p464": 90,
93
- "p551": 91,
94
- "p552": 92,
95
  "p553": 93,
96
- "p554": 94,
97
- "p463": 95,
98
- "p557": 96,
99
- "p555": 97,
100
- "p556": 98,
101
- "p462": 99,
102
- "p558": 100,
103
- "p559": 101,
104
- "p560": 102,
105
- "p561": 103,
106
- "p461": 104,
107
- "p562": 105,
108
- "p564": 106,
109
- "p563": 107,
110
- "p565": 108,
111
- "p460": 109,
112
- "p566": 110,
113
- "p567": 111,
114
- "p568": 112,
115
- "p569": 113,
116
- "p570": 114,
117
- "p459": 115,
118
- "p457": 116,
119
- "p571": 117,
120
- "p573": 118,
121
- "p572": 119,
122
- "p458": 120,
123
- "p574": 121,
124
- "p575": 122,
125
- "p576": 123,
126
- "p456": 124,
127
- "p577": 125,
128
- "p578": 126,
129
- "p454": 127,
130
- "p455": 128,
131
- "p579": 129,
132
- "p580": 130,
133
- "p582": 131,
134
- "p581": 132,
135
- "p453": 133,
136
- "p452": 134,
137
- "p450": 135,
138
- "p583": 136,
139
- "p584": 137,
140
- "p585": 138,
141
- "p451": 139,
142
- "p586": 140,
143
- "p587": 141,
144
- "p589": 142,
145
- "p449": 143,
146
- "p588": 144,
147
- "p591": 145,
148
- "p447": 146,
149
- "p590": 147,
150
- "p448": 148,
151
- "p592": 149,
152
- "p593": 150,
153
- "p442": 151,
154
- "p446": 152,
155
- "p594": 153,
156
- "p596": 154,
157
- "p445": 155,
158
- "p595": 156,
159
- "p444": 157,
160
- "p441": 158,
161
- "p597": 159,
162
- "p443": 160,
163
- "p598": 161,
164
- "p438": 162,
165
- "p432": 163,
166
- "p599": 164,
167
- "p439": 165,
168
- "p440": 166,
169
- "p437": 167,
170
- "p600": 168,
171
- "p434": 169,
172
- "p436": 170,
173
- "p602": 171,
174
- "p601": 172,
175
- "p433": 173,
176
- "p435": 174,
177
- "p604": 175,
178
- "p603": 176,
179
- "p431": 177,
180
- "p605": 178,
181
- "p606": 179,
182
- "p428": 180,
183
- "p607": 181,
184
- "p609": 182,
185
- "p427": 183,
186
- "p429": 184,
187
- "p430": 185,
188
- "p426": 186,
189
- "p610": 187,
190
- "p608": 188,
191
- "p425": 189,
192
- "p424": 190,
193
- "p611": 191,
194
- "p422": 192,
195
- "p421": 193,
196
- "p420": 194,
197
- "p423": 195,
198
- "p417": 196,
199
- "p612": 197,
200
- "p614": 198,
201
- "p613": 199,
202
- "p419": 200,
203
- "p615": 201,
204
- "p415": 202,
205
- "p418": 203,
206
- "p416": 204,
207
- "p616": 205,
208
- "p414": 206,
209
- "p617": 207,
210
- "p619": 208,
211
- "p618": 209,
212
- "p620": 210,
213
- "p412": 211,
214
- "p621": 212,
215
- "p413": 213,
216
- "p406": 214,
217
- "p409": 215,
218
- "p407": 216,
219
- "p622": 217,
220
- "p408": 218,
221
- "p410": 219,
222
- "p411": 220,
223
- "p405": 221,
224
- "p404": 222,
225
- "p400": 223,
226
- "p623": 224,
227
- "p403": 225,
228
- "p624": 226,
229
- "p397": 227,
230
- "p402": 228,
231
- "p625": 229,
232
- "p401": 230,
233
- "p626": 231,
234
- "p395": 232,
235
- "p627": 233,
236
- "p398": 234,
237
- "p399": 235,
238
- "p396": 236,
239
- "p628": 237,
240
- "p394": 238,
241
- "p632": 239,
242
- "p631": 240,
243
- "p629": 241,
244
- "p630": 242,
245
- "p393": 243,
246
- "p389": 244,
247
- "p392": 245,
248
- "p391": 246,
249
- "p633": 247,
250
- "p388": 248,
251
- "p636": 249,
252
- "p634": 250,
253
- "p638": 251,
254
- "p390": 252,
255
- "p384": 253,
256
- "p385": 254,
257
- "p635": 255,
258
- "p386": 256,
259
- "p637": 257,
260
- "p387": 258,
261
- "p642": 259,
262
- "p380": 260,
263
- "p382": 261,
264
- "p383": 262,
265
- "p639": 263,
266
- "p381": 264,
267
  "p641": 265,
268
- "p379": 266,
269
- "p640": 267,
270
- "p646": 268,
271
- "p645": 269,
272
- "p643": 270,
273
- "p374": 271,
274
- "p377": 272,
275
- "p378": 273,
276
- "p644": 274,
277
- "p653": 275,
278
- "p647": 276,
279
- "p376": 277,
280
- "p367": 278,
281
- "p369": 279,
282
- "p366": 280,
283
- "p368": 281,
284
- "p372": 282,
285
- "p375": 283,
286
- "p649": 284,
287
- "p370": 285,
288
- "p675": 286,
289
- "p650": 287,
290
- "p648": 288,
291
- "p365": 289,
292
- "p371": 290,
293
- "p654": 291,
294
- "p363": 292,
295
- "p373": 293,
296
- "p664": 294,
297
- "p331": 295,
298
- "p362": 296,
299
- "p364": 297,
300
- "p655": 298,
301
- "p652": 299,
302
- "p360": 300,
303
- "p352": 301,
304
- "p672": 302,
305
- "p359": 303,
306
- "p663": 304,
307
- "p657": 305,
308
- "p661": 306,
309
- "p361": 307,
310
- "p665": 308,
311
- "p651": 309,
312
- "p656": 310,
313
- "p355": 311,
314
- "p662": 312,
315
- "p658": 313,
316
- "p674": 314,
317
- "p659": 315,
318
- "p356": 316,
319
- "p668": 317,
320
- "p671": 318,
321
- "p358": 319,
322
- "p660": 320,
323
- "p669": 321,
324
- "p666": 322,
325
- "p670": 323,
326
- "p676": 324,
327
- "p673": 325,
328
- "p344": 326,
329
- "p677": 327,
330
- "p696": 328,
331
- "p350": 329,
332
- "p288": 330,
333
- "p357": 331,
334
- "p353": 332,
335
- "p351": 333,
336
- "p347": 334,
337
- "p309": 335,
338
- "p345": 336,
339
- "p354": 337,
340
- "p718": 338,
341
- "p341": 339,
342
- "p330": 340,
343
- "p335": 341,
344
- "p678": 342,
345
- "p334": 343,
346
- "p667": 344,
347
- "p328": 345,
348
- "p349": 346,
349
- "p332": 347,
350
- "p337": 348,
351
- "p348": 349,
352
- "p338": 350,
353
- "p327": 351,
354
- "p679": 352,
355
- "p333": 353,
356
- "p346": 354,
357
- "p336": 355,
358
- "p343": 356,
359
- "p340": 357,
360
- "p681": 358,
361
- "p682": 359,
362
- "p339": 360,
363
- "p342": 361,
364
- "p324": 362,
365
- "p680": 363,
366
- "p329": 364,
367
- "p710": 365,
368
- "p711": 366,
369
- "p326": 367,
370
- "p325": 368,
371
- "p692": 369,
372
- "p683": 370,
373
- "p323": 371,
374
- "p295": 372,
375
- "p702": 373,
376
- "p761": 374,
377
  "p703": 375,
378
- "p691": 376,
379
- "p709": 377,
380
- "p296": 378,
381
- "p245": 379,
382
- "p294": 380,
383
- "p707": 381,
384
- "p685": 382,
385
- "p712": 383,
386
- "p688": 384,
387
- "p706": 385,
388
- "p303": 386,
389
- "p708": 387,
390
- "p700": 388,
391
- "p297": 389,
392
- "p705": 390,
393
- "p302": 391,
394
- "p704": 392,
395
- "p304": 393,
396
- "p300": 394,
397
- "p298": 395,
398
- "p305": 396,
399
- "p701": 397,
400
- "p697": 398,
401
- "p291": 399,
402
- "p684": 400,
403
- "p693": 401,
404
- "p687": 402,
405
- "p686": 403,
406
- "p714": 404,
407
- "p699": 405,
408
- "p299": 406,
409
  "p694": 407,
410
- "p308": 408,
411
- "p301": 409,
412
- "p320": 410,
413
- "p695": 411,
414
- "p311": 412,
415
- "p306": 413,
416
  "p690": 414,
417
- "p689": 415,
418
- "p713": 416,
419
- "p314": 417,
420
- "p698": 418,
421
- "p312": 419,
422
- "p322": 420,
423
- "p310": 421,
424
- "p293": 422,
425
- "p717": 423,
426
- "p321": 424,
427
- "p307": 425,
428
- "p319": 426,
429
- "p313": 427,
430
- "p292": 428,
431
- "p318": 429,
432
- "p715": 430,
433
- "p315": 431,
434
- "p290": 432,
435
- "p317": 433,
436
- "p316": 434,
437
- "p289": 435,
438
  "p716": 436,
439
  "p280": 437,
440
- "p724": 438,
441
- "p720": 439,
442
  "p726": 440,
443
- "p725": 441,
444
- "p287": 442,
445
  "p719": 443,
446
- "p284": 444,
447
- "p723": 445,
448
- "p285": 446,
449
- "p729": 447,
450
- "p279": 448,
451
- "p727": 449,
452
- "p721": 450,
453
- "p282": 451,
454
- "p278": 452,
455
  "p286": 453,
456
- "p276": 454,
457
- "p731": 455,
458
- "p270": 456,
459
- "p728": 457,
460
- "p722": 458,
461
  "p271": 459,
462
- "p730": 460,
463
  "p736": 461,
464
- "p281": 462,
465
- "p269": 463,
466
  "p283": 464,
467
- "p735": 465,
468
- "p740": 466,
469
- "p734": 467,
470
- "p732": 468,
471
- "p739": 469,
472
- "p272": 470,
473
- "p737": 471,
474
- "p275": 472,
475
  "p273": 473,
476
  "p274": 474,
477
- "p733": 475,
478
- "p742": 476,
479
- "p268": 477,
480
- "p263": 478,
481
- "p277": 479,
482
- "p267": 480,
483
- "p738": 481,
484
- "p266": 482,
485
- "p743": 483,
486
- "p746": 484,
487
- "p261": 485,
488
  "p745": 486,
489
  "p744": 487,
490
- "p741": 488,
491
- "p265": 489,
492
- "p259": 490,
493
- "p748": 491,
494
- "p262": 492,
495
- "p747": 493,
496
- "p260": 494,
497
- "p749": 495,
498
- "p258": 496,
499
- "p264": 497,
500
  "p257": 498,
501
  "p755": 499,
502
- "p757": 500,
503
- "p751": 501,
504
- "p760": 502,
505
- "p753": 503,
506
- "p253": 504,
507
- "p251": 505,
508
- "p248": 506,
509
- "p756": 507,
510
- "p255": 508,
511
- "p246": 509,
512
  "p256": 510,
513
  "p759": 511,
514
  "p247": 512,
515
  "p244": 513,
516
  "p252": 514,
517
  "p764": 515,
518
- "p758": 516,
519
- "p254": 517,
520
- "p763": 518,
521
  "p752": 519,
522
- "p765": 520,
523
- "p250": 521,
524
- "p249": 522,
525
- "p766": 523,
526
- "p750": 524,
527
- "p242": 525,
528
- "p226": 526,
529
- "p754": 527,
530
- "p243": 528,
531
- "p781": 529,
532
  "p241": 530,
533
  "p240": 531,
534
  "p234": 532,
@@ -538,68 +538,68 @@
538
  "p774": 536,
539
  "p239": 537,
540
  "p227": 538,
541
- "p786": 539,
542
- "p767": 540,
543
- "p762": 541,
544
- "p233": 542,
545
- "p223": 543,
546
- "p778": 544,
547
- "p771": 545,
548
- "p770": 546,
549
- "p236": 547,
550
- "p231": 548,
551
- "p788": 549,
552
- "p782": 550,
553
- "p779": 551,
554
- "p215": 552,
555
- "p789": 553,
556
- "p784": 554,
557
- "p232": 555,
558
- "p802": 556,
559
- "p775": 557,
560
- "p769": 558,
561
- "p768": 559,
562
- "p235": 560,
563
- "p200": 561,
564
- "p772": 562,
565
- "p220": 563,
566
- "p217": 564,
567
- "p208": 565,
568
- "p808": 566,
569
- "p799": 567,
570
- "p798": 568,
571
- "p792": 569,
572
- "p791": 570,
573
- "p218": 571,
574
- "p216": 572,
575
- "p207": 573,
576
- "p203": 574,
577
- "p809": 575,
578
- "p790": 576,
579
- "p229": 577,
580
- "p195": 578,
581
- "p801": 579,
582
- "p800": 580,
583
- "p794": 581,
584
- "p785": 582,
585
- "p780": 583,
586
- "p776": 584,
587
- "p237": 585,
588
- "p230": 586,
589
- "p214": 587,
590
- "p204": 588,
591
- "p201": 589,
592
- "p787": 590,
593
- "p773": 591,
594
- "p221": 592,
595
- "p219": 593,
596
- "p213": 594,
597
- "p210": 595,
598
- "p197": 596,
599
- "p193": 597,
600
- "p188": 598,
601
- "p183": 599,
602
- "p811": 600,
603
  "p783": 601,
604
  "p777": 602,
605
  "p222": 603,
@@ -623,69 +623,69 @@
623
  "p198": 621,
624
  "p171": 622,
625
  "p834": 623,
626
- "p829": 624,
627
- "p828": 625,
628
- "p823": 626,
629
- "p816": 627,
630
- "p796": 628,
631
- "p178": 629,
632
- "p172": 630,
633
- "p846": 631,
634
- "p833": 632,
635
- "p827": 633,
636
- "p820": 634,
637
- "p819": 635,
638
- "p813": 636,
639
- "p807": 637,
640
- "p803": 638,
641
- "p797": 639,
642
- "p192": 640,
643
- "p191": 641,
644
- "p190": 642,
645
- "p189": 643,
646
- "p184": 644,
647
- "p177": 645,
648
- "p151": 646,
649
- "p848": 647,
650
- "p835": 648,
651
- "p822": 649,
652
- "p818": 650,
653
- "p187": 651,
654
- "p170": 652,
655
- "p160": 653,
656
- "p858": 654,
657
- "p855": 655,
658
- "p843": 656,
659
- "p841": 657,
660
- "p836": 658,
661
- "p825": 659,
662
- "p824": 660,
663
- "p821": 661,
664
- "p817": 662,
665
- "p815": 663,
666
- "p182": 664,
667
- "p181": 665,
668
- "p180": 666,
669
- "p179": 667,
670
- "p176": 668,
671
- "p173": 669,
672
- "p168": 670,
673
- "p163": 671,
674
- "p161": 672,
675
- "p159": 673,
676
- "p158": 674,
677
- "p156": 675,
678
- "p148": 676,
679
- "p891": 677,
680
- "p866": 678,
681
- "p860": 679,
682
- "p844": 680,
683
- "p839": 681,
684
- "p838": 682,
685
- "p837": 683,
686
- "p832": 684,
687
- "p831": 685,
688
- "p830": 686,
689
  "p814": 687,
690
  "p185": 688,
691
  "p174": 689,
 
3
  "<unk>": 1,
4
  "<s>": 2,
5
  "</s>": 3,
6
+ "p500": 4,
7
+ "p483": 5,
8
+ "p482": 6,
9
  "p496": 7,
10
+ "p477": 8,
11
+ "p485": 9,
12
+ "p488": 10,
13
+ "p487": 11,
14
+ "p493": 12,
15
+ "p503": 13,
16
  "p481": 14,
17
+ "p476": 15,
18
+ "p490": 16,
19
+ "p484": 17,
20
+ "p498": 18,
21
+ "p495": 19,
22
+ "p489": 20,
23
+ "p497": 21,
24
+ "p494": 22,
25
+ "p486": 23,
26
+ "p491": 24,
27
+ "p505": 25,
28
+ "p504": 26,
29
+ "p499": 27,
30
+ "p492": 28,
31
+ "p506": 29,
32
+ "p501": 30,
33
+ "p480": 31,
34
+ "p478": 32,
35
+ "p502": 33,
36
+ "p475": 34,
37
+ "p479": 35,
38
+ "p510": 36,
39
+ "p507": 37,
40
+ "p509": 38,
41
+ "p508": 39,
42
+ "p474": 40,
43
+ "p511": 41,
44
+ "p512": 42,
45
+ "p473": 43,
46
+ "p518": 44,
47
+ "p520": 45,
48
+ "p519": 46,
49
+ "p472": 47,
50
+ "p471": 48,
51
+ "p513": 49,
52
+ "p470": 50,
53
+ "p521": 51,
54
+ "p517": 52,
55
+ "p514": 53,
56
+ "p522": 54,
57
+ "p523": 55,
58
+ "p468": 56,
59
+ "p516": 57,
60
+ "p469": 58,
61
+ "p526": 59,
62
+ "p515": 60,
63
+ "p525": 61,
64
+ "p531": 62,
65
+ "p524": 63,
66
+ "p530": 64,
67
+ "p527": 65,
68
+ "p528": 66,
69
+ "p467": 67,
70
+ "p529": 68,
71
+ "p532": 69,
72
+ "p533": 70,
73
+ "p466": 71,
74
+ "p534": 72,
75
+ "p538": 73,
76
+ "p535": 74,
77
+ "p536": 75,
78
+ "p537": 76,
79
+ "p465": 77,
80
+ "p464": 78,
81
+ "p539": 79,
82
+ "p543": 80,
83
+ "p540": 81,
84
+ "p541": 82,
85
+ "p542": 83,
86
+ "p463": 84,
87
+ "p544": 85,
88
+ "p462": 86,
89
+ "p545": 87,
90
+ "p548": 88,
91
+ "p546": 89,
92
+ "p547": 90,
93
+ "p549": 91,
94
+ "p550": 92,
95
  "p553": 93,
96
+ "p552": 94,
97
+ "p461": 95,
98
+ "p551": 96,
99
+ "p460": 97,
100
+ "p554": 98,
101
+ "p555": 99,
102
+ "p556": 100,
103
+ "p459": 101,
104
+ "p557": 102,
105
+ "p457": 103,
106
+ "p558": 104,
107
+ "p560": 105,
108
+ "p559": 106,
109
+ "p458": 107,
110
+ "p561": 108,
111
+ "p562": 109,
112
+ "p456": 110,
113
+ "p563": 111,
114
+ "p564": 112,
115
+ "p454": 113,
116
+ "p565": 114,
117
+ "p567": 115,
118
+ "p455": 116,
119
+ "p566": 117,
120
+ "p453": 118,
121
+ "p450": 119,
122
+ "p452": 120,
123
+ "p568": 121,
124
+ "p569": 122,
125
+ "p570": 123,
126
+ "p571": 124,
127
+ "p451": 125,
128
+ "p573": 126,
129
+ "p572": 127,
130
+ "p574": 128,
131
+ "p449": 129,
132
+ "p575": 130,
133
+ "p447": 131,
134
+ "p448": 132,
135
+ "p577": 133,
136
+ "p576": 134,
137
+ "p578": 135,
138
+ "p442": 136,
139
+ "p446": 137,
140
+ "p579": 138,
141
+ "p445": 139,
142
+ "p580": 140,
143
+ "p441": 141,
144
+ "p444": 142,
145
+ "p443": 143,
146
+ "p438": 144,
147
+ "p581": 145,
148
+ "p439": 146,
149
+ "p432": 147,
150
+ "p582": 148,
151
+ "p583": 149,
152
+ "p440": 150,
153
+ "p437": 151,
154
+ "p434": 152,
155
+ "p584": 153,
156
+ "p585": 154,
157
+ "p433": 155,
158
+ "p436": 156,
159
+ "p435": 157,
160
+ "p586": 158,
161
+ "p589": 159,
162
+ "p587": 160,
163
+ "p431": 161,
164
+ "p591": 162,
165
+ "p588": 163,
166
+ "p428": 164,
167
+ "p590": 165,
168
+ "p429": 166,
169
+ "p592": 167,
170
+ "p427": 168,
171
+ "p430": 169,
172
+ "p426": 170,
173
+ "p593": 171,
174
+ "p594": 172,
175
+ "p595": 173,
176
+ "p424": 174,
177
+ "p425": 175,
178
+ "p421": 176,
179
+ "p422": 177,
180
+ "p417": 178,
181
+ "p596": 179,
182
+ "p420": 180,
183
+ "p423": 181,
184
+ "p597": 182,
185
+ "p599": 183,
186
+ "p598": 184,
187
+ "p419": 185,
188
+ "p600": 186,
189
+ "p601": 187,
190
+ "p602": 188,
191
+ "p415": 189,
192
+ "p604": 190,
193
+ "p418": 191,
194
+ "p416": 192,
195
+ "p414": 193,
196
+ "p603": 194,
197
+ "p605": 195,
198
+ "p412": 196,
199
+ "p413": 197,
200
+ "p606": 198,
201
+ "p607": 199,
202
+ "p407": 200,
203
+ "p406": 201,
204
+ "p409": 202,
205
+ "p610": 203,
206
+ "p609": 204,
207
+ "p405": 205,
208
+ "p404": 206,
209
+ "p408": 207,
210
+ "p410": 208,
211
+ "p608": 209,
212
+ "p611": 210,
213
+ "p411": 211,
214
+ "p400": 212,
215
+ "p403": 213,
216
+ "p397": 214,
217
+ "p402": 215,
218
+ "p395": 216,
219
+ "p401": 217,
220
+ "p398": 218,
221
+ "p396": 219,
222
+ "p399": 220,
223
+ "p394": 221,
224
+ "p612": 222,
225
+ "p614": 223,
226
+ "p613": 224,
227
+ "p615": 225,
228
+ "p393": 226,
229
+ "p392": 227,
230
+ "p617": 228,
231
+ "p618": 229,
232
+ "p616": 230,
233
+ "p389": 231,
234
+ "p391": 232,
235
+ "p619": 233,
236
+ "p621": 234,
237
+ "p620": 235,
238
+ "p388": 236,
239
+ "p632": 237,
240
+ "p622": 238,
241
+ "p385": 239,
242
+ "p384": 240,
243
+ "p390": 241,
244
+ "p623": 242,
245
+ "p386": 243,
246
+ "p380": 244,
247
+ "p624": 245,
248
+ "p627": 246,
249
+ "p387": 247,
250
+ "p382": 248,
251
+ "p626": 249,
252
+ "p625": 250,
253
+ "p374": 251,
254
+ "p383": 252,
255
+ "p628": 253,
256
+ "p381": 254,
257
+ "p379": 255,
258
+ "p633": 256,
259
+ "p378": 257,
260
+ "p377": 258,
261
+ "p631": 259,
262
+ "p629": 260,
263
+ "p630": 261,
264
+ "p634": 262,
265
+ "p636": 263,
266
+ "p638": 264,
267
  "p641": 265,
268
+ "p642": 266,
269
+ "p376": 267,
270
+ "p367": 268,
271
+ "p637": 269,
272
+ "p331": 270,
273
+ "p368": 271,
274
+ "p369": 272,
275
+ "p366": 273,
276
+ "p675": 274,
277
+ "p635": 275,
278
+ "p640": 276,
279
+ "p372": 277,
280
+ "p370": 278,
281
+ "p653": 279,
282
+ "p375": 280,
283
+ "p365": 281,
284
+ "p643": 282,
285
+ "p639": 283,
286
+ "p363": 284,
287
+ "p371": 285,
288
+ "p373": 286,
289
+ "p362": 287,
290
+ "p352": 288,
291
+ "p645": 289,
292
+ "p364": 290,
293
+ "p360": 291,
294
+ "p646": 292,
295
+ "p644": 293,
296
+ "p361": 294,
297
+ "p359": 295,
298
+ "p647": 296,
299
+ "p650": 297,
300
+ "p355": 298,
301
+ "p672": 299,
302
+ "p649": 300,
303
+ "p654": 301,
304
+ "p674": 302,
305
+ "p356": 303,
306
+ "p358": 304,
307
+ "p288": 305,
308
+ "p664": 306,
309
+ "p661": 307,
310
+ "p655": 308,
311
+ "p652": 309,
312
+ "p648": 310,
313
+ "p309": 311,
314
+ "p658": 312,
315
+ "p665": 313,
316
+ "p668": 314,
317
+ "p344": 315,
318
+ "p696": 316,
319
+ "p659": 317,
320
+ "p350": 318,
321
+ "p330": 319,
322
+ "p662": 320,
323
+ "p341": 321,
324
+ "p676": 322,
325
+ "p334": 323,
326
+ "p657": 324,
327
+ "p671": 325,
328
+ "p718": 326,
329
+ "p347": 327,
330
+ "p335": 328,
331
+ "p332": 329,
332
+ "p351": 330,
333
+ "p345": 331,
334
+ "p357": 332,
335
+ "p328": 333,
336
+ "p348": 334,
337
+ "p353": 335,
338
+ "p656": 336,
339
+ "p673": 337,
340
+ "p660": 338,
341
+ "p354": 339,
342
+ "p651": 340,
343
+ "p677": 341,
344
+ "p327": 342,
345
+ "p337": 343,
346
+ "p333": 344,
347
+ "p663": 345,
348
+ "p338": 346,
349
+ "p670": 347,
350
+ "p346": 348,
351
+ "p669": 349,
352
+ "p349": 350,
353
+ "p678": 351,
354
+ "p340": 352,
355
+ "p336": 353,
356
+ "p343": 354,
357
+ "p339": 355,
358
+ "p324": 356,
359
+ "p667": 357,
360
+ "p666": 358,
361
+ "p342": 359,
362
+ "p329": 360,
363
+ "p682": 361,
364
+ "p679": 362,
365
+ "p710": 363,
366
+ "p326": 364,
367
+ "p681": 365,
368
+ "p680": 366,
369
+ "p711": 367,
370
+ "p295": 368,
371
+ "p325": 369,
372
+ "p323": 370,
373
+ "p761": 371,
374
+ "p296": 372,
375
+ "p245": 373,
376
+ "p294": 374,
377
  "p703": 375,
378
+ "p709": 376,
379
+ "p712": 377,
380
+ "p303": 378,
381
+ "p302": 379,
382
+ "p297": 380,
383
+ "p702": 381,
384
+ "p706": 382,
385
+ "p707": 383,
386
+ "p304": 384,
387
+ "p298": 385,
388
+ "p708": 386,
389
+ "p300": 387,
390
+ "p704": 388,
391
+ "p705": 389,
392
+ "p291": 390,
393
+ "p305": 391,
394
+ "p700": 392,
395
+ "p692": 393,
396
+ "p714": 394,
397
+ "p299": 395,
398
+ "p301": 396,
399
+ "p683": 397,
400
+ "p701": 398,
401
+ "p685": 399,
402
+ "p697": 400,
403
+ "p308": 401,
404
+ "p306": 402,
405
+ "p320": 403,
406
+ "p693": 404,
407
+ "p311": 405,
408
+ "p699": 406,
409
  "p694": 407,
410
+ "p314": 408,
411
+ "p684": 409,
412
+ "p293": 410,
413
+ "p322": 411,
414
+ "p312": 412,
415
+ "p713": 413,
416
  "p690": 414,
417
+ "p310": 415,
418
+ "p688": 416,
419
+ "p292": 417,
420
+ "p321": 418,
421
+ "p313": 419,
422
+ "p687": 420,
423
+ "p686": 421,
424
+ "p695": 422,
425
+ "p319": 423,
426
+ "p698": 424,
427
+ "p691": 425,
428
+ "p307": 426,
429
+ "p717": 427,
430
+ "p689": 428,
431
+ "p290": 429,
432
+ "p315": 430,
433
+ "p318": 431,
434
+ "p316": 432,
435
+ "p715": 433,
436
+ "p289": 434,
437
+ "p317": 435,
438
  "p716": 436,
439
  "p280": 437,
440
+ "p725": 438,
441
+ "p287": 439,
442
  "p726": 440,
443
+ "p724": 441,
444
+ "p284": 442,
445
  "p719": 443,
446
+ "p720": 444,
447
+ "p285": 445,
448
+ "p279": 446,
449
+ "p721": 447,
450
+ "p282": 448,
451
+ "p278": 449,
452
+ "p729": 450,
453
+ "p276": 451,
454
+ "p723": 452,
455
  "p286": 453,
456
+ "p727": 454,
457
+ "p728": 455,
458
+ "p281": 456,
459
+ "p270": 457,
460
+ "p269": 458,
461
  "p271": 459,
462
+ "p722": 460,
463
  "p736": 461,
464
+ "p735": 462,
465
+ "p731": 463,
466
  "p283": 464,
467
+ "p730": 465,
468
+ "p732": 466,
469
+ "p272": 467,
470
+ "p737": 468,
471
+ "p275": 469,
472
+ "p734": 470,
473
+ "p733": 471,
474
+ "p739": 472,
475
  "p273": 473,
476
  "p274": 474,
477
+ "p268": 475,
478
+ "p263": 476,
479
+ "p277": 477,
480
+ "p267": 478,
481
+ "p742": 479,
482
+ "p738": 480,
483
+ "p266": 481,
484
+ "p746": 482,
485
+ "p261": 483,
486
+ "p740": 484,
487
+ "p743": 485,
488
  "p745": 486,
489
  "p744": 487,
490
+ "p265": 488,
491
+ "p259": 489,
492
+ "p262": 490,
493
+ "p741": 491,
494
+ "p260": 492,
495
+ "p748": 493,
496
+ "p258": 494,
497
+ "p747": 495,
498
+ "p264": 496,
499
+ "p749": 497,
500
  "p257": 498,
501
  "p755": 499,
502
+ "p751": 500,
503
+ "p760": 501,
504
+ "p253": 502,
505
+ "p251": 503,
506
+ "p248": 504,
507
+ "p757": 505,
508
+ "p756": 506,
509
+ "p255": 507,
510
+ "p246": 508,
511
+ "p753": 509,
512
  "p256": 510,
513
  "p759": 511,
514
  "p247": 512,
515
  "p244": 513,
516
  "p252": 514,
517
  "p764": 515,
518
+ "p254": 516,
519
+ "p763": 517,
520
+ "p758": 518,
521
  "p752": 519,
522
+ "p250": 520,
523
+ "p249": 521,
524
+ "p766": 522,
525
+ "p750": 523,
526
+ "p242": 524,
527
+ "p226": 525,
528
+ "p754": 526,
529
+ "p243": 527,
530
+ "p781": 528,
531
+ "p765": 529,
532
  "p241": 530,
533
  "p240": 531,
534
  "p234": 532,
 
538
  "p774": 536,
539
  "p239": 537,
540
  "p227": 538,
541
+ "p767": 539,
542
+ "p762": 540,
543
+ "p233": 541,
544
+ "p223": 542,
545
+ "p778": 543,
546
+ "p771": 544,
547
+ "p770": 545,
548
+ "p236": 546,
549
+ "p231": 547,
550
+ "p786": 548,
551
+ "p782": 549,
552
+ "p779": 550,
553
+ "p215": 551,
554
+ "p789": 552,
555
+ "p232": 553,
556
+ "p802": 554,
557
+ "p775": 555,
558
+ "p769": 556,
559
+ "p768": 557,
560
+ "p235": 558,
561
+ "p200": 559,
562
+ "p784": 560,
563
+ "p772": 561,
564
+ "p220": 562,
565
+ "p217": 563,
566
+ "p208": 564,
567
+ "p808": 565,
568
+ "p799": 566,
569
+ "p798": 567,
570
+ "p792": 568,
571
+ "p791": 569,
572
+ "p218": 570,
573
+ "p216": 571,
574
+ "p207": 572,
575
+ "p203": 573,
576
+ "p790": 574,
577
+ "p229": 575,
578
+ "p195": 576,
579
+ "p801": 577,
580
+ "p800": 578,
581
+ "p794": 579,
582
+ "p785": 580,
583
+ "p780": 581,
584
+ "p776": 582,
585
+ "p237": 583,
586
+ "p230": 584,
587
+ "p214": 585,
588
+ "p204": 586,
589
+ "p201": 587,
590
+ "p809": 588,
591
+ "p787": 589,
592
+ "p773": 590,
593
+ "p221": 591,
594
+ "p219": 592,
595
+ "p213": 593,
596
+ "p210": 594,
597
+ "p197": 595,
598
+ "p193": 596,
599
+ "p188": 597,
600
+ "p183": 598,
601
+ "p811": 599,
602
+ "p788": 600,
603
  "p783": 601,
604
  "p777": 602,
605
  "p222": 603,
 
623
  "p198": 621,
624
  "p171": 622,
625
  "p834": 623,
626
+ "p828": 624,
627
+ "p823": 625,
628
+ "p816": 626,
629
+ "p796": 627,
630
+ "p178": 628,
631
+ "p172": 629,
632
+ "p846": 630,
633
+ "p833": 631,
634
+ "p827": 632,
635
+ "p820": 633,
636
+ "p819": 634,
637
+ "p813": 635,
638
+ "p807": 636,
639
+ "p803": 637,
640
+ "p797": 638,
641
+ "p192": 639,
642
+ "p191": 640,
643
+ "p190": 641,
644
+ "p189": 642,
645
+ "p184": 643,
646
+ "p177": 644,
647
+ "p151": 645,
648
+ "p848": 646,
649
+ "p835": 647,
650
+ "p822": 648,
651
+ "p818": 649,
652
+ "p187": 650,
653
+ "p170": 651,
654
+ "p160": 652,
655
+ "p858": 653,
656
+ "p855": 654,
657
+ "p843": 655,
658
+ "p841": 656,
659
+ "p836": 657,
660
+ "p825": 658,
661
+ "p824": 659,
662
+ "p821": 660,
663
+ "p817": 661,
664
+ "p815": 662,
665
+ "p182": 663,
666
+ "p181": 664,
667
+ "p180": 665,
668
+ "p179": 666,
669
+ "p176": 667,
670
+ "p173": 668,
671
+ "p168": 669,
672
+ "p163": 670,
673
+ "p161": 671,
674
+ "p159": 672,
675
+ "p158": 673,
676
+ "p156": 674,
677
+ "p148": 675,
678
+ "p891": 676,
679
+ "p866": 677,
680
+ "p860": 678,
681
+ "p844": 679,
682
+ "p839": 680,
683
+ "p838": 681,
684
+ "p837": 682,
685
+ "p832": 683,
686
+ "p831": 684,
687
+ "p830": 685,
688
+ "p829": 686,
689
  "p814": 687,
690
  "p185": 688,
691
  "p174": 689,