{
"version": "1.0",
"truncation": null,
"padding": null,
"added_tokens": [
{
"id": 0,
"content": "<s>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 1,
"content": "<pad>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 2,
"content": "</s>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 3,
"content": "<unk>",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": true,
"special": true
},
{
"id": 4,
"content": "[UNK]",
"single_word": false,
"lstrip": false,
"rstrip": false,
"normalized": false,
"special": true
},
{
"id": 5,
"content": "<mask>",
"single_word": false,
"lstrip": true,
"rstrip": false,
"normalized": false,
"special": true
}
],
"normalizer": {
"type": "BertNormalizer",
"clean_text": true,
"handle_chinese_chars": true,
"strip_accents": null,
"lowercase": true
},
"pre_tokenizer": {
"type": "BertPreTokenizer"
},
"post_processor": {
"type": "RobertaProcessing",
"sep": [
"</s>",
2
],
"cls": [
"<s>",
0
],
"trim_offsets": true,
"add_prefix_space": false
},
"decoder": {
"type": "WordPiece",
"prefix": "##",
"cleanup": true
},
"model": {
"type": "WordPiece",
"unk_token": "[UNK]",
"continuing_subword_prefix": "##",
"max_input_chars_per_word": 100,
"vocab": {
"<s>": 0,
"<pad>": 1,
"</s>": 2,
"<unk>": 3,
"[UNK]": 4,
"<mask>": 5,
"!": 6,
"\"": 7,
"#": 8,
"$": 9,
"%": 10,
"&": 11,
"'": 12,
"(": 13,
")": 14,
"*": 15,
"+": 16,
",": 17,
"-": 18,
".": 19,
"/": 20,
"0": 21,
"1": 22,
"2": 23,
"3": 24,
"4": 25,
"5": 26,
"6": 27,
"7": 28,
"8": 29,
"9": 30,
":": 31,
";": 32,
"<": 33,
"=": 34,
">": 35,
"?": 36,
"@": 37,
"[": 38,
"\\": 39,
"]": 40,
"^": 41,
"_": 42,
"`": 43,
"a": 44,
"b": 45,
"c": 46,
"d": 47,
"e": 48,
"f": 49,
"g": 50,
"h": 51,
"i": 52,
"j": 53,
"k": 54,
"l": 55,
"m": 56,
"n": 57,
"o": 58,
"p": 59,
"q": 60,
"r": 61,
"s": 62,
"t": 63,
"u": 64,
"v": 65,
"w": 66,
"x": 67,
"y": 68,
"z": 69,
"|": 70,
"}": 71,
"~": 72,
"¡": 73,
"¢": 74,
"£": 75,
"¥": 76,
"§": 77,
"°": 78,
"±": 79,
"²": 80,
"³": 81,
"´": 82,
"µ": 83,
"·": 84,
"º": 85,
"½": 86,
"¿": 87,
"×": 88,
"ß": 89,
"æ": 90,
"ð": 91,
"ø": 92,
"þ": 93,
"đ": 94,
"ħ": 95,
"ı": 96,
"ł": 97,
"œ": 98,
"ɐ": 99,
"ɑ": 100,
"ɒ": 101,
"ɔ": 102,
"ə": 103,
"ɛ": 104,
"ɜ": 105,
"ɡ": 106,
"ɢ": 107,
"ɪ": 108,
"ɫ": 109,
"ɳ": 110,
"ɽ": 111,
"ɾ": 112,
"ʁ": 113,
"ʃ": 114,
"ʊ": 115,
"ʋ": 116,
"ʒ": 117,
"ʔ": 118,
"ʕ": 119,
"ʲ": 120,
"ʻ": 121,
"ʼ": 122,
"ʾ": 123,
"ʿ": 124,
"ˈ": 125,
"ˌ": 126,
"ː": 127,
"α": 128,
"β": 129,
"γ": 130,
"δ": 131,
"ε": 132,
"η": 133,
"θ": 134,
"ι": 135,
"κ": 136,
"λ": 137,
"μ": 138,
"ν": 139,
"ξ": 140,
"ο": 141,
"π": 142,
"ρ": 143,
"ς": 144,
"σ": 145,
"τ": 146,
"υ": 147,
"φ": 148,
"χ": 149,
"ψ": 150,
"ω": 151,
"а": 152,
"б": 153,
"в": 154,
"г": 155,
"д": 156,
"е": 157,
"ж": 158,
"з": 159,
"и": 160,
"к": 161,
"л": 162,
"м": 163,
"н": 164,
"о": 165,
"п": 166,
"р": 167,
"с": 168,
"т": 169,
"у": 170,
"х": 171,
"ц": 172,
"ш": 173,
"ъ": 174,
"ы": 175,
"ь": 176,
"ю": 177,
"я": 178,
"є": 179,
"א": 180,
"ב": 181,
"ג": 182,
"ה": 183,
"ו": 184,
"ז": 185,
"ח": 186,
"י": 187,
"ל": 188,
"ם": 189,
"מ": 190,
"ן": 191,
"נ": 192,
"ס": 193,
"ף": 194,
"פ": 195,
"צ": 196,
"ר": 197,
"ש": 198,
"ת": 199,
"ء": 200,
"ا": 201,
"ب": 202,
"ة": 203,
"ت": 204,
"ث": 205,
"ج": 206,
"ح": 207,
"خ": 208,
"د": 209,
"ذ": 210,
"ر": 211,
"س": 212,
"ش": 213,
"ص": 214,
"ع": 215,
"ف": 216,
"ق": 217,
"ك": 218,
"ل": 219,
"م": 220,
"ن": 221,
"ه": 222,
"و": 223,
"ي": 224,
"ܐ": 225,
"ܕ": 226,
"ܗ": 227,
"ܝ": 228,
"ܠ": 229,
"ܢ": 230,
"ܬ": 231,
"अ": 232,
"ई": 233,
"क": 234,
"ग": 235,
"ण": 236,
"त": 237,
"द": 238,
"न": 239,
"प": 240,
"ब": 241,
"म": 242,
"य": 243,
"र": 244,
"ल": 245,
"व": 246,
"स": 247,
"ह": 248,
"ा": 249,
"ि": 250,
"আ": 251,
"ল": 252,
"হ": 253,
"া": 254,
"ਅ": 255,
"ਲ": 256,
"ਹ": 257,
"ਾ": 258,
"അ": 259,
"ള": 260,
"ഹ": 261,
"ാ": 262,
"ก": 263,
"ค": 264,
"ง": 265,
"ช": 266,
"ซ": 267,
"ญ": 268,
"ฐ": 269,
"ณ": 270,
"ด": 271,
"ต": 272,
"น": 273,
"บ": 274,
"ป": 275,
"พ": 276,
"ภ": 277,
"ม": 278,
"ย": 279,
"ร": 280,
"ล": 281,
"ว": 282,
"ศ": 283,
"ษ": 284,
"ส": 285,
"ห": 286,
"อ": 287,
"ฮ": 288,
"ะ": 289,
"า": 290,
"เ": 291,
"แ": 292,
"ไ": 293,
"ა": 294,
"ბ": 295,
"გ": 296,
"დ": 297,
"ე": 298,
"ვ": 299,
"ზ": 300,
"თ": 301,
"ი": 302,
"კ": 303,
"ლ": 304,
"მ": 305,
"ნ": 306,
"ო": 307,
"პ": 308,
"ჟ": 309,
"რ": 310,
"ს": 311,
"ტ": 312,
"უ": 313,
"ფ": 314,
"ქ": 315,
"ღ": 316,
"ყ": 317,
"შ": 318,
"ჩ": 319,
"ც": 320,
"ძ": 321,
"წ": 322,
"ჭ": 323,
"ხ": 324,
"ჯ": 325,
"ჰ": 326,
"ჱ": 327,
"ჲ": 328,
"ჳ": 329,
"ჴ": 330,
"ჵ": 331,
"ჶ": 332,
"ჷ": 333,
"ჸ": 334,
"ჹ": 335,
"ჺ": 336,
"჻": 337,
"ᄃ": 338,
"ᄅ": 339,
"ᄇ": 340,
"ᄋ": 341,
"ᄌ": 342,
"ᅡ": 343,
"ᅢ": 344,
"ᅦ": 345,
"ᅧ": 346,
"ᅩ": 347,
"ᅮ": 348,
"ᅵ": 349,
"ᆨ": 350,
"ᆫ": 351,
"ᆯ": 352,
"ᆸ": 353,
"ᆼ": 354,
"ᵻ": 355,
"‐": 356,
"‑": 357,
"–": 358,
"—": 359,
"―": 360,
"‘": 361,
"’": 362,
"“": 363,
"”": 364,
"„": 365,
"†": 366,
"‡": 367,
"•": 368,
"…": 369,
"′": 370,
"″": 371,
"⁄": 372,
"₣": 373,
"₤": 374,
"€": 375,
"₹": 376,
"⅓": 377,
"⅔": 378,
"→": 379,
"−": 380,
"≡": 381,
"≤": 382,
"①": 383,
"☉": 384,
"☫": 385,
"♀": 386,
"♭": 387,
"♯": 388,
"⚳": 389,
"ⴀ": 390,
"ⴂ": 391,
"ⴃ": 392,
"ⴈ": 393,
"ⴌ": 394,
"ⴕ": 395,
"ⴟ": 396,
"〈": 397,
"〉": 398,
"〜": 399,
"あ": 400,
"い": 401,
"う": 402,
"お": 403,
"か": 404,
"き": 405,
"く": 406,
"け": 407,
"こ": 408,
"さ": 409,
"し": 410,
"す": 411,
"せ": 412,
"た": 413,
"ち": 414,
"っ": 415,
"つ": 416,
"と": 417,
"な": 418,
"に": 419,
"の": 420,
"は": 421,
"ひ": 422,
"ふ": 423,
"ほ": 424,
"ま": 425,
"み": 426,
"め": 427,
"も": 428,
"ゃ": 429,
"ゆ": 430,
"ょ": 431,
"ら": 432,
"り": 433,
"る": 434,
"れ": 435,
"わ": 436,
"を": 437,
"ん": 438,
"ァ": 439,
"ア": 440,
"ィ": 441,
"イ": 442,
"ゥ": 443,
"ウ": 444,
"ェ": 445,
"エ": 446,
"ォ": 447,
"オ": 448,
"カ": 449,
"キ": 450,
"ク": 451,
"ケ": 452,
"コ": 453,
"サ": 454,
"シ": 455,
"ス": 456,
"セ": 457,
"タ": 458,
"チ": 459,
"ッ": 460,
"ツ": 461,
"テ": 462,
"ト": 463,
"ナ": 464,
"ニ": 465,
"ネ": 466,
"ノ": 467,
"ハ": 468,
"フ": 469,
"ヘ": 470,
"マ": 471,
"ミ": 472,
"ム": 473,
"モ": 474,
"ャ": 475,
"ュ": 476,
"ョ": 477,
"ラ": 478,
"リ": 479,
"ル": 480,
"レ": 481,
"ロ": 482,
"ン": 483,
"・": 484,
"ー": 485,
"一": 486,
"七": 487,
"下": 488,
"世": 489,
"丙": 490,
"中": 491,
"主": 492,
"乃": 493,
"之": 494,
"乙": 495,
"九": 496,
"二": 497,
"云": 498,
"人": 499,
"今": 500,
"付": 501,
"作": 502,
"侗": 503,
"依": 504,
"信": 505,
"傳": 506,
"儚": 507,
"充": 508,
"光": 509,
"全": 510,
"兵": 511,
"其": 512,
"具": 513,
"円": 514,
"再": 515,
"出": 516,
"判": 517,
"前": 518,
"剛": 519,
"劇": 520,
"劉": 521,
"動": 522,
"化": 523,
"北": 524,
"华": 525,
"厂": 526,
"去": 527,
"古": 528,
"可": 529,
"台": 530,
"史": 531,
"同": 532,
"名": 533,
"君": 534,
"吳": 535,
"周": 536,
"命": 537,
"和": 538,
"咲": 539,
"善": 540,
"四": 541,
"國": 542,
"園": 543,
"圣": 544,
"在": 545,
"坂": 546,
"堤": 547,
"場": 548,
"塘": 549,
"夕": 550,
"大": 551,
"天": 552,
"夫": 553,
"女": 554,
"妙": 555,
"姚": 556,
"子": 557,
"孟": 558,
"守": 559,
"安": 560,
"宋": 561,
"完": 562,
"宗": 563,
"宝": 564,
"宫": 565,
"寝": 566,
"寺": 567,
"小": 568,
"少": 569,
"尾": 570,
"山": 571,
"岳": 572,
"川": 573,
"州": 574,
"巳": 575,
"市": 576,
"師": 577,
"平": 578,
"广": 579,
"庆": 580,
"府": 581,
"座": 582,
"廬": 583,
"建": 584,
"式": 585,
"張": 586,
"彌": 587,
"彩": 588,
"彼": 589,
"後": 590,
"御": 591,
"德": 592,
"思": 593,
"愛": 594,
"憑": 595,
"憶": 596,
"應": 597,
"懷": 598,
"战": 599,
"戦": 600,
"扈": 601,
"技": 602,
"拉": 603,
"拳": 604,
"挑": 605,
"揺": 606,
"攻": 607,
"放": 608,
"政": 609,
"散": 610,
"斯": 611,
"方": 612,
"日": 613,
"旦": 614,
"旭": 615,
"昌": 616,
"明": 617,
"星": 618,
"春": 619,
"晋": 620,
"景": 621,
"曦": 622,
"月": 623,
"望": 624,
"未": 625,
"本": 626,
"李": 627,
"村": 628,
"杜": 629,
"束": 630,
"来": 631,
"林": 632,
"桜": 633,
"梶": 634,
"棘": 635,
"椎": 636,
"楊": 637,
"楚": 638,
"榮": 639,
"橘": 640,
"機": 641,
"正": 642,
"殻": 643,
"殿": 644,
"母": 645,
"水": 646,
"汉": 647,
"沂": 648,
"沙": 649,
"河": 650,
"泗": 651,
"波": 652,
"泣": 653,
"洪": 654,
"淹": 655,
"清": 656,
"湯": 657,
"漢": 658,
"澄": 659,
"澤": 660,
"火": 661,
"灯": 662,
"灵": 663,
"灼": 664,
"焼": 665,
"熱": 666,
"物": 667,
"狐": 668,
"狸": 669,
"玄": 670,
"王": 671,
"玩": 672,
"珂": 673,
"珙": 674,
"球": 675,
"理": 676,
"琦": 677,
"琪": 678,
"瓊": 679,
"生": 680,
"田": 681,
"畢": 682,
"番": 683,
"瘡": 684,
"白": 685,
"皮": 686,
"真": 687,
"砲": 688,
"礮": 689,
"祈": 690,
"神": 691,
"祠": 692,
"秋": 693,
"空": 694,
"立": 695,
"精": 696,
"約": 697,
"絵": 698,
"織": 699,
"義": 700,
"翠": 701,
"者": 702,
"耕": 703,
"肖": 704,
"胡": 705,
"膀": 706,
"臂": 707,
"興": 708,
"良": 709,
"花": 710,
"芳": 711,
"芽": 712,
"若": 713,
"英": 714,
"藕": 715,
"藥": 716,
"蘄": 717,
"蘇": 718,
"行": 719,
"裁": 720,
"規": 721,
"覺": 722,
"观": 723,
"解": 724,
"記": 725,
"誓": 726,
"誡": 727,
"誰": 728,
"謎": 729,
"许": 730,
"谭": 731,
"豪": 732,
"豫": 733,
"費": 734,
"贵": 735,
"赤": 736,
"趙": 737,
"足": 738,
"跡": 739,
"転": 740,
"辛": 741,
"逆": 742,
"遇": 743,
"運": 744,
"過": 745,
"遠": 746,
"選": 747,
"邦": 748,
"邱": 749,
"部": 750,
"郭": 751,
"都": 752,
"酈": 753,
"里": 754,
"野": 755,
"金": 756,
"銃": 757,
"鋼": 758,
"錄": 759,
"錡": 760,
"鍵": 761,
"鐵": 762,
"钱": 763,
"铁": 764,
"關": 765,
"防": 766,
"阿": 767,
"陈": 768,
"陳": 769,
"陽": 770,
"隊": 771,
"階": 772,
"集": 773,
"雪": 774,
"雲": 775,
"霖": 776,
"霹": 777,
"靂": 778,
"韓": 779,
"願": 780,
"顯": 781,
"颜": 782,
"马": 783,
"高": 784,
"龍": 785,
"ﷲ": 786,
"ﻋ": 787,
"／": 788,
"３": 789,
"～": 790,
"##s": 791,
"##p": 792,
"##e": 793,
"##n": 794,
"##a": 795,
"##t": 796,
"##h": 797,
"##r": 798,
"##i": 799,
"##g": 800,
"##4": 801,
"##9": 802,
"##v": 803,
"##u": 804,
"##l": 805,
"##c": 806,
"##y": 807,
"##m": 808,
"##o": 809,
"##d": 810,
"##q": 811,
"##f": 812,
"##b": 813,
"##j": 814,
"##k": 815,
"##w": 816,
"##z": 817,
"##6": 818,
"##0": 819,
"##1": 820,
"##x": 821,
"##8": 822,
"##7": 823,
"##3": 824,
"##2": 825,
"##а": 826,
"##л": 827,
"##ы": 828,
"##и": 829,
"##ル": 830,
"##ハ": 831,
"##ト": 832,
"##ス": 833,
"##5": 834,
"##р": 835,
"##с": 836,
"##н": 837,
"##ɪ": 838,
"##ʃ": 839,
"##ɑ": 840,
"##ː": 841,
"##ი": 842,
"##ウ": 843,
"##ァ": 844,
"##キ": 845,
"##ュ": 846,
"##リ": 847,
"##ア": 848,
"##う": 849,
"##き": 850,
"##ł": 851,
"##ッ": 852,
"##ク": 853,
"##マ": 854,
"##ン": 855,
"##テ": 856,
"##ィ": 857,
"##ニ": 858,
"##ー": 859,
"##ل": 860,
"##ا": 861,
"##ب": 862,
"##ن": 863,
"##ล": 864,
"##ย": 865,
"##า": 866,
"##ณ": 867,
"##ม": 868,
"##ต": 869,
"##ร": 870,
"##τ": 871,
"##ι": 872,
"##β": 873,
"##เ": 874,
"##ป": 875,
"##რ": 876,
"##გ": 877,
"##ვ": 878,
"##ლ": 879,
"##ო": 880,
"##ა": 881,
"##ნ": 882,
"##ラ": 883,
"##ъ": 884,
"##к": 885,
"##в": 886,
"##đ": 887,
"##ø": 888,
"##ɾ": 889,
"##ʲ": 890,
"##ə": 891,
"##ˈ": 892,
"##ב": 893,
"##ת": 894,
"##א": 895,
"##י": 896,
"##ك": 897,
"##ر": 898,
"##د": 899,
"##っ": 900,
"##е": 901,
"##о": 902,
"##у": 903,
"##я": 904,
"##ɔ": 905,
"##ʔ": 906,
"##ذ": 907,
"##ي": 908,
"##ة": 909,
"##ს": 910,
"##ტ": 911,
"##ე": 912,
"##サ": 913,
"##た": 914,
"##し": 915,
"##の": 916,
"##す": 917,
"##な": 918,
"##ひ": 919,
"##と": 920,
"##ן": 921,
"##レ": 922,
"##チ": 923,
"##ナ": 924,
"##უ": 925,
"##ც": 926,
"##ف": 927,
"##س": 928,
"##ɐ": 929,
"##ᅦ": 930,
"##ᄃ": 931,
"##ᅩ": 932,
"##ᆨ": 933,
"##ᄅ": 934,
"##ᅵ": 935,
"##ᆸ": 936,
"##ᄇ": 937,
"##ᅧ": 938,
"##ᆼ": 939,
"##ᄋ": 940,
"##ᆫ": 941,
"##ᅢ": 942,
"##ε": 943,
"##ρ": 944,
"##α": 945,
"##ς": 946,
"##ش": 947,
"##م": 948,
"##و": 949,
"##フ": 950,
"##ロ": 951,
"##ð": 952,
"##ხ": 953,
"##３": 954,
"##æ": 955,
"##ল": 956,
"##ɡ": 957,
"##ع": 958,
"##π": 959,
"##κ": 960,
"##ο": 961,
"##ق": 962,
"##ت": 963,
"##ɒ": 964,
"##χ": 965,
"##λ": 966,
"##ภ": 967,
"##ด": 968,
"##п": 969,
"##г": 970,
"##れ": 971,
"##る": 972,
"##פ": 973,
"##ה": 974,
"##ा": 975,
"##न": 976,
"##ਲ": 977,
"##ਹ": 978,
"##ɛ": 979,
"##ʊ": 980,
"##ᅮ": 981,
"##は": 982,
"##り": 983,
"##く": 984,
"##あ": 985,
"##ν": 986,
"##μ": 987,
"##อ": 988,
"##ก": 989,
"##ว": 990,
"##ܕ": 991,
"##ܝ": 992,
"##ܢ": 993,
"##ܬ": 994,
"##ォ": 995,
"##ه": 996,
"##з": 997,
"##シ": 998,
"##მ": 999,
"##წ": 1000,
"##ფ": 1001,
"##つ": 1002,
"##か": 1003,
"##ค": 1004,
"##ण": 1005,
"##ई": 1006,
"##ξ": 1007,
"##も": 1008,
"##み": 1009,
"##д": 1010,
"##ж": 1011,
"##т": 1012,
"##व": 1013,
"##द": 1014,
"##ह": 1015,
"##ि": 1016,
"##क": 1017,
"##ω": 1018,
"##お": 1019,
"##ʻ": 1020,
"##ซ": 1021,
"##せ": 1022,
"##ん": 1023,
"##œ": 1024,
"##こ": 1025,
"##ら": 1026,
"##া": 1027,
"##হ": 1028,
"##η": 1029,
"##ß": 1030,
"##ჱ": 1031,
"##ı": 1032,
"##ث": 1033,
"##ᵻ": 1034,
"##υ": 1035,
"##θ": 1036,
"##ɽ": 1037,
"##ょ": 1038,
"##に": 1039,
"##γ": 1040,
"##を": 1041,
"##พ": 1042,
"##わ": 1043,
"##い": 1044,
"##ш": 1045,
"##თ": 1046,
"##め": 1047,
"##カ": 1048,
"##ʿ": 1049,
"##ר": 1050,
"##ם": 1051,
"##ჲ": 1052,
"##ネ": 1053,
"##ョ": 1054,
"##ψ": 1055,
"##ち": 1056,
"##ゃ": 1057,
"##σ": 1058,
"##დ": 1059,
"##र": 1060,
"##タ": 1061,
"##ム": 1062,
"##ェ": 1063,
"##ء": 1064,
"##ל": 1065,
"##ɫ": 1066,
"##х": 1067,
"##ᅡ": 1068,
"##ᆯ": 1069,
"##ゥ": 1070,
"##イ": 1071,
"##ฮ": 1072,
"##ง": 1073,
"##ไ": 1074,
"##ช": 1075,
"##แ": 1076,
"##ग": 1077,
"##خ": 1078,
"##ま": 1079,
"##ノ": 1080,
"##ס": 1081,
"##ャ": 1082,
"##モ": 1083,
"##ल": 1084,
"##ו": 1085,
"##ح": 1086,
"##ц": 1087,
"##ь": 1088,
"##ף": 1089,
"##ള": 1090,
"##δ": 1091,
"##ਾ": 1092,
"##м": 1093,
"##ษ": 1094,
"##ฐ": 1095,
"##ാ": 1096,
"##ഹ": 1097,
"##ツ": 1098,
"##セ": 1099,
"##オ": 1100,
"##ʒ": 1101,
"##ქ": 1102,
"##ю": 1103,
"##ʁ": 1104,
"##ˌ": 1105,
"##स": 1106,
"##ص": 1107,
"##º": 1108,
"##エ": 1109,
"##ミ": 1110,
"##ש": 1111,
"##מ": 1112,
"##צ": 1113,
"##ɜ": 1114,
"##ܠ": 1115,
"##ܗ": 1116,
"##ܐ": 1117,
"##ะ": 1118,
"##น": 1119,
"##є": 1120,
"##ゆ": 1121,
"##ɳ": 1122,
"##נ": 1123,
"##ჳ": 1124
}
}
}