{ "version": "1.0", "truncation": null, "padding": null, "added_tokens": [ { "id": 0, "content": "", "single_word": false, "lstrip": false, "rstrip": false, "normalized": false, "special": true }, { "id": 1, "content": "", "single_word": false, "lstrip": false, "rstrip": false, "normalized": false, "special": true }, { "id": 2, "content": "", "single_word": false, "lstrip": false, "rstrip": false, "normalized": false, "special": true }, { "id": 3, "content": "", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true, "special": true }, { "id": 4, "content": "[UNK]", "single_word": false, "lstrip": false, "rstrip": false, "normalized": false, "special": true }, { "id": 5, "content": "", "single_word": false, "lstrip": true, "rstrip": false, "normalized": false, "special": true } ], "normalizer": { "type": "BertNormalizer", "clean_text": true, "handle_chinese_chars": true, "strip_accents": null, "lowercase": true }, "pre_tokenizer": { "type": "BertPreTokenizer" }, "post_processor": { "type": "RobertaProcessing", "sep": [ "", 2 ], "cls": [ "", 0 ], "trim_offsets": true, "add_prefix_space": false }, "decoder": { "type": "WordPiece", "prefix": "##", "cleanup": true }, "model": { "type": "WordPiece", "unk_token": "[UNK]", "continuing_subword_prefix": "##", "max_input_chars_per_word": 100, "vocab": { "": 0, "": 1, "": 2, "": 3, "[UNK]": 4, "": 5, "!": 6, "\"": 7, "#": 8, "$": 9, "%": 10, "&": 11, "'": 12, "(": 13, ")": 14, "*": 15, "+": 16, ",": 17, "-": 18, ".": 19, "/": 20, "0": 21, "1": 22, "2": 23, "3": 24, "4": 25, "5": 26, "6": 27, "7": 28, "8": 29, "9": 30, ":": 31, ";": 32, "<": 33, "=": 34, ">": 35, "?": 36, "@": 37, "[": 38, "\\": 39, "]": 40, "^": 41, "_": 42, "`": 43, "a": 44, "b": 45, "c": 46, "d": 47, "e": 48, "f": 49, "g": 50, "h": 51, "i": 52, "j": 53, "k": 54, "l": 55, "m": 56, "n": 57, "o": 58, "p": 59, "q": 60, "r": 61, "s": 62, "t": 63, "u": 64, "v": 65, "w": 66, "x": 67, "y": 68, "z": 69, "|": 70, "}": 71, "~": 72, "¡": 73, "¢": 74, "£": 75, "¥": 76, "§": 77, "°": 78, "±": 79, "²": 80, "³": 81, "´": 82, "µ": 83, "·": 84, "º": 85, "½": 86, "¿": 87, "×": 88, "ß": 89, "æ": 90, "ð": 91, "ø": 92, "þ": 93, "đ": 94, "ħ": 95, "ı": 96, "ł": 97, "œ": 98, "ɐ": 99, "ɑ": 100, "ɒ": 101, "ɔ": 102, "ə": 103, "ɛ": 104, "ɜ": 105, "ɡ": 106, "ɢ": 107, "ɪ": 108, "ɫ": 109, "ɳ": 110, "ɽ": 111, "ɾ": 112, "ʁ": 113, "ʃ": 114, "ʊ": 115, "ʋ": 116, "ʒ": 117, "ʔ": 118, "ʕ": 119, "ʲ": 120, "ʻ": 121, "ʼ": 122, "ʾ": 123, "ʿ": 124, "ˈ": 125, "ˌ": 126, "ː": 127, "α": 128, "β": 129, "γ": 130, "δ": 131, "ε": 132, "η": 133, "θ": 134, "ι": 135, "κ": 136, "λ": 137, "μ": 138, "ν": 139, "ξ": 140, "ο": 141, "π": 142, "ρ": 143, "ς": 144, "σ": 145, "τ": 146, "υ": 147, "φ": 148, "χ": 149, "ψ": 150, "ω": 151, "а": 152, "б": 153, "в": 154, "г": 155, "д": 156, "е": 157, "ж": 158, "з": 159, "и": 160, "к": 161, "л": 162, "м": 163, "н": 164, "о": 165, "п": 166, "р": 167, "с": 168, "т": 169, "у": 170, "х": 171, "ц": 172, "ш": 173, "ъ": 174, "ы": 175, "ь": 176, "ю": 177, "я": 178, "є": 179, "א": 180, "ב": 181, "ג": 182, "ה": 183, "ו": 184, "ז": 185, "ח": 186, "י": 187, "ל": 188, "ם": 189, "מ": 190, "ן": 191, "נ": 192, "ס": 193, "ף": 194, "פ": 195, "צ": 196, "ר": 197, "ש": 198, "ת": 199, "ء": 200, "ا": 201, "ب": 202, "ة": 203, "ت": 204, "ث": 205, "ج": 206, "ح": 207, "خ": 208, "د": 209, "ذ": 210, "ر": 211, "س": 212, "ش": 213, "ص": 214, "ع": 215, "ف": 216, "ق": 217, "ك": 218, "ل": 219, "م": 220, "ن": 221, "ه": 222, "و": 223, "ي": 224, "ܐ": 225, "ܕ": 226, "ܗ": 227, "ܝ": 228, "ܠ": 229, "ܢ": 230, "ܬ": 231, "अ": 232, "ई": 233, "क": 234, "ग": 235, "ण": 236, "त": 237, "द": 238, "न": 239, "प": 240, "ब": 241, "म": 242, "य": 243, "र": 244, "ल": 245, "व": 246, "स": 247, "ह": 248, "ा": 249, "ि": 250, "আ": 251, "ল": 252, "হ": 253, "া": 254, "ਅ": 255, "ਲ": 256, "ਹ": 257, "ਾ": 258, "അ": 259, "ള": 260, "ഹ": 261, "ാ": 262, "ก": 263, "ค": 264, "ง": 265, "ช": 266, "ซ": 267, "ญ": 268, "ฐ": 269, "ณ": 270, "ด": 271, "ต": 272, "น": 273, "บ": 274, "ป": 275, "พ": 276, "ภ": 277, "ม": 278, "ย": 279, "ร": 280, "ล": 281, "ว": 282, "ศ": 283, "ษ": 284, "ส": 285, "ห": 286, "อ": 287, "ฮ": 288, "ะ": 289, "า": 290, "เ": 291, "แ": 292, "ไ": 293, "ა": 294, "ბ": 295, "გ": 296, "დ": 297, "ე": 298, "ვ": 299, "ზ": 300, "თ": 301, "ი": 302, "კ": 303, "ლ": 304, "მ": 305, "ნ": 306, "ო": 307, "პ": 308, "ჟ": 309, "რ": 310, "ს": 311, "ტ": 312, "უ": 313, "ფ": 314, "ქ": 315, "ღ": 316, "ყ": 317, "შ": 318, "ჩ": 319, "ც": 320, "ძ": 321, "წ": 322, "ჭ": 323, "ხ": 324, "ჯ": 325, "ჰ": 326, "ჱ": 327, "ჲ": 328, "ჳ": 329, "ჴ": 330, "ჵ": 331, "ჶ": 332, "ჷ": 333, "ჸ": 334, "ჹ": 335, "ჺ": 336, "჻": 337, "ᄃ": 338, "ᄅ": 339, "ᄇ": 340, "ᄋ": 341, "ᄌ": 342, "ᅡ": 343, "ᅢ": 344, "ᅦ": 345, "ᅧ": 346, "ᅩ": 347, "ᅮ": 348, "ᅵ": 349, "ᆨ": 350, "ᆫ": 351, "ᆯ": 352, "ᆸ": 353, "ᆼ": 354, "ᵻ": 355, "‐": 356, "‑": 357, "–": 358, "—": 359, "―": 360, "‘": 361, "’": 362, "“": 363, "”": 364, "„": 365, "†": 366, "‡": 367, "•": 368, "…": 369, "′": 370, "″": 371, "⁄": 372, "₣": 373, "₤": 374, "€": 375, "₹": 376, "⅓": 377, "⅔": 378, "→": 379, "−": 380, "≡": 381, "≤": 382, "①": 383, "☉": 384, "☫": 385, "♀": 386, "♭": 387, "♯": 388, "⚳": 389, "ⴀ": 390, "ⴂ": 391, "ⴃ": 392, "ⴈ": 393, "ⴌ": 394, "ⴕ": 395, "ⴟ": 396, "〈": 397, "〉": 398, "〜": 399, "あ": 400, "い": 401, "う": 402, "お": 403, "か": 404, "き": 405, "く": 406, "け": 407, "こ": 408, "さ": 409, "し": 410, "す": 411, "せ": 412, "た": 413, "ち": 414, "っ": 415, "つ": 416, "と": 417, "な": 418, "に": 419, "の": 420, "は": 421, "ひ": 422, "ふ": 423, "ほ": 424, "ま": 425, "み": 426, "め": 427, "も": 428, "ゃ": 429, "ゆ": 430, "ょ": 431, "ら": 432, "り": 433, "る": 434, "れ": 435, "わ": 436, "を": 437, "ん": 438, "ァ": 439, "ア": 440, "ィ": 441, "イ": 442, "ゥ": 443, "ウ": 444, "ェ": 445, "エ": 446, "ォ": 447, "オ": 448, "カ": 449, "キ": 450, "ク": 451, "ケ": 452, "コ": 453, "サ": 454, "シ": 455, "ス": 456, "セ": 457, "タ": 458, "チ": 459, "ッ": 460, "ツ": 461, "テ": 462, "ト": 463, "ナ": 464, "ニ": 465, "ネ": 466, "ノ": 467, "ハ": 468, "フ": 469, "ヘ": 470, "マ": 471, "ミ": 472, "ム": 473, "モ": 474, "ャ": 475, "ュ": 476, "ョ": 477, "ラ": 478, "リ": 479, "ル": 480, "レ": 481, "ロ": 482, "ン": 483, "・": 484, "ー": 485, "一": 486, "七": 487, "下": 488, "世": 489, "丙": 490, "中": 491, "主": 492, "乃": 493, "之": 494, "乙": 495, "九": 496, "二": 497, "云": 498, "人": 499, "今": 500, "付": 501, "作": 502, "侗": 503, "依": 504, "信": 505, "傳": 506, "儚": 507, "充": 508, "光": 509, "全": 510, "兵": 511, "其": 512, "具": 513, "円": 514, "再": 515, "出": 516, "判": 517, "前": 518, "剛": 519, "劇": 520, "劉": 521, "動": 522, "化": 523, "北": 524, "华": 525, "厂": 526, "去": 527, "古": 528, "可": 529, "台": 530, "史": 531, "同": 532, "名": 533, "君": 534, "吳": 535, "周": 536, "命": 537, "和": 538, "咲": 539, "善": 540, "四": 541, "國": 542, "園": 543, "圣": 544, "在": 545, "坂": 546, "堤": 547, "場": 548, "塘": 549, "夕": 550, "大": 551, "天": 552, "夫": 553, "女": 554, "妙": 555, "姚": 556, "子": 557, "孟": 558, "守": 559, "安": 560, "宋": 561, "完": 562, "宗": 563, "宝": 564, "宫": 565, "寝": 566, "寺": 567, "小": 568, "少": 569, "尾": 570, "山": 571, "岳": 572, "川": 573, "州": 574, "巳": 575, "市": 576, "師": 577, "平": 578, "广": 579, "庆": 580, "府": 581, "座": 582, "廬": 583, "建": 584, "式": 585, "張": 586, "彌": 587, "彩": 588, "彼": 589, "後": 590, "御": 591, "德": 592, "思": 593, "愛": 594, "憑": 595, "憶": 596, "應": 597, "懷": 598, "战": 599, "戦": 600, "扈": 601, "技": 602, "拉": 603, "拳": 604, "挑": 605, "揺": 606, "攻": 607, "放": 608, "政": 609, "散": 610, "斯": 611, "方": 612, "日": 613, "旦": 614, "旭": 615, "昌": 616, "明": 617, "星": 618, "春": 619, "晋": 620, "景": 621, "曦": 622, "月": 623, "望": 624, "未": 625, "本": 626, "李": 627, "村": 628, "杜": 629, "束": 630, "来": 631, "林": 632, "桜": 633, "梶": 634, "棘": 635, "椎": 636, "楊": 637, "楚": 638, "榮": 639, "橘": 640, "機": 641, "正": 642, "殻": 643, "殿": 644, "母": 645, "水": 646, "汉": 647, "沂": 648, "沙": 649, "河": 650, "泗": 651, "波": 652, "泣": 653, "洪": 654, "淹": 655, "清": 656, "湯": 657, "漢": 658, "澄": 659, "澤": 660, "火": 661, "灯": 662, "灵": 663, "灼": 664, "焼": 665, "熱": 666, "物": 667, "狐": 668, "狸": 669, "玄": 670, "王": 671, "玩": 672, "珂": 673, "珙": 674, "球": 675, "理": 676, "琦": 677, "琪": 678, "瓊": 679, "生": 680, "田": 681, "畢": 682, "番": 683, "瘡": 684, "白": 685, "皮": 686, "真": 687, "砲": 688, "礮": 689, "祈": 690, "神": 691, "祠": 692, "秋": 693, "空": 694, "立": 695, "精": 696, "約": 697, "絵": 698, "織": 699, "義": 700, "翠": 701, "者": 702, "耕": 703, "肖": 704, "胡": 705, "膀": 706, "臂": 707, "興": 708, "良": 709, "花": 710, "芳": 711, "芽": 712, "若": 713, "英": 714, "藕": 715, "藥": 716, "蘄": 717, "蘇": 718, "行": 719, "裁": 720, "規": 721, "覺": 722, "观": 723, "解": 724, "記": 725, "誓": 726, "誡": 727, "誰": 728, "謎": 729, "许": 730, "谭": 731, "豪": 732, "豫": 733, "費": 734, "贵": 735, "赤": 736, "趙": 737, "足": 738, "跡": 739, "転": 740, "辛": 741, "逆": 742, "遇": 743, "運": 744, "過": 745, "遠": 746, "選": 747, "邦": 748, "邱": 749, "部": 750, "郭": 751, "都": 752, "酈": 753, "里": 754, "野": 755, "金": 756, "銃": 757, "鋼": 758, "錄": 759, "錡": 760, "鍵": 761, "鐵": 762, "钱": 763, "铁": 764, "關": 765, "防": 766, "阿": 767, "陈": 768, "陳": 769, "陽": 770, "隊": 771, "階": 772, "集": 773, "雪": 774, "雲": 775, "霖": 776, "霹": 777, "靂": 778, "韓": 779, "願": 780, "顯": 781, "颜": 782, "马": 783, "高": 784, "龍": 785, "ﷲ": 786, "ﻋ": 787, "/": 788, "3": 789, "~": 790, "##s": 791, "##p": 792, "##e": 793, "##n": 794, "##a": 795, "##t": 796, "##h": 797, "##r": 798, "##i": 799, "##g": 800, "##4": 801, "##9": 802, "##v": 803, "##u": 804, "##l": 805, "##c": 806, "##y": 807, "##m": 808, "##o": 809, "##d": 810, "##q": 811, "##f": 812, "##b": 813, "##j": 814, "##k": 815, "##w": 816, "##z": 817, "##6": 818, "##0": 819, "##1": 820, "##x": 821, "##8": 822, "##7": 823, "##3": 824, "##2": 825, "##а": 826, "##л": 827, "##ы": 828, "##и": 829, "##ル": 830, "##ハ": 831, "##ト": 832, "##ス": 833, "##5": 834, "##р": 835, "##с": 836, "##н": 837, "##ɪ": 838, "##ʃ": 839, "##ɑ": 840, "##ː": 841, "##ი": 842, "##ウ": 843, "##ァ": 844, "##キ": 845, "##ュ": 846, "##リ": 847, "##ア": 848, "##う": 849, "##き": 850, "##ł": 851, "##ッ": 852, "##ク": 853, "##マ": 854, "##ン": 855, "##テ": 856, "##ィ": 857, "##ニ": 858, "##ー": 859, "##ل": 860, "##ا": 861, "##ب": 862, "##ن": 863, "##ล": 864, "##ย": 865, "##า": 866, "##ณ": 867, "##ม": 868, "##ต": 869, "##ร": 870, "##τ": 871, "##ι": 872, "##β": 873, "##เ": 874, "##ป": 875, "##რ": 876, "##გ": 877, "##ვ": 878, "##ლ": 879, "##ო": 880, "##ა": 881, "##ნ": 882, "##ラ": 883, "##ъ": 884, "##к": 885, "##в": 886, "##đ": 887, "##ø": 888, "##ɾ": 889, "##ʲ": 890, "##ə": 891, "##ˈ": 892, "##ב": 893, "##ת": 894, "##א": 895, "##י": 896, "##ك": 897, "##ر": 898, "##د": 899, "##っ": 900, "##е": 901, "##о": 902, "##у": 903, "##я": 904, "##ɔ": 905, "##ʔ": 906, "##ذ": 907, "##ي": 908, "##ة": 909, "##ს": 910, "##ტ": 911, "##ე": 912, "##サ": 913, "##た": 914, "##し": 915, "##の": 916, "##す": 917, "##な": 918, "##ひ": 919, "##と": 920, "##ן": 921, "##レ": 922, "##チ": 923, "##ナ": 924, "##უ": 925, "##ც": 926, "##ف": 927, "##س": 928, "##ɐ": 929, "##ᅦ": 930, "##ᄃ": 931, "##ᅩ": 932, "##ᆨ": 933, "##ᄅ": 934, "##ᅵ": 935, "##ᆸ": 936, "##ᄇ": 937, "##ᅧ": 938, "##ᆼ": 939, "##ᄋ": 940, "##ᆫ": 941, "##ᅢ": 942, "##ε": 943, "##ρ": 944, "##α": 945, "##ς": 946, "##ش": 947, "##م": 948, "##و": 949, "##フ": 950, "##ロ": 951, "##ð": 952, "##ხ": 953, "##3": 954, "##æ": 955, "##ল": 956, "##ɡ": 957, "##ع": 958, "##π": 959, "##κ": 960, "##ο": 961, "##ق": 962, "##ت": 963, "##ɒ": 964, "##χ": 965, "##λ": 966, "##ภ": 967, "##ด": 968, "##п": 969, "##г": 970, "##れ": 971, "##る": 972, "##פ": 973, "##ה": 974, "##ा": 975, "##न": 976, "##ਲ": 977, "##ਹ": 978, "##ɛ": 979, "##ʊ": 980, "##ᅮ": 981, "##は": 982, "##り": 983, "##く": 984, "##あ": 985, "##ν": 986, "##μ": 987, "##อ": 988, "##ก": 989, "##ว": 990, "##ܕ": 991, "##ܝ": 992, "##ܢ": 993, "##ܬ": 994, "##ォ": 995, "##ه": 996, "##з": 997, "##シ": 998, "##მ": 999, "##წ": 1000, "##ფ": 1001, "##つ": 1002, "##か": 1003, "##ค": 1004, "##ण": 1005, "##ई": 1006, "##ξ": 1007, "##も": 1008, "##み": 1009, "##д": 1010, "##ж": 1011, "##т": 1012, "##व": 1013, "##द": 1014, "##ह": 1015, "##ि": 1016, "##क": 1017, "##ω": 1018, "##お": 1019, "##ʻ": 1020, "##ซ": 1021, "##せ": 1022, "##ん": 1023, "##œ": 1024, "##こ": 1025, "##ら": 1026, "##া": 1027, "##হ": 1028, "##η": 1029, "##ß": 1030, "##ჱ": 1031, "##ı": 1032, "##ث": 1033, "##ᵻ": 1034, "##υ": 1035, "##θ": 1036, "##ɽ": 1037, "##ょ": 1038, "##に": 1039, "##γ": 1040, "##を": 1041, "##พ": 1042, "##わ": 1043, "##い": 1044, "##ш": 1045, "##თ": 1046, "##め": 1047, "##カ": 1048, "##ʿ": 1049, "##ר": 1050, "##ם": 1051, "##ჲ": 1052, "##ネ": 1053, "##ョ": 1054, "##ψ": 1055, "##ち": 1056, "##ゃ": 1057, "##σ": 1058, "##დ": 1059, "##र": 1060, "##タ": 1061, "##ム": 1062, "##ェ": 1063, "##ء": 1064, "##ל": 1065, "##ɫ": 1066, "##х": 1067, "##ᅡ": 1068, "##ᆯ": 1069, "##ゥ": 1070, "##イ": 1071, "##ฮ": 1072, "##ง": 1073, "##ไ": 1074, "##ช": 1075, "##แ": 1076, "##ग": 1077, "##خ": 1078, "##ま": 1079, "##ノ": 1080, "##ס": 1081, "##ャ": 1082, "##モ": 1083, "##ल": 1084, "##ו": 1085, "##ح": 1086, "##ц": 1087, "##ь": 1088, "##ף": 1089, "##ള": 1090, "##δ": 1091, "##ਾ": 1092, "##м": 1093, "##ษ": 1094, "##ฐ": 1095, "##ാ": 1096, "##ഹ": 1097, "##ツ": 1098, "##セ": 1099, "##オ": 1100, "##ʒ": 1101, "##ქ": 1102, "##ю": 1103, "##ʁ": 1104, "##ˌ": 1105, "##स": 1106, "##ص": 1107, "##º": 1108, "##エ": 1109, "##ミ": 1110, "##ש": 1111, "##מ": 1112, "##צ": 1113, "##ɜ": 1114, "##ܠ": 1115, "##ܗ": 1116, "##ܐ": 1117, "##ะ": 1118, "##น": 1119, "##є": 1120, "##ゆ": 1121, "##ɳ": 1122, "##נ": 1123, "##ჳ": 1124 } } }