{ "version": "1.0", "truncation": null, "padding": null, "added_tokens": [ { "id": 0, "content": "", "single_word": false, "lstrip": false, "rstrip": false, "normalized": false, "special": true }, { "id": 1, "content": "", "single_word": false, "lstrip": false, "rstrip": false, "normalized": false, "special": true }, { "id": 2, "content": "", "single_word": false, "lstrip": false, "rstrip": false, "normalized": false, "special": true }, { "id": 3, "content": "", "single_word": false, "lstrip": false, "rstrip": false, "normalized": false, "special": true }, { "id": 4, "content": "", "single_word": false, "lstrip": false, "rstrip": false, "normalized": false, "special": true }, { "id": 5, "content": "", "single_word": false, "lstrip": false, "rstrip": false, "normalized": false, "special": true }, { "id": 6, "content": "", "single_word": false, "lstrip": false, "rstrip": false, "normalized": false, "special": true } ], "normalizer": { "type": "BertNormalizer", "clean_text": true, "handle_chinese_chars": true, "strip_accents": null, "lowercase": true }, "pre_tokenizer": { "type": "BertPreTokenizer" }, "post_processor": { "type": "TemplateProcessing", "single": [ { "SpecialToken": { "id": "", "type_id": 2 } }, { "Sequence": { "id": "A", "type_id": 0 } }, { "SpecialToken": { "id": "", "type_id": 0 } } ], "pair": [ { "SpecialToken": { "id": "", "type_id": 2 } }, { "Sequence": { "id": "A", "type_id": 0 } }, { "SpecialToken": { "id": "", "type_id": 0 } }, { "Sequence": { "id": "B", "type_id": 1 } }, { "SpecialToken": { "id": "", "type_id": 1 } } ], "special_tokens": { "": { "id": "", "ids": [ 4 ], "tokens": [ "" ] }, "": { "id": "", "ids": [ 5 ], "tokens": [ "" ] } } }, "decoder": { "type": "WordPiece", "prefix": "##", "cleanup": true }, "model": { "type": "WordPiece", "unk_token": "", "continuing_subword_prefix": "##", "max_input_chars_per_word": 100, "vocab": { "": 0, "": 1, "": 2, "": 3, "": 4, "": 5, "": 6, "!": 7, "\"": 8, "#": 9, "$": 10, "%": 11, "&": 12, "'": 13, "(": 14, ")": 15, "*": 16, "+": 17, ",": 18, "-": 19, ".": 20, "/": 21, "0": 22, "1": 23, "2": 24, "3": 25, "4": 26, "5": 27, "6": 28, "7": 29, "8": 30, "9": 31, ":": 32, ";": 33, "<": 34, "=": 35, ">": 36, "?": 37, "@": 38, "[": 39, "\\": 40, "]": 41, "^": 42, "_": 43, "`": 44, "a": 45, "b": 46, "c": 47, "d": 48, "e": 49, "f": 50, "g": 51, "h": 52, "i": 53, "j": 54, "k": 55, "l": 56, "m": 57, "n": 58, "o": 59, "p": 60, "q": 61, "r": 62, "s": 63, "t": 64, "u": 65, "v": 66, "w": 67, "x": 68, "y": 69, "z": 70, "|": 71, "}": 72, "~": 73, "¡": 74, "¢": 75, "£": 76, "¥": 77, "§": 78, "°": 79, "±": 80, "²": 81, "³": 82, "´": 83, "µ": 84, "·": 85, "º": 86, "½": 87, "¿": 88, "×": 89, "ß": 90, "æ": 91, "ð": 92, "ø": 93, "þ": 94, "đ": 95, "ħ": 96, "ı": 97, "ł": 98, "œ": 99, "ɐ": 100, "ɑ": 101, "ɒ": 102, "ɔ": 103, "ə": 104, "ɛ": 105, "ɜ": 106, "ɡ": 107, "ɢ": 108, "ɪ": 109, "ɫ": 110, "ɳ": 111, "ɽ": 112, "ɾ": 113, "ʁ": 114, "ʃ": 115, "ʊ": 116, "ʋ": 117, "ʒ": 118, "ʔ": 119, "ʕ": 120, "ʲ": 121, "ʻ": 122, "ʼ": 123, "ʾ": 124, "ʿ": 125, "ˈ": 126, "ˌ": 127, "ː": 128, "α": 129, "β": 130, "γ": 131, "δ": 132, "ε": 133, "η": 134, "θ": 135, "ι": 136, "κ": 137, "λ": 138, "μ": 139, "ν": 140, "ξ": 141, "ο": 142, "π": 143, "ρ": 144, "ς": 145, "σ": 146, "τ": 147, "υ": 148, "φ": 149, "χ": 150, "ψ": 151, "ω": 152, "а": 153, "б": 154, "в": 155, "г": 156, "д": 157, "е": 158, "ж": 159, "з": 160, "и": 161, "к": 162, "л": 163, "м": 164, "н": 165, "о": 166, "п": 167, "р": 168, "с": 169, "т": 170, "у": 171, "х": 172, "ц": 173, "ш": 174, "ъ": 175, "ы": 176, "ь": 177, "ю": 178, "я": 179, "є": 180, "א": 181, "ב": 182, "ג": 183, "ה": 184, "ו": 185, "ז": 186, "ח": 187, "י": 188, "ל": 189, "ם": 190, "מ": 191, "ן": 192, "נ": 193, "ס": 194, "ף": 195, "פ": 196, "צ": 197, "ר": 198, "ש": 199, "ת": 200, "ء": 201, "ا": 202, "ب": 203, "ة": 204, "ت": 205, "ث": 206, "ج": 207, "ح": 208, "خ": 209, "د": 210, "ذ": 211, "ر": 212, "س": 213, "ش": 214, "ص": 215, "ع": 216, "ف": 217, "ق": 218, "ك": 219, "ل": 220, "م": 221, "ن": 222, "ه": 223, "و": 224, "ي": 225, "ܐ": 226, "ܕ": 227, "ܗ": 228, "ܝ": 229, "ܠ": 230, "ܢ": 231, "ܬ": 232, "अ": 233, "ई": 234, "क": 235, "ग": 236, "ण": 237, "त": 238, "द": 239, "न": 240, "प": 241, "ब": 242, "म": 243, "य": 244, "र": 245, "ल": 246, "व": 247, "स": 248, "ह": 249, "ा": 250, "ि": 251, "আ": 252, "ল": 253, "হ": 254, "া": 255, "ਅ": 256, "ਲ": 257, "ਹ": 258, "ਾ": 259, "അ": 260, "ള": 261, "ഹ": 262, "ാ": 263, "ก": 264, "ค": 265, "ง": 266, "ช": 267, "ซ": 268, "ญ": 269, "ฐ": 270, "ณ": 271, "ด": 272, "ต": 273, "น": 274, "บ": 275, "ป": 276, "พ": 277, "ภ": 278, "ม": 279, "ย": 280, "ร": 281, "ล": 282, "ว": 283, "ศ": 284, "ษ": 285, "ส": 286, "ห": 287, "อ": 288, "ฮ": 289, "ะ": 290, "า": 291, "เ": 292, "แ": 293, "ไ": 294, "ა": 295, "ბ": 296, "გ": 297, "დ": 298, "ე": 299, "ვ": 300, "ზ": 301, "თ": 302, "ი": 303, "კ": 304, "ლ": 305, "მ": 306, "ნ": 307, "ო": 308, "პ": 309, "ჟ": 310, "რ": 311, "ს": 312, "ტ": 313, "უ": 314, "ფ": 315, "ქ": 316, "ღ": 317, "ყ": 318, "შ": 319, "ჩ": 320, "ც": 321, "ძ": 322, "წ": 323, "ჭ": 324, "ხ": 325, "ჯ": 326, "ჰ": 327, "ჱ": 328, "ჲ": 329, "ჳ": 330, "ჴ": 331, "ჵ": 332, "ჶ": 333, "ჷ": 334, "ჸ": 335, "ჹ": 336, "ჺ": 337, "჻": 338, "ᄃ": 339, "ᄅ": 340, "ᄇ": 341, "ᄋ": 342, "ᄌ": 343, "ᅡ": 344, "ᅢ": 345, "ᅦ": 346, "ᅧ": 347, "ᅩ": 348, "ᅮ": 349, "ᅵ": 350, "ᆨ": 351, "ᆫ": 352, "ᆯ": 353, "ᆸ": 354, "ᆼ": 355, "ᵻ": 356, "‐": 357, "‑": 358, "–": 359, "—": 360, "―": 361, "‘": 362, "’": 363, "“": 364, "”": 365, "„": 366, "†": 367, "‡": 368, "•": 369, "…": 370, "′": 371, "″": 372, "⁄": 373, "₣": 374, "₤": 375, "€": 376, "₹": 377, "⅓": 378, "⅔": 379, "→": 380, "−": 381, "≡": 382, "≤": 383, "①": 384, "☉": 385, "☫": 386, "♀": 387, "♭": 388, "♯": 389, "⚳": 390, "ⴀ": 391, "ⴂ": 392, "ⴃ": 393, "ⴈ": 394, "ⴌ": 395, "ⴕ": 396, "ⴟ": 397, "〈": 398, "〉": 399, "〜": 400, "あ": 401, "い": 402, "う": 403, "お": 404, "か": 405, "き": 406, "く": 407, "け": 408, "こ": 409, "さ": 410, "し": 411, "す": 412, "せ": 413, "た": 414, "ち": 415, "っ": 416, "つ": 417, "と": 418, "な": 419, "に": 420, "の": 421, "は": 422, "ひ": 423, "ふ": 424, "ほ": 425, "ま": 426, "み": 427, "め": 428, "も": 429, "ゃ": 430, "ゆ": 431, "ょ": 432, "ら": 433, "り": 434, "る": 435, "れ": 436, "わ": 437, "を": 438, "ん": 439, "ァ": 440, "ア": 441, "ィ": 442, "イ": 443, "ゥ": 444, "ウ": 445, "ェ": 446, "エ": 447, "ォ": 448, "オ": 449, "カ": 450, "キ": 451, "ク": 452, "ケ": 453, "コ": 454, "サ": 455, "シ": 456, "ス": 457, "セ": 458, "タ": 459, "チ": 460, "ッ": 461, "ツ": 462, "テ": 463, "ト": 464, "ナ": 465, "ニ": 466, "ネ": 467, "ノ": 468, "ハ": 469, "フ": 470, "ヘ": 471, "マ": 472, "ミ": 473, "ム": 474, "モ": 475, "ャ": 476, "ュ": 477, "ョ": 478, "ラ": 479, "リ": 480, "ル": 481, "レ": 482, "ロ": 483, "ン": 484, "・": 485, "ー": 486, "一": 487, "七": 488, "下": 489, "世": 490, "丙": 491, "中": 492, "主": 493, "乃": 494, "之": 495, "乙": 496, "九": 497, "二": 498, "云": 499, "人": 500, "今": 501, "付": 502, "作": 503, "侗": 504, "依": 505, "信": 506, "傳": 507, "儚": 508, "充": 509, "光": 510, "全": 511, "兵": 512, "其": 513, "具": 514, "円": 515, "再": 516, "出": 517, "判": 518, "前": 519, "剛": 520, "劇": 521, "劉": 522, "動": 523, "化": 524, "北": 525, "华": 526, "厂": 527, "去": 528, "古": 529, "可": 530, "台": 531, "史": 532, "同": 533, "名": 534, "君": 535, "吳": 536, "周": 537, "命": 538, "和": 539, "咲": 540, "善": 541, "四": 542, "國": 543, "園": 544, "圣": 545, "在": 546, "坂": 547, "堤": 548, "場": 549, "塘": 550, "夕": 551, "大": 552, "天": 553, "夫": 554, "女": 555, "妙": 556, "姚": 557, "子": 558, "孟": 559, "守": 560, "安": 561, "宋": 562, "完": 563, "宗": 564, "宝": 565, "宫": 566, "寝": 567, "寺": 568, "小": 569, "少": 570, "尾": 571, "山": 572, "岳": 573, "川": 574, "州": 575, "巳": 576, "市": 577, "師": 578, "平": 579, "广": 580, "庆": 581, "府": 582, "座": 583, "廬": 584, "建": 585, "式": 586, "張": 587, "彌": 588, "彩": 589, "彼": 590, "後": 591, "御": 592, "德": 593, "思": 594, "愛": 595, "憑": 596, "憶": 597, "應": 598, "懷": 599, "战": 600, "戦": 601, "扈": 602, "技": 603, "拉": 604, "拳": 605, "挑": 606, "揺": 607, "攻": 608, "放": 609, "政": 610, "散": 611, "斯": 612, "方": 613, "日": 614, "旦": 615, "旭": 616, "昌": 617, "明": 618, "星": 619, "春": 620, "晋": 621, "景": 622, "曦": 623, "月": 624, "望": 625, "未": 626, "本": 627, "李": 628, "村": 629, "杜": 630, "束": 631, "来": 632, "林": 633, "桜": 634, "梶": 635, "棘": 636, "椎": 637, "楊": 638, "楚": 639, "榮": 640, "橘": 641, "機": 642, "正": 643, "殻": 644, "殿": 645, "母": 646, "水": 647, "汉": 648, "沂": 649, "沙": 650, "河": 651, "泗": 652, "波": 653, "泣": 654, "洪": 655, "淹": 656, "清": 657, "湯": 658, "漢": 659, "澄": 660, "澤": 661, "火": 662, "灯": 663, "灵": 664, "灼": 665, "焼": 666, "熱": 667, "物": 668, "狐": 669, "狸": 670, "玄": 671, "王": 672, "玩": 673, "珂": 674, "珙": 675, "球": 676, "理": 677, "琦": 678, "琪": 679, "瓊": 680, "生": 681, "田": 682, "畢": 683, "番": 684, "瘡": 685, "白": 686, "皮": 687, "真": 688, "砲": 689, "礮": 690, "祈": 691, "神": 692, "祠": 693, "秋": 694, "空": 695, "立": 696, "精": 697, "約": 698, "絵": 699, "織": 700, "義": 701, "翠": 702, "者": 703, "耕": 704, "肖": 705, "胡": 706, "膀": 707, "臂": 708, "興": 709, "良": 710, "花": 711, "芳": 712, "芽": 713, "若": 714, "英": 715, "藕": 716, "藥": 717, "蘄": 718, "蘇": 719, "行": 720, "裁": 721, "規": 722, "覺": 723, "观": 724, "解": 725, "記": 726, "誓": 727, "誡": 728, "誰": 729, "謎": 730, "许": 731, "谭": 732, "豪": 733, "豫": 734, "費": 735, "贵": 736, "赤": 737, "趙": 738, "足": 739, "跡": 740, "転": 741, "辛": 742, "逆": 743, "遇": 744, "運": 745, "過": 746, "遠": 747, "選": 748, "邦": 749, "邱": 750, "部": 751, "郭": 752, "都": 753, "酈": 754, "里": 755, "野": 756, "金": 757, "銃": 758, "鋼": 759, "錄": 760, "錡": 761, "鍵": 762, "鐵": 763, "钱": 764, "铁": 765, "關": 766, "防": 767, "阿": 768, "陈": 769, "陳": 770, "陽": 771, "隊": 772, "階": 773, "集": 774, "雪": 775, "雲": 776, "霖": 777, "霹": 778, "靂": 779, "韓": 780, "願": 781, "顯": 782, "颜": 783, "马": 784, "高": 785, "龍": 786, "ﷲ": 787, "ﻋ": 788, "/": 789, "3": 790, "~": 791, "##a": 792, "##s": 793, "##h": 794, "##e": 795, "##r": 796, "##i": 797, "##n": 798, "##c": 799, "##p": 800, "##l": 801, "##o": 802, "##t": 803, "##b": 804, "##d": 805, "##m": 806, "##v": 807, "##g": 808, "##y": 809, "##u": 810, "##w": 811, "##3": 812, "##z": 813, "##k": 814, "##f": 815, "##0": 816, "##j": 817, "##9": 818, "##7": 819, "##6": 820, "##x": 821, "##q": 822, "##ʁ": 823, "##ᅦ": 824, "##ᄃ": 825, "##ᅩ": 826, "##ᆨ": 827, "##ᄅ": 828, "##ᅵ": 829, "##ᆸ": 830, "##ᄇ": 831, "##ᅧ": 832, "##ᆼ": 833, "##ᄋ": 834, "##ᆫ": 835, "##ᅢ": 836, "##1": 837, "##2": 838, "##4": 839, "##ł": 840, "##8": 841, "##5": 842, "##ɛ": 843, "##ə": 844, "##ˈ": 845, "##ʊ": 846, "##η": 847, "##μ": 848, "##τ": 849, "##ρ": 850, "##α": 851, "##ォ": 852, "##ル": 853, "##ト": 854, "##ゥ": 855, "##ナ": 856, "##ロ": 857, "##イ": 858, "##キ": 859, "##ъ": 860, "##з": 861, "##н": 862, "##е": 863, "##с": 864, "##и": 865, "##ャ": 866, "##モ": 867, "##ン": 868, "##ッ": 869, "##ラ": 870, "##ー": 871, "##া": 872, "##হ": 873, "##フ": 874, "##ɒ": 875, "##の": 876, "##な": 877, "##ら": 878, "##β": 879, "##ล": 880, "##ว": 881, "##ง": 882, "##พ": 883, "##ไ": 884, "##ช": 885, "##ย": 886, "##า": 887, "##ร": 888, "##ø": 889, "##ป": 890, "##し": 891, "##た": 892, "##ل": 893, "##ا": 894, "##ه": 895, "##ː": 896, "##อ": 897, "##ก": 898, "##º": 899, "##о": 900, "##в": 901, "##т": 902, "##к": 903, "##か": 904, "##う": 905, "##פ": 906, "##ה": 907, "##а": 908, "##л": 909, "##ы": 910, "##ث": 911, "##م": 912, "##د": 913, "##ჲ": 914, "##ɑ": 915, "##ܠ": 916, "##ܗ": 917, "##ܐ": 918, "##ლ": 919, "##მ": 920, "##წ": 921, "##ი": 922, "##ფ": 923, "##ე": 924, "##く": 925, "##み": 926, "##こ": 927, "##と": 928, "##ל": 929, "##א": 930, "##ხ": 931, "##დ": 932, "##ა": 933, "##რ": 934, "##ณ": 935, "##ม": 936, "##ต": 937, "##ɡ": 938, "##æ": 939, "##ᵻ": 940, "##ʒ": 941, "##カ": 942, "##χ": 943, "##გ": 944, "##ვ": 945, "##ו": 946, "##נ": 947, "##ク": 948, "##タ": 949, "##ム": 950, "##チ": 951, "##ェ": 952, "##ο": 953, "##υ": 954, "##ς": 955, "##д": 956, "##р": 957, "##ω": 958, "##ε": 959, "##ι": 960, "##ฮ": 961, "##ı": 962, "##י": 963, "##ס": 964, "##テ": 965, "##レ": 966, "##つ": 967, "##せ": 968, "##ん": 969, "##ภ": 970, "##ด": 971, "##き": 972, "##θ": 973, "##ɔ": 974, "##п": 975, "##り": 976, "##र": 977, "##ف": 978, "##ر": 979, "##س": 980, "##ن": 981, "##ɫ": 982, "##ש": 983, "##מ": 984, "##צ": 985, "##γ": 986, "##ツ": 987, "##ネ": 988, "##ാ": 989, "##ഹ": 990, "##ш": 991, "##ц": 992, "##ь": 993, "##ს": 994, "##ო": 995, "##თ": 996, "##უ": 997, "##ɪ": 998, "##れ": 999, "##い": 1000, "##ス": 1001, "##ィ": 1002, "##ハ": 1003, "##ʻ": 1004, "##ء": 1005, "##ʔ": 1006, "##ɜ": 1007, "##є": 1008, "##λ": 1009, "##ア": 1010, "##ן": 1011, "##っ": 1012, "##ょ": 1013, "##に": 1014, "##ב": 1015, "##ר": 1016, "##ם": 1017, "##ν": 1018, "##σ": 1019, "##ю": 1020, "##ള": 1021, "##ウ": 1022, "##ァ": 1023, "##ュ": 1024, "##リ": 1025, "##3": 1026, "##ჳ": 1027, "##ܕ": 1028, "##ܝ": 1029, "##ܢ": 1030, "##ܬ": 1031, "##đ": 1032, "##ტ": 1033, "##ð": 1034, "##ξ": 1035, "##す": 1036, "##ひ": 1037, "##ਲ": 1038, "##ਾ": 1039, "##ਹ": 1040, "##め": 1041, "##я": 1042, "##ي": 1043, "##ت": 1044, "##ल": 1045, "##あ": 1046, "##ʿ": 1047, "##ʃ": 1048, "##ा": 1049, "##द": 1050, "##ニ": 1051, "##δ": 1052, "##ɾ": 1053, "##ع": 1054, "##ة": 1055, "##シ": 1056, "##ョ": 1057, "##ई": 1058, "##ش": 1059, "##خ": 1060, "##ب": 1061, "##を": 1062, "##ค": 1063, "##ß": 1064, "##は": 1065, "##ˌ": 1066, "##ك": 1067, "##ण": 1068, "##ც": 1069, "##न": 1070, "##π": 1071, "##ち": 1072, "##ゃ": 1073, "##ψ": 1074, "##ق": 1075, "##و": 1076, "##ף": 1077, "##ษ": 1078, "##ฐ": 1079, "##ि": 1080, "##ゆ": 1081, "##κ": 1082, "##ซ": 1083, "##お": 1084, "##ᅡ": 1085, "##ᆯ": 1086, "##ص": 1087, "##ת": 1088, "##ذ": 1089, "##व": 1090, "##ह": 1091, "##क": 1092, "##マ": 1093, "##ნ": 1094, "##ɐ": 1095, "##ɽ": 1096, "##ま": 1097, "##х": 1098, "##у": 1099, "##る": 1100, "##サ": 1101, "##ɳ": 1102, "##セ": 1103, "##オ": 1104, "##エ": 1105, "##ᅮ": 1106, "##わ": 1107, "##ミ": 1108, "##स": 1109, "##แ": 1110, "##も": 1111, "##œ": 1112, "##ল": 1113, "##ქ": 1114, "##เ": 1115, "##ح": 1116, "##г": 1117, "##ж": 1118, "##ჱ": 1119, "##ग": 1120, "##ʲ": 1121, "##ะ": 1122, "##น": 1123, "##ノ": 1124, "##м": 1125 } } }