{ "version": "1.0", "truncation": null, "padding": null, "added_tokens": [ { "id": 0, "content": "[PAD]", "single_word": false, "lstrip": false, "rstrip": false, "normalized": false, "special": true }, { "id": 11, "content": "[UNK]", "single_word": false, "lstrip": false, "rstrip": false, "normalized": false, "special": true }, { "id": 12, "content": "[CLS]", "single_word": false, "lstrip": false, "rstrip": false, "normalized": false, "special": true }, { "id": 13, "content": "[SEP]", "single_word": false, "lstrip": false, "rstrip": false, "normalized": false, "special": true }, { "id": 14, "content": "[MASK]", "single_word": false, "lstrip": true, "rstrip": false, "normalized": false, "special": true }, { "id": 591, "content": "", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true, "special": true }, { "id": 592, "content": "", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true, "special": true } ], "normalizer": null, "pre_tokenizer": { "type": "ByteLevel", "add_prefix_space": false, "trim_offsets": true, "use_regex": true }, "post_processor": { "type": "RobertaProcessing", "sep": [ "[SEP]", 13 ], "cls": [ "[CLS]", 12 ], "trim_offsets": true, "add_prefix_space": false }, "decoder": { "type": "ByteLevel", "add_prefix_space": true, "trim_offsets": true, "use_regex": true }, "model": { "type": "BPE", "dropout": null, "unk_token": null, "continuing_subword_prefix": "", "end_of_word_suffix": "", "fuse_unk": false, "byte_fallback": false, "ignore_merges": false, "vocab": { "[PAD]": 0, "[unused1]": 1, "[unused2]": 2, "[unused3]": 3, "[unused4]": 4, "[unused5]": 5, "[unused6]": 6, "[unused7]": 7, "[unused8]": 8, "[unused9]": 9, "[unused10]": 10, "[UNK]": 11, "[CLS]": 12, "[SEP]": 13, "[MASK]": 14, "c": 15, "C": 16, "(": 17, ")": 18, "O": 19, "1": 20, "2": 21, "=": 22, "N": 23, ".": 24, "n": 25, "3": 26, "F": 27, "Cl": 28, ">>": 29, "~": 30, "-": 31, "4": 32, "[C@H]": 33, "S": 34, "[C@@H]": 35, "[O-]": 36, "Br": 37, "#": 38, "/": 39, "[nH]": 40, "[N+]": 41, "s": 42, "5": 43, "o": 44, "P": 45, "[Na+]": 46, "[Si]": 47, "I": 48, "[Na]": 49, "[Pd]": 50, "[K+]": 51, "[K]": 52, "[P]": 53, "B": 54, "[C@]": 55, "[C@@]": 56, "[Cl-]": 57, "6": 58, "[OH-]": 59, "\\": 60, "[N-]": 61, "[Li]": 62, "[H]": 63, "[2H]": 64, "[NH4+]": 65, "[c-]": 66, "[P-]": 67, "[Cs+]": 68, "[Li+]": 69, "[Cs]": 70, "[NaH]": 71, "[H-]": 72, "[O+]": 73, "[BH4-]": 74, "[Cu]": 75, "7": 76, "[Mg]": 77, "[Fe+2]": 78, "[n+]": 79, "[Sn]": 80, "[BH-]": 81, "[Pd+2]": 82, "[CH]": 83, "[I-]": 84, "[Br-]": 85, "[C-]": 86, "[Zn]": 87, "[B-]": 88, "[F-]": 89, "[Al]": 90, "[P+]": 91, "[BH3-]": 92, "[Fe]": 93, "[C]": 94, "[AlH4]": 95, "[Ni]": 96, "[SiH]": 97, "8": 98, "[Cu+2]": 99, "[Mn]": 100, "[AlH]": 101, "[nH+]": 102, "[AlH4-]": 103, "[O-2]": 104, "[Cr]": 105, "[Mg+2]": 106, "[NH3+]": 107, "[S@]": 108, "[Pt]": 109, "[Al+3]": 110, "[S@@]": 111, "[S-]": 112, "[Ti]": 113, "[Zn+2]": 114, "[PH]": 115, "[NH2+]": 116, "[Ru]": 117, "[Ag+]": 118, "[S+]": 119, "[I+3]": 120, "[NH+]": 121, "[Ca+2]": 122, "[Ag]": 123, "9": 124, "[Os]": 125, "[Se]": 126, "[SiH2]": 127, "[Ca]": 128, "[Ti+4]": 129, "[Ac]": 130, "[Cu+]": 131, "[S]": 132, "[Rh]": 133, "[Cl+3]": 134, "[cH-]": 135, "[Zn+]": 136, "[O]": 137, "[Cl+]": 138, "[SH]": 139, "[H+]": 140, "[Pd+]": 141, "[se]": 142, "[PH+]": 143, "[I]": 144, "[Pt+2]": 145, "[C+]": 146, "[Mg+]": 147, "[Hg]": 148, "[W]": 149, "[SnH]": 150, "[SiH3]": 151, "[Fe+3]": 152, "[NH]": 153, "[Mo]": 154, "[CH2+]": 155, "%10": 156, "[CH2-]": 157, "[CH2]": 158, "[n-]": 159, "[Ce+4]": 160, "[NH-]": 161, "[Co]": 162, "[I+]": 163, "[PH2]": 164, "[Pt+4]": 165, "[Ce]": 166, "[B]": 167, "[Sn+2]": 168, "[Ba+2]": 169, "%11": 170, "[Fe-3]": 171, "[18F]": 172, "[SH-]": 173, "[Pb+2]": 174, "[Os-2]": 175, "[Zr+4]": 176, "[N]": 177, "[Ir]": 178, "[Bi]": 179, "[Ni+2]": 180, "[P@]": 181, "[Co+2]": 182, "[s+]": 183, "[As]": 184, "[P+3]": 185, "[Hg+2]": 186, "[Yb+3]": 187, "[CH-]": 188, "[Zr+2]": 189, "[Mn+2]": 190, "[CH+]": 191, "[In]": 192, "[KH]": 193, "[Ce+3]": 194, "[Zr]": 195, "[AlH2-]": 196, "[OH2+]": 197, "[Ti+3]": 198, "[Rh+2]": 199, "[Sb]": 200, "[S-2]": 201, "%12": 202, "[P@@]": 203, "[Si@H]": 204, "[Mn+4]": 205, "p": 206, "[Ba]": 207, "[NH2-]": 208, "[Ge]": 209, "[Pb+4]": 210, "[Cr+3]": 211, "[Au]": 212, "[LiH]": 213, "[Sc+3]": 214, "[o+]": 215, "[Rh-3]": 216, "%13": 217, "[Br]": 218, "[Sb-]": 219, "[S@+]": 220, "[I+2]": 221, "[Ar]": 222, "[V]": 223, "[Cu-]": 224, "[Al-]": 225, "[Te]": 226, "[13c]": 227, "[13C]": 228, "[Cl]": 229, "[PH4+]": 230, "[SiH4]": 231, "[te]": 232, "[CH3-]": 233, "[S@@+]": 234, "[Rh+3]": 235, "[SH+]": 236, "[Bi+3]": 237, "[Br+2]": 238, "[La]": 239, "[La+3]": 240, "[Pt-2]": 241, "[N@@]": 242, "[PH3+]": 243, "[N@]": 244, "[Si+4]": 245, "[Sr+2]": 246, "[Al+]": 247, "[Pb]": 248, "[SeH]": 249, "[Si-]": 250, "[V+5]": 251, "[Y+3]": 252, "[Re]": 253, "[Ru+]": 254, "[Sm]": 255, "*": 256, "[3H]": 257, "[NH2]": 258, "[Ag-]": 259, "[13CH3]": 260, "[OH+]": 261, "[Ru+3]": 262, "[OH]": 263, "[Gd+3]": 264, "[13CH2]": 265, "[In+3]": 266, "[Si@@]": 267, "[Si@]": 268, "[Ti+2]": 269, "[Sn+]": 270, "[Cl+2]": 271, "[AlH-]": 272, "[Pd-2]": 273, "[SnH3]": 274, "[B+3]": 275, "[Cu-2]": 276, "[Nd+3]": 277, "[Pb+3]": 278, "[13cH]": 279, "[Fe-4]": 280, "[Ga]": 281, "[Sn+4]": 282, "[Hg+]": 283, "[11CH3]": 284, "[Hf]": 285, "[Pr]": 286, "[Y]": 287, "[S+2]": 288, "[Cd]": 289, "[Cr+6]": 290, "[Zr+3]": 291, "[Rh+]": 292, "[CH3]": 293, "[N-3]": 294, "[Hf+2]": 295, "[Th]": 296, "[Sb+3]": 297, "%14": 298, "[Cr+2]": 299, "[Ru+2]": 300, "[Hf+4]": 301, "[14C]": 302, "[Ta]": 303, "[Tl+]": 304, "[B+]": 305, "[Os+4]": 306, "[PdH2]": 307, "[Pd-]": 308, "[Cd+2]": 309, "[Co+3]": 310, "[S+4]": 311, "[Nb+5]": 312, "[123I]": 313, "[c+]": 314, "[Rb+]": 315, "[V+2]": 316, "[CH3+]": 317, "[Ag+2]": 318, "[cH+]": 319, "[Mn+3]": 320, "[Se-]": 321, "[As-]": 322, "[Eu+3]": 323, "[SH2]": 324, "[Sm+3]": 325, "[IH+]": 326, "%15": 327, "[OH3+]": 328, "[PH3]": 329, "[IH2+]": 330, "[SH2+]": 331, "[Ir+3]": 332, "[AlH3]": 333, "[Sc]": 334, "[Yb]": 335, "[15NH2]": 336, "[Lu]": 337, "[sH+]": 338, "[Gd]": 339, "[18F-]": 340, "[SH3+]": 341, "[SnH4]": 342, "[TeH]": 343, "[Si@@H]": 344, "[Ga+3]": 345, "[CaH2]": 346, "[Tl]": 347, "[Ta+5]": 348, "[GeH]": 349, "[Br+]": 350, "[Sr]": 351, "[Tl+3]": 352, "[Sm+2]": 353, "[PH5]": 354, "%16": 355, "[N@@+]": 356, "[Au+3]": 357, "[C-4]": 358, "[Nd]": 359, "[Ti+]": 360, "[IH]": 361, "[N@+]": 362, "[125I]": 363, "[Eu]": 364, "[Sn+3]": 365, "[Nb]": 366, "[Er+3]": 367, "[123I-]": 368, "[14c]": 369, "%17": 370, "[SnH2]": 371, "[YH]": 372, "[Sb+5]": 373, "[Pr+3]": 374, "[Ir+]": 375, "[N+3]": 376, "[AlH2]": 377, "[19F]": 378, "%18": 379, "[Tb]": 380, "[14CH]": 381, "[Mo+4]": 382, "[Si+]": 383, "[BH]": 384, "[Be]": 385, "[Rb]": 386, "[pH]": 387, "%19": 388, "%20": 389, "[Xe]": 390, "[Ir-]": 391, "[Be+2]": 392, "[C+4]": 393, "[RuH2]": 394, "[15NH]": 395, "[U+2]": 396, "[Au-]": 397, "%21": 398, "%22": 399, "[Au+]": 400, "[15n]": 401, "[Al+2]": 402, "[Tb+3]": 403, "[15N]": 404, "[V+3]": 405, "[W+6]": 406, "[14CH3]": 407, "[Cr+4]": 408, "[ClH+]": 409, "b": 410, "[Ti+6]": 411, "[Nd+]": 412, "[Zr+]": 413, "[PH2+]": 414, "[Fm]": 415, "[N@H+]": 416, "[RuH]": 417, "[Dy+3]": 418, "%23": 419, "[Hf+3]": 420, "[W+4]": 421, "[11C]": 422, "[13CH]": 423, "[Er]": 424, "[124I]": 425, "[LaH]": 426, "[F]": 427, "[siH]": 428, "[Ga+]": 429, "[Cm]": 430, "[GeH3]": 431, "[IH-]": 432, "[U+6]": 433, "[SeH+]": 434, "[32P]": 435, "[SeH-]": 436, "[Pt-]": 437, "[Ir+2]": 438, "[se+]": 439, "[U]": 440, "[F+]": 441, "[BH2]": 442, "[As+]": 443, "[Cf]": 444, "[ClH2+]": 445, "[Ni+]": 446, "[TeH3]": 447, "[SbH2]": 448, "[Ag+3]": 449, "%24": 450, "[18O]": 451, "[PH4]": 452, "[Os+2]": 453, "[Na-]": 454, "[Sb+2]": 455, "[V+4]": 456, "[Ho+3]": 457, "[68Ga]": 458, "[PH-]": 459, "[Bi+2]": 460, "[Ce+2]": 461, "[Pd+3]": 462, "[99Tc]": 463, "[13C@@H]": 464, "[Fe+6]": 465, "[c]": 466, "[GeH2]": 467, "[10B]": 468, "[Cu+3]": 469, "[Mo+2]": 470, "[Cr+]": 471, "[Pd+4]": 472, "[Dy]": 473, "[AsH]": 474, "[Ba+]": 475, "[SeH2]": 476, "[In+]": 477, "[TeH2]": 478, "[BrH+]": 479, "[14cH]": 480, "[W+]": 481, "[13C@H]": 482, "[AsH2]": 483, "[In+2]": 484, "[N+2]": 485, "[N@@H+]": 486, "[SbH]": 487, "[60Co]": 488, "[AsH4+]": 489, "[AsH3]": 490, "[18OH]": 491, "[Ru-2]": 492, "[Na-2]": 493, "[CuH2]": 494, "[31P]": 495, "[Ti+5]": 496, "[35S]": 497, "[P@@H]": 498, "[ArH]": 499, "[Co+]": 500, "[Zr-2]": 501, "[BH2-]": 502, "[131I]": 503, "[SH5]": 504, "[VH]": 505, "[B+2]": 506, "[Yb+2]": 507, "[14C@H]": 508, "[211At]": 509, "[NH3+2]": 510, "[IrH]": 511, "[IrH2]": 512, "[Rh-]": 513, "[Cr-]": 514, "[Sb+]": 515, "[Ni+3]": 516, "[TaH3]": 517, "[Tl+2]": 518, "[64Cu]": 519, "[Tc]": 520, "[Cd+]": 521, "[1H]": 522, "[15nH]": 523, "[AlH2+]": 524, "[FH+2]": 525, "[BiH3]": 526, "[Ru-]": 527, "[Mo+6]": 528, "[AsH+]": 529, "[BaH2]": 530, "[BaH]": 531, "[Fe+4]": 532, "[229Th]": 533, "[Th+4]": 534, "[As+3]": 535, "[NH+3]": 536, "[P@H]": 537, "[Li-]": 538, "[7NaH]": 539, "[Bi+]": 540, "[PtH+2]": 541, "[p-]": 542, "[Re+5]": 543, "[NiH]": 544, "[Ni-]": 545, "[Xe+]": 546, "[Ca+]": 547, "[11c]": 548, "[Rh+4]": 549, "[AcH]": 550, "[HeH]": 551, "[Sc+2]": 552, "[Mn+]": 553, "[UH]": 554, "[14CH2]": 555, "[SiH4+]": 556, "[18OH2]": 557, "[Ac-]": 558, "[Re+4]": 559, "[118Sn]": 560, "[153Sm]": 561, "[P+2]": 562, "[9CH]": 563, "[9CH3]": 564, "[Y-]": 565, "[NiH2]": 566, "[Si+2]": 567, "[Mn+6]": 568, "[ZrH2]": 569, "[C-2]": 570, "[Bi+5]": 571, "[24NaH]": 572, "[Fr]": 573, "[15CH]": 574, "[Se+]": 575, "[At]": 576, "[P-3]": 577, "[124I-]": 578, "[CuH2-]": 579, "[Nb+4]": 580, "[Nb+3]": 581, "[MgH]": 582, "[Ir+4]": 583, "[67Ga+3]": 584, "[67Ga]": 585, "[13N]": 586, "[15OH2]": 587, "[2NH]": 588, "[Ho]": 589, "[Cn]": 590 }, "merges": [] } }