{ "version": "1.0", "truncation": null, "padding": null, "added_tokens": [ { "id": 0, "content": "<s>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true, "special": true }, { "id": 1, "content": "<pad>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true, "special": true }, { "id": 2, "content": "</s>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true, "special": true }, { "id": 3, "content": "<unk>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true, "special": true }, { "id": 4, "content": "<mask>", "single_word": false, "lstrip": true, "rstrip": false, "normalized": false, "special": true } ], "normalizer": null, "pre_tokenizer": { "type": "ByteLevel", "add_prefix_space": false, "trim_offsets": true, "use_regex": true }, "post_processor": { "type": "RobertaProcessing", "sep": [ "</s>", 2 ], "cls": [ "<s>", 0 ], "trim_offsets": true, "add_prefix_space": false }, "decoder": { "type": "ByteLevel", "add_prefix_space": true, "trim_offsets": true, "use_regex": true }, "model": { "type": "BPE", "dropout": null, "unk_token": null, "continuing_subword_prefix": "", "end_of_word_suffix": "", "fuse_unk": false, "byte_fallback": false, "ignore_merges": false, "vocab": { "<s>": 0, "<pad>": 1, "</s>": 2, "<unk>": 3, "<mask>": 4, "c": 5, "C": 6, "(": 7, ")": 8, "O": 9, "1": 10, "2": 11, "=": 12, "N": 13, ".": 14, "n": 15, "3": 16, "F": 17, "Cl": 18, ">>": 19, "~": 20, "-": 21, "4": 22, "[C@H]": 23, "S": 24, "[C@@H]": 25, "[O-]": 26, "Br": 27, "#": 28, "/": 29, "[nH]": 30, "[N+]": 31, "s": 32, "5": 33, "o": 34, "P": 35, "[Na+]": 36, "[Si]": 37, "I": 38, "[Na]": 39, "[Pd]": 40, "[K+]": 41, "[K]": 42, "[P]": 43, "B": 44, "[C@]": 45, "[C@@]": 46, "[Cl-]": 47, "6": 48, "[OH-]": 49, "\\": 50, "[N-]": 51, "[Li]": 52, "[H]": 53, "[2H]": 54, "[NH4+]": 55, "[c-]": 56, "[P-]": 57, "[Cs+]": 58, "[Li+]": 59, "[Cs]": 60, "[NaH]": 61, "[H-]": 62, "[O+]": 63, "[BH4-]": 64, "[Cu]": 65, "7": 66, "[Mg]": 67, "[Fe+2]": 68, "[n+]": 69, "[Sn]": 70, "[BH-]": 71, "[Pd+2]": 72, "[CH]": 73, "[I-]": 74, "[Br-]": 75, "[C-]": 76, "[Zn]": 77, "[B-]": 78, "[F-]": 79, "[Al]": 80, "[P+]": 81, "[BH3-]": 82, "[Fe]": 83, "[C]": 84, "[AlH4]": 85, "[Ni]": 86, "[SiH]": 87, "8": 88, "[Cu+2]": 89, "[Mn]": 90, "[AlH]": 91, "[nH+]": 92, "[AlH4-]": 93, "[O-2]": 94, "[Cr]": 95, "[Mg+2]": 96, "[NH3+]": 97, "[S@]": 98, "[Pt]": 99, "[Al+3]": 100, "[S@@]": 101, "[S-]": 102, "[Ti]": 103, "[Zn+2]": 104, "[PH]": 105, "[NH2+]": 106, "[Ru]": 107, "[Ag+]": 108, "[S+]": 109, "[I+3]": 110, "[NH+]": 111, "[Ca+2]": 112, "[Ag]": 113, "9": 114, "[Os]": 115, "[Se]": 116, "[SiH2]": 117, "[Ca]": 118, "[Ti+4]": 119, "[Ac]": 120, "[Cu+]": 121, "[S]": 122, "[Rh]": 123, "[Cl+3]": 124, "[cH-]": 125, "[Zn+]": 126, "[O]": 127, "[Cl+]": 128, "[SH]": 129, "[H+]": 130, "[Pd+]": 131, "[se]": 132, "[PH+]": 133, "[I]": 134, "[Pt+2]": 135, "[C+]": 136, "[Mg+]": 137, "[Hg]": 138, "[W]": 139, "[SnH]": 140, "[SiH3]": 141, "[Fe+3]": 142, "[NH]": 143, "[Mo]": 144, "[CH2+]": 145, "%10": 146, "[CH2-]": 147, "[CH2]": 148, "[n-]": 149, "[Ce+4]": 150, "[NH-]": 151, "[Co]": 152, "[I+]": 153, "[PH2]": 154, "[Pt+4]": 155, "[Ce]": 156, "[B]": 157, "[Sn+2]": 158, "[Ba+2]": 159, "%11": 160, "[Fe-3]": 161, "[18F]": 162, "[SH-]": 163, "[Pb+2]": 164, "[Os-2]": 165, "[Zr+4]": 166, "[N]": 167, "[Ir]": 168, "[Bi]": 169, "[Ni+2]": 170, "[P@]": 171, "[Co+2]": 172, "[s+]": 173, "[As]": 174, "[P+3]": 175, "[Hg+2]": 176, "[Yb+3]": 177, "[CH-]": 178, "[Zr+2]": 179, "[Mn+2]": 180, "[CH+]": 181, "[In]": 182, "[KH]": 183, "[Ce+3]": 184, "[Zr]": 185, "[AlH2-]": 186, "[OH2+]": 187, "[Ti+3]": 188, "[Rh+2]": 189, "[Sb]": 190, "[S-2]": 191, "%12": 192, "[P@@]": 193, "[Si@H]": 194, "[Mn+4]": 195, "p": 196, "[Ba]": 197, "[NH2-]": 198, "[Ge]": 199, "[Pb+4]": 200, "[Cr+3]": 201, "[Au]": 202, "[LiH]": 203, "[Sc+3]": 204, "[o+]": 205, "[Rh-3]": 206, "%13": 207, "[Br]": 208, "[Sb-]": 209, "[S@+]": 210, "[I+2]": 211, "[Ar]": 212, "[V]": 213, "[Cu-]": 214, "[Al-]": 215, "[Te]": 216, "[13c]": 217, "[13C]": 218, "[Cl]": 219, "[PH4+]": 220, "[SiH4]": 221, "[te]": 222, "[CH3-]": 223, "[S@@+]": 224, "[Rh+3]": 225, "[SH+]": 226, "[Bi+3]": 227, "[Br+2]": 228, "[La]": 229, "[La+3]": 230, "[Pt-2]": 231, "[N@@]": 232, "[PH3+]": 233, "[N@]": 234, "[Si+4]": 235, "[Sr+2]": 236, "[Al+]": 237, "[Pb]": 238, "[SeH]": 239, "[Si-]": 240, "[V+5]": 241, "[Y+3]": 242, "[Re]": 243, "[Ru+]": 244, "[Sm]": 245, "*": 246, "[3H]": 247, "[NH2]": 248, "[Ag-]": 249, "[13CH3]": 250, "[OH+]": 251, "[Ru+3]": 252, "[OH]": 253, "[Gd+3]": 254, "[13CH2]": 255, "[In+3]": 256, "[Si@@]": 257, "[Si@]": 258, "[Ti+2]": 259, "[Sn+]": 260, "[Cl+2]": 261, "[AlH-]": 262, "[Pd-2]": 263, "[SnH3]": 264, "[B+3]": 265, "[Cu-2]": 266, "[Nd+3]": 267, "[Pb+3]": 268, "[13cH]": 269, "[Fe-4]": 270, "[Ga]": 271, "[Sn+4]": 272, "[Hg+]": 273, "[11CH3]": 274, "[Hf]": 275, "[Pr]": 276, "[Y]": 277, "[S+2]": 278, "[Cd]": 279, "[Cr+6]": 280, "[Zr+3]": 281, "[Rh+]": 282, "[CH3]": 283, "[N-3]": 284, "[Hf+2]": 285, "[Th]": 286, "[Sb+3]": 287, "%14": 288, "[Cr+2]": 289, "[Ru+2]": 290, "[Hf+4]": 291, "[14C]": 292, "[Ta]": 293, "[Tl+]": 294, "[B+]": 295, "[Os+4]": 296, "[PdH2]": 297, "[Pd-]": 298, "[Cd+2]": 299, "[Co+3]": 300, "[S+4]": 301, "[Nb+5]": 302, "[123I]": 303, "[c+]": 304, "[Rb+]": 305, "[V+2]": 306, "[CH3+]": 307, "[Ag+2]": 308, "[cH+]": 309, "[Mn+3]": 310, "[Se-]": 311, "[As-]": 312, "[Eu+3]": 313, "[SH2]": 314, "[Sm+3]": 315, "[IH+]": 316, "%15": 317, "[OH3+]": 318, "[PH3]": 319, "[IH2+]": 320, "[SH2+]": 321, "[Ir+3]": 322, "[AlH3]": 323, "[Sc]": 324, "[Yb]": 325, "[15NH2]": 326, "[Lu]": 327, "[sH+]": 328, "[Gd]": 329, "[18F-]": 330, "[SH3+]": 331, "[SnH4]": 332, "[TeH]": 333, "[Si@@H]": 334, "[Ga+3]": 335, "[CaH2]": 336, "[Tl]": 337, "[Ta+5]": 338, "[GeH]": 339, "[Br+]": 340, "[Sr]": 341, "[Tl+3]": 342, "[Sm+2]": 343, "[PH5]": 344, "%16": 345, "[N@@+]": 346, "[Au+3]": 347, "[C-4]": 348, "[Nd]": 349, "[Ti+]": 350, "[IH]": 351, "[N@+]": 352, "[125I]": 353, "[Eu]": 354, "[Sn+3]": 355, "[Nb]": 356, "[Er+3]": 357, "[123I-]": 358, "[14c]": 359, "%17": 360, "[SnH2]": 361, "[YH]": 362, "[Sb+5]": 363, "[Pr+3]": 364, "[Ir+]": 365, "[N+3]": 366, "[AlH2]": 367, "[19F]": 368, "%18": 369, "[Tb]": 370, "[14CH]": 371, "[Mo+4]": 372, "[Si+]": 373, "[BH]": 374, "[Be]": 375, "[Rb]": 376, "[pH]": 377, "%19": 378, "%20": 379, "[Xe]": 380, "[Ir-]": 381, "[Be+2]": 382, "[C+4]": 383, "[RuH2]": 384, "[15NH]": 385, "[U+2]": 386, "[Au-]": 387, "%21": 388, "%22": 389, "[Au+]": 390, "[15n]": 391, "[Al+2]": 392, "[Tb+3]": 393, "[15N]": 394, "[V+3]": 395, "[W+6]": 396, "[14CH3]": 397, "[Cr+4]": 398, "[ClH+]": 399, "b": 400, "[Ti+6]": 401, "[Nd+]": 402, "[Zr+]": 403, "[PH2+]": 404, "[Fm]": 405, "[N@H+]": 406, "[RuH]": 407, "[Dy+3]": 408, "%23": 409, "[Hf+3]": 410, "[W+4]": 411, "[11C]": 412, "[13CH]": 413, "[Er]": 414, "[124I]": 415, "[LaH]": 416, "[F]": 417, "[siH]": 418, "[Ga+]": 419, "[Cm]": 420, "[GeH3]": 421, "[IH-]": 422, "[U+6]": 423, "[SeH+]": 424, "[32P]": 425, "[SeH-]": 426, "[Pt-]": 427, "[Ir+2]": 428, "[se+]": 429, "[U]": 430, "[F+]": 431, "[BH2]": 432, "[As+]": 433, "[Cf]": 434, "[ClH2+]": 435, "[Ni+]": 436, "[TeH3]": 437, "[SbH2]": 438, "[Ag+3]": 439, "%24": 440, "[18O]": 441, "[PH4]": 442, "[Os+2]": 443, "[Na-]": 444, "[Sb+2]": 445, "[V+4]": 446, "[Ho+3]": 447, "[68Ga]": 448, "[PH-]": 449, "[Bi+2]": 450, "[Ce+2]": 451, "[Pd+3]": 452, "[99Tc]": 453, "[13C@@H]": 454, "[Fe+6]": 455, "[c]": 456, "[GeH2]": 457, "[10B]": 458, "[Cu+3]": 459, "[Mo+2]": 460, "[Cr+]": 461, "[Pd+4]": 462, "[Dy]": 463, "[AsH]": 464, "[Ba+]": 465, "[SeH2]": 466, "[In+]": 467, "[TeH2]": 468, "[BrH+]": 469, "[14cH]": 470, "[W+]": 471, "[13C@H]": 472, "[AsH2]": 473, "[In+2]": 474, "[N+2]": 475, "[N@@H+]": 476, "[SbH]": 477, "[60Co]": 478, "[AsH4+]": 479, "[AsH3]": 480, "[18OH]": 481, "[Ru-2]": 482, "[Na-2]": 483, "[CuH2]": 484, "[31P]": 485, "[Ti+5]": 486, "[35S]": 487, "[P@@H]": 488, "[ArH]": 489, "[Co+]": 490, "[Zr-2]": 491, "[BH2-]": 492, "[131I]": 493, "[SH5]": 494, "[VH]": 495, "[B+2]": 496, "[Yb+2]": 497, "[14C@H]": 498, "[211At]": 499, "[NH3+2]": 500, "[IrH]": 501, "[IrH2]": 502, "[Rh-]": 503, "[Cr-]": 504, "[Sb+]": 505, "[Ni+3]": 506, "[TaH3]": 507, "[Tl+2]": 508, "[64Cu]": 509, "[Tc]": 510, "[Cd+]": 511, "[1H]": 512, "[15nH]": 513, "[AlH2+]": 514, "[FH+2]": 515, "[BiH3]": 516, "[Ru-]": 517, "[Mo+6]": 518, "[AsH+]": 519, "[BaH2]": 520, "[BaH]": 521, "[Fe+4]": 522, "[229Th]": 523, "[Th+4]": 524, "[As+3]": 525, "[NH+3]": 526, "[P@H]": 527, "[Li-]": 528, "[7NaH]": 529, "[Bi+]": 530, "[PtH+2]": 531, "[p-]": 532, "[Re+5]": 533, "[NiH]": 534, "[Ni-]": 535, "[Xe+]": 536, "[Ca+]": 537, "[11c]": 538, "[Rh+4]": 539, "[AcH]": 540, "[HeH]": 541, "[Sc+2]": 542, "[Mn+]": 543, "[UH]": 544, "[14CH2]": 545, "[SiH4+]": 546, "[18OH2]": 547, "[Ac-]": 548, "[Re+4]": 549, "[118Sn]": 550, "[153Sm]": 551, "[P+2]": 552, "[9CH]": 553, "[9CH3]": 554, "[Y-]": 555, "[NiH2]": 556, "[Si+2]": 557, "[Mn+6]": 558, "[ZrH2]": 559, "[C-2]": 560, "[Bi+5]": 561, "[24NaH]": 562, "[Fr]": 563, "[15CH]": 564, "[Se+]": 565, "[At]": 566, "[P-3]": 567, "[124I-]": 568, "[CuH2-]": 569, "[Nb+4]": 570, "[Nb+3]": 571, "[MgH]": 572, "[Ir+4]": 573, "[67Ga+3]": 574, "[67Ga]": 575, "[13N]": 576, "[15OH2]": 577, "[2NH]": 578, "[Ho]": 579, "[Cn]": 580 }, "merges": [] } }