| { |
| "version": "1.0", |
| "truncation": { |
| "direction": "Right", |
| "max_length": 512, |
| "strategy": "LongestFirst", |
| "stride": 0 |
| }, |
| "padding": { |
| "strategy": { |
| "Fixed": 512 |
| }, |
| "direction": "Right", |
| "pad_to_multiple_of": null, |
| "pad_id": 0, |
| "pad_type_id": 0, |
| "pad_token": "[PAD]" |
| }, |
| "added_tokens": [ |
| { |
| "id": 0, |
| "content": "[PAD]", |
| "single_word": false, |
| "lstrip": false, |
| "rstrip": false, |
| "normalized": true, |
| "special": true |
| }, |
| { |
| "id": 11, |
| "content": "[UNK]", |
| "single_word": false, |
| "lstrip": false, |
| "rstrip": false, |
| "normalized": true, |
| "special": true |
| }, |
| { |
| "id": 12, |
| "content": "[CLS]", |
| "single_word": false, |
| "lstrip": false, |
| "rstrip": false, |
| "normalized": true, |
| "special": true |
| }, |
| { |
| "id": 13, |
| "content": "[SEP]", |
| "single_word": false, |
| "lstrip": false, |
| "rstrip": false, |
| "normalized": true, |
| "special": true |
| }, |
| { |
| "id": 14, |
| "content": "[MASK]", |
| "single_word": false, |
| "lstrip": true, |
| "rstrip": false, |
| "normalized": false, |
| "special": true |
| }, |
| { |
| "id": 591, |
| "content": "<s>", |
| "single_word": false, |
| "lstrip": false, |
| "rstrip": false, |
| "normalized": true, |
| "special": true |
| }, |
| { |
| "id": 592, |
| "content": "</s>", |
| "single_word": false, |
| "lstrip": false, |
| "rstrip": false, |
| "normalized": true, |
| "special": true |
| } |
| ], |
| "normalizer": null, |
| "pre_tokenizer": { |
| "type": "ByteLevel", |
| "add_prefix_space": false, |
| "trim_offsets": true, |
| "use_regex": true |
| }, |
| "post_processor": { |
| "type": "RobertaProcessing", |
| "sep": [ |
| "[SEP]", |
| 13 |
| ], |
| "cls": [ |
| "[CLS]", |
| 12 |
| ], |
| "trim_offsets": true, |
| "add_prefix_space": false |
| }, |
| "decoder": { |
| "type": "ByteLevel", |
| "add_prefix_space": true, |
| "trim_offsets": true, |
| "use_regex": true |
| }, |
| "model": { |
| "type": "BPE", |
| "dropout": null, |
| "unk_token": null, |
| "continuing_subword_prefix": "", |
| "end_of_word_suffix": "", |
| "fuse_unk": false, |
| "byte_fallback": false, |
| "ignore_merges": false, |
| "vocab": { |
| "[PAD]": 0, |
| "[unused1]": 1, |
| "[unused2]": 2, |
| "[unused3]": 3, |
| "[unused4]": 4, |
| "[unused5]": 5, |
| "[unused6]": 6, |
| "[unused7]": 7, |
| "[unused8]": 8, |
| "[unused9]": 9, |
| "[unused10]": 10, |
| "[UNK]": 11, |
| "[CLS]": 12, |
| "[SEP]": 13, |
| "[MASK]": 14, |
| "c": 15, |
| "C": 16, |
| "(": 17, |
| ")": 18, |
| "O": 19, |
| "1": 20, |
| "2": 21, |
| "=": 22, |
| "N": 23, |
| ".": 24, |
| "n": 25, |
| "3": 26, |
| "F": 27, |
| "Cl": 28, |
| ">>": 29, |
| "~": 30, |
| "-": 31, |
| "4": 32, |
| "[C@H]": 33, |
| "S": 34, |
| "[C@@H]": 35, |
| "[O-]": 36, |
| "Br": 37, |
| "#": 38, |
| "/": 39, |
| "[nH]": 40, |
| "[N+]": 41, |
| "s": 42, |
| "5": 43, |
| "o": 44, |
| "P": 45, |
| "[Na+]": 46, |
| "[Si]": 47, |
| "I": 48, |
| "[Na]": 49, |
| "[Pd]": 50, |
| "[K+]": 51, |
| "[K]": 52, |
| "[P]": 53, |
| "B": 54, |
| "[C@]": 55, |
| "[C@@]": 56, |
| "[Cl-]": 57, |
| "6": 58, |
| "[OH-]": 59, |
| "\\": 60, |
| "[N-]": 61, |
| "[Li]": 62, |
| "[H]": 63, |
| "[2H]": 64, |
| "[NH4+]": 65, |
| "[c-]": 66, |
| "[P-]": 67, |
| "[Cs+]": 68, |
| "[Li+]": 69, |
| "[Cs]": 70, |
| "[NaH]": 71, |
| "[H-]": 72, |
| "[O+]": 73, |
| "[BH4-]": 74, |
| "[Cu]": 75, |
| "7": 76, |
| "[Mg]": 77, |
| "[Fe+2]": 78, |
| "[n+]": 79, |
| "[Sn]": 80, |
| "[BH-]": 81, |
| "[Pd+2]": 82, |
| "[CH]": 83, |
| "[I-]": 84, |
| "[Br-]": 85, |
| "[C-]": 86, |
| "[Zn]": 87, |
| "[B-]": 88, |
| "[F-]": 89, |
| "[Al]": 90, |
| "[P+]": 91, |
| "[BH3-]": 92, |
| "[Fe]": 93, |
| "[C]": 94, |
| "[AlH4]": 95, |
| "[Ni]": 96, |
| "[SiH]": 97, |
| "8": 98, |
| "[Cu+2]": 99, |
| "[Mn]": 100, |
| "[AlH]": 101, |
| "[nH+]": 102, |
| "[AlH4-]": 103, |
| "[O-2]": 104, |
| "[Cr]": 105, |
| "[Mg+2]": 106, |
| "[NH3+]": 107, |
| "[S@]": 108, |
| "[Pt]": 109, |
| "[Al+3]": 110, |
| "[S@@]": 111, |
| "[S-]": 112, |
| "[Ti]": 113, |
| "[Zn+2]": 114, |
| "[PH]": 115, |
| "[NH2+]": 116, |
| "[Ru]": 117, |
| "[Ag+]": 118, |
| "[S+]": 119, |
| "[I+3]": 120, |
| "[NH+]": 121, |
| "[Ca+2]": 122, |
| "[Ag]": 123, |
| "9": 124, |
| "[Os]": 125, |
| "[Se]": 126, |
| "[SiH2]": 127, |
| "[Ca]": 128, |
| "[Ti+4]": 129, |
| "[Ac]": 130, |
| "[Cu+]": 131, |
| "[S]": 132, |
| "[Rh]": 133, |
| "[Cl+3]": 134, |
| "[cH-]": 135, |
| "[Zn+]": 136, |
| "[O]": 137, |
| "[Cl+]": 138, |
| "[SH]": 139, |
| "[H+]": 140, |
| "[Pd+]": 141, |
| "[se]": 142, |
| "[PH+]": 143, |
| "[I]": 144, |
| "[Pt+2]": 145, |
| "[C+]": 146, |
| "[Mg+]": 147, |
| "[Hg]": 148, |
| "[W]": 149, |
| "[SnH]": 150, |
| "[SiH3]": 151, |
| "[Fe+3]": 152, |
| "[NH]": 153, |
| "[Mo]": 154, |
| "[CH2+]": 155, |
| "%10": 156, |
| "[CH2-]": 157, |
| "[CH2]": 158, |
| "[n-]": 159, |
| "[Ce+4]": 160, |
| "[NH-]": 161, |
| "[Co]": 162, |
| "[I+]": 163, |
| "[PH2]": 164, |
| "[Pt+4]": 165, |
| "[Ce]": 166, |
| "[B]": 167, |
| "[Sn+2]": 168, |
| "[Ba+2]": 169, |
| "%11": 170, |
| "[Fe-3]": 171, |
| "[18F]": 172, |
| "[SH-]": 173, |
| "[Pb+2]": 174, |
| "[Os-2]": 175, |
| "[Zr+4]": 176, |
| "[N]": 177, |
| "[Ir]": 178, |
| "[Bi]": 179, |
| "[Ni+2]": 180, |
| "[P@]": 181, |
| "[Co+2]": 182, |
| "[s+]": 183, |
| "[As]": 184, |
| "[P+3]": 185, |
| "[Hg+2]": 186, |
| "[Yb+3]": 187, |
| "[CH-]": 188, |
| "[Zr+2]": 189, |
| "[Mn+2]": 190, |
| "[CH+]": 191, |
| "[In]": 192, |
| "[KH]": 193, |
| "[Ce+3]": 194, |
| "[Zr]": 195, |
| "[AlH2-]": 196, |
| "[OH2+]": 197, |
| "[Ti+3]": 198, |
| "[Rh+2]": 199, |
| "[Sb]": 200, |
| "[S-2]": 201, |
| "%12": 202, |
| "[P@@]": 203, |
| "[Si@H]": 204, |
| "[Mn+4]": 205, |
| "p": 206, |
| "[Ba]": 207, |
| "[NH2-]": 208, |
| "[Ge]": 209, |
| "[Pb+4]": 210, |
| "[Cr+3]": 211, |
| "[Au]": 212, |
| "[LiH]": 213, |
| "[Sc+3]": 214, |
| "[o+]": 215, |
| "[Rh-3]": 216, |
| "%13": 217, |
| "[Br]": 218, |
| "[Sb-]": 219, |
| "[S@+]": 220, |
| "[I+2]": 221, |
| "[Ar]": 222, |
| "[V]": 223, |
| "[Cu-]": 224, |
| "[Al-]": 225, |
| "[Te]": 226, |
| "[13c]": 227, |
| "[13C]": 228, |
| "[Cl]": 229, |
| "[PH4+]": 230, |
| "[SiH4]": 231, |
| "[te]": 232, |
| "[CH3-]": 233, |
| "[S@@+]": 234, |
| "[Rh+3]": 235, |
| "[SH+]": 236, |
| "[Bi+3]": 237, |
| "[Br+2]": 238, |
| "[La]": 239, |
| "[La+3]": 240, |
| "[Pt-2]": 241, |
| "[N@@]": 242, |
| "[PH3+]": 243, |
| "[N@]": 244, |
| "[Si+4]": 245, |
| "[Sr+2]": 246, |
| "[Al+]": 247, |
| "[Pb]": 248, |
| "[SeH]": 249, |
| "[Si-]": 250, |
| "[V+5]": 251, |
| "[Y+3]": 252, |
| "[Re]": 253, |
| "[Ru+]": 254, |
| "[Sm]": 255, |
| "*": 256, |
| "[3H]": 257, |
| "[NH2]": 258, |
| "[Ag-]": 259, |
| "[13CH3]": 260, |
| "[OH+]": 261, |
| "[Ru+3]": 262, |
| "[OH]": 263, |
| "[Gd+3]": 264, |
| "[13CH2]": 265, |
| "[In+3]": 266, |
| "[Si@@]": 267, |
| "[Si@]": 268, |
| "[Ti+2]": 269, |
| "[Sn+]": 270, |
| "[Cl+2]": 271, |
| "[AlH-]": 272, |
| "[Pd-2]": 273, |
| "[SnH3]": 274, |
| "[B+3]": 275, |
| "[Cu-2]": 276, |
| "[Nd+3]": 277, |
| "[Pb+3]": 278, |
| "[13cH]": 279, |
| "[Fe-4]": 280, |
| "[Ga]": 281, |
| "[Sn+4]": 282, |
| "[Hg+]": 283, |
| "[11CH3]": 284, |
| "[Hf]": 285, |
| "[Pr]": 286, |
| "[Y]": 287, |
| "[S+2]": 288, |
| "[Cd]": 289, |
| "[Cr+6]": 290, |
| "[Zr+3]": 291, |
| "[Rh+]": 292, |
| "[CH3]": 293, |
| "[N-3]": 294, |
| "[Hf+2]": 295, |
| "[Th]": 296, |
| "[Sb+3]": 297, |
| "%14": 298, |
| "[Cr+2]": 299, |
| "[Ru+2]": 300, |
| "[Hf+4]": 301, |
| "[14C]": 302, |
| "[Ta]": 303, |
| "[Tl+]": 304, |
| "[B+]": 305, |
| "[Os+4]": 306, |
| "[PdH2]": 307, |
| "[Pd-]": 308, |
| "[Cd+2]": 309, |
| "[Co+3]": 310, |
| "[S+4]": 311, |
| "[Nb+5]": 312, |
| "[123I]": 313, |
| "[c+]": 314, |
| "[Rb+]": 315, |
| "[V+2]": 316, |
| "[CH3+]": 317, |
| "[Ag+2]": 318, |
| "[cH+]": 319, |
| "[Mn+3]": 320, |
| "[Se-]": 321, |
| "[As-]": 322, |
| "[Eu+3]": 323, |
| "[SH2]": 324, |
| "[Sm+3]": 325, |
| "[IH+]": 326, |
| "%15": 327, |
| "[OH3+]": 328, |
| "[PH3]": 329, |
| "[IH2+]": 330, |
| "[SH2+]": 331, |
| "[Ir+3]": 332, |
| "[AlH3]": 333, |
| "[Sc]": 334, |
| "[Yb]": 335, |
| "[15NH2]": 336, |
| "[Lu]": 337, |
| "[sH+]": 338, |
| "[Gd]": 339, |
| "[18F-]": 340, |
| "[SH3+]": 341, |
| "[SnH4]": 342, |
| "[TeH]": 343, |
| "[Si@@H]": 344, |
| "[Ga+3]": 345, |
| "[CaH2]": 346, |
| "[Tl]": 347, |
| "[Ta+5]": 348, |
| "[GeH]": 349, |
| "[Br+]": 350, |
| "[Sr]": 351, |
| "[Tl+3]": 352, |
| "[Sm+2]": 353, |
| "[PH5]": 354, |
| "%16": 355, |
| "[N@@+]": 356, |
| "[Au+3]": 357, |
| "[C-4]": 358, |
| "[Nd]": 359, |
| "[Ti+]": 360, |
| "[IH]": 361, |
| "[N@+]": 362, |
| "[125I]": 363, |
| "[Eu]": 364, |
| "[Sn+3]": 365, |
| "[Nb]": 366, |
| "[Er+3]": 367, |
| "[123I-]": 368, |
| "[14c]": 369, |
| "%17": 370, |
| "[SnH2]": 371, |
| "[YH]": 372, |
| "[Sb+5]": 373, |
| "[Pr+3]": 374, |
| "[Ir+]": 375, |
| "[N+3]": 376, |
| "[AlH2]": 377, |
| "[19F]": 378, |
| "%18": 379, |
| "[Tb]": 380, |
| "[14CH]": 381, |
| "[Mo+4]": 382, |
| "[Si+]": 383, |
| "[BH]": 384, |
| "[Be]": 385, |
| "[Rb]": 386, |
| "[pH]": 387, |
| "%19": 388, |
| "%20": 389, |
| "[Xe]": 390, |
| "[Ir-]": 391, |
| "[Be+2]": 392, |
| "[C+4]": 393, |
| "[RuH2]": 394, |
| "[15NH]": 395, |
| "[U+2]": 396, |
| "[Au-]": 397, |
| "%21": 398, |
| "%22": 399, |
| "[Au+]": 400, |
| "[15n]": 401, |
| "[Al+2]": 402, |
| "[Tb+3]": 403, |
| "[15N]": 404, |
| "[V+3]": 405, |
| "[W+6]": 406, |
| "[14CH3]": 407, |
| "[Cr+4]": 408, |
| "[ClH+]": 409, |
| "b": 410, |
| "[Ti+6]": 411, |
| "[Nd+]": 412, |
| "[Zr+]": 413, |
| "[PH2+]": 414, |
| "[Fm]": 415, |
| "[N@H+]": 416, |
| "[RuH]": 417, |
| "[Dy+3]": 418, |
| "%23": 419, |
| "[Hf+3]": 420, |
| "[W+4]": 421, |
| "[11C]": 422, |
| "[13CH]": 423, |
| "[Er]": 424, |
| "[124I]": 425, |
| "[LaH]": 426, |
| "[F]": 427, |
| "[siH]": 428, |
| "[Ga+]": 429, |
| "[Cm]": 430, |
| "[GeH3]": 431, |
| "[IH-]": 432, |
| "[U+6]": 433, |
| "[SeH+]": 434, |
| "[32P]": 435, |
| "[SeH-]": 436, |
| "[Pt-]": 437, |
| "[Ir+2]": 438, |
| "[se+]": 439, |
| "[U]": 440, |
| "[F+]": 441, |
| "[BH2]": 442, |
| "[As+]": 443, |
| "[Cf]": 444, |
| "[ClH2+]": 445, |
| "[Ni+]": 446, |
| "[TeH3]": 447, |
| "[SbH2]": 448, |
| "[Ag+3]": 449, |
| "%24": 450, |
| "[18O]": 451, |
| "[PH4]": 452, |
| "[Os+2]": 453, |
| "[Na-]": 454, |
| "[Sb+2]": 455, |
| "[V+4]": 456, |
| "[Ho+3]": 457, |
| "[68Ga]": 458, |
| "[PH-]": 459, |
| "[Bi+2]": 460, |
| "[Ce+2]": 461, |
| "[Pd+3]": 462, |
| "[99Tc]": 463, |
| "[13C@@H]": 464, |
| "[Fe+6]": 465, |
| "[c]": 466, |
| "[GeH2]": 467, |
| "[10B]": 468, |
| "[Cu+3]": 469, |
| "[Mo+2]": 470, |
| "[Cr+]": 471, |
| "[Pd+4]": 472, |
| "[Dy]": 473, |
| "[AsH]": 474, |
| "[Ba+]": 475, |
| "[SeH2]": 476, |
| "[In+]": 477, |
| "[TeH2]": 478, |
| "[BrH+]": 479, |
| "[14cH]": 480, |
| "[W+]": 481, |
| "[13C@H]": 482, |
| "[AsH2]": 483, |
| "[In+2]": 484, |
| "[N+2]": 485, |
| "[N@@H+]": 486, |
| "[SbH]": 487, |
| "[60Co]": 488, |
| "[AsH4+]": 489, |
| "[AsH3]": 490, |
| "[18OH]": 491, |
| "[Ru-2]": 492, |
| "[Na-2]": 493, |
| "[CuH2]": 494, |
| "[31P]": 495, |
| "[Ti+5]": 496, |
| "[35S]": 497, |
| "[P@@H]": 498, |
| "[ArH]": 499, |
| "[Co+]": 500, |
| "[Zr-2]": 501, |
| "[BH2-]": 502, |
| "[131I]": 503, |
| "[SH5]": 504, |
| "[VH]": 505, |
| "[B+2]": 506, |
| "[Yb+2]": 507, |
| "[14C@H]": 508, |
| "[211At]": 509, |
| "[NH3+2]": 510, |
| "[IrH]": 511, |
| "[IrH2]": 512, |
| "[Rh-]": 513, |
| "[Cr-]": 514, |
| "[Sb+]": 515, |
| "[Ni+3]": 516, |
| "[TaH3]": 517, |
| "[Tl+2]": 518, |
| "[64Cu]": 519, |
| "[Tc]": 520, |
| "[Cd+]": 521, |
| "[1H]": 522, |
| "[15nH]": 523, |
| "[AlH2+]": 524, |
| "[FH+2]": 525, |
| "[BiH3]": 526, |
| "[Ru-]": 527, |
| "[Mo+6]": 528, |
| "[AsH+]": 529, |
| "[BaH2]": 530, |
| "[BaH]": 531, |
| "[Fe+4]": 532, |
| "[229Th]": 533, |
| "[Th+4]": 534, |
| "[As+3]": 535, |
| "[NH+3]": 536, |
| "[P@H]": 537, |
| "[Li-]": 538, |
| "[7NaH]": 539, |
| "[Bi+]": 540, |
| "[PtH+2]": 541, |
| "[p-]": 542, |
| "[Re+5]": 543, |
| "[NiH]": 544, |
| "[Ni-]": 545, |
| "[Xe+]": 546, |
| "[Ca+]": 547, |
| "[11c]": 548, |
| "[Rh+4]": 549, |
| "[AcH]": 550, |
| "[HeH]": 551, |
| "[Sc+2]": 552, |
| "[Mn+]": 553, |
| "[UH]": 554, |
| "[14CH2]": 555, |
| "[SiH4+]": 556, |
| "[18OH2]": 557, |
| "[Ac-]": 558, |
| "[Re+4]": 559, |
| "[118Sn]": 560, |
| "[153Sm]": 561, |
| "[P+2]": 562, |
| "[9CH]": 563, |
| "[9CH3]": 564, |
| "[Y-]": 565, |
| "[NiH2]": 566, |
| "[Si+2]": 567, |
| "[Mn+6]": 568, |
| "[ZrH2]": 569, |
| "[C-2]": 570, |
| "[Bi+5]": 571, |
| "[24NaH]": 572, |
| "[Fr]": 573, |
| "[15CH]": 574, |
| "[Se+]": 575, |
| "[At]": 576, |
| "[P-3]": 577, |
| "[124I-]": 578, |
| "[CuH2-]": 579, |
| "[Nb+4]": 580, |
| "[Nb+3]": 581, |
| "[MgH]": 582, |
| "[Ir+4]": 583, |
| "[67Ga+3]": 584, |
| "[67Ga]": 585, |
| "[13N]": 586, |
| "[15OH2]": 587, |
| "[2NH]": 588, |
| "[Ho]": 589, |
| "[Cn]": 590 |
| }, |
| "merges": [] |
| } |
| } |