{ | |
"version": "1.0", | |
"truncation": { | |
"direction": "Right", | |
"max_length": 512, | |
"strategy": "LongestFirst", | |
"stride": 0 | |
}, | |
"padding": { | |
"strategy": "BatchLongest", | |
"direction": "Right", | |
"pad_to_multiple_of": null, | |
"pad_id": 0, | |
"pad_type_id": 0, | |
"pad_token": "[PAD]" | |
}, | |
"added_tokens": [ | |
{ | |
"id": 0, | |
"content": "[PAD]", | |
"single_word": false, | |
"lstrip": false, | |
"rstrip": false, | |
"normalized": false, | |
"special": true | |
}, | |
{ | |
"id": 11, | |
"content": "[UNK]", | |
"single_word": false, | |
"lstrip": false, | |
"rstrip": false, | |
"normalized": false, | |
"special": true | |
}, | |
{ | |
"id": 12, | |
"content": "[CLS]", | |
"single_word": false, | |
"lstrip": false, | |
"rstrip": false, | |
"normalized": false, | |
"special": true | |
}, | |
{ | |
"id": 13, | |
"content": "[SEP]", | |
"single_word": false, | |
"lstrip": false, | |
"rstrip": false, | |
"normalized": false, | |
"special": true | |
}, | |
{ | |
"id": 14, | |
"content": "[MASK]", | |
"single_word": false, | |
"lstrip": true, | |
"rstrip": false, | |
"normalized": false, | |
"special": true | |
}, | |
{ | |
"id": 591, | |
"content": "<s>", | |
"single_word": false, | |
"lstrip": false, | |
"rstrip": false, | |
"normalized": true, | |
"special": true | |
}, | |
{ | |
"id": 592, | |
"content": "</s>", | |
"single_word": false, | |
"lstrip": false, | |
"rstrip": false, | |
"normalized": true, | |
"special": true | |
} | |
], | |
"normalizer": null, | |
"pre_tokenizer": { | |
"type": "ByteLevel", | |
"add_prefix_space": false, | |
"trim_offsets": true, | |
"use_regex": true | |
}, | |
"post_processor": { | |
"type": "RobertaProcessing", | |
"sep": [ | |
"[SEP]", | |
13 | |
], | |
"cls": [ | |
"[CLS]", | |
12 | |
], | |
"trim_offsets": true, | |
"add_prefix_space": false | |
}, | |
"decoder": { | |
"type": "ByteLevel", | |
"add_prefix_space": true, | |
"trim_offsets": true, | |
"use_regex": true | |
}, | |
"model": { | |
"type": "BPE", | |
"dropout": null, | |
"unk_token": null, | |
"continuing_subword_prefix": "", | |
"end_of_word_suffix": "", | |
"fuse_unk": false, | |
"byte_fallback": false, | |
"ignore_merges": false, | |
"vocab": { | |
"[PAD]": 0, | |
"[unused1]": 1, | |
"[unused2]": 2, | |
"[unused3]": 3, | |
"[unused4]": 4, | |
"[unused5]": 5, | |
"[unused6]": 6, | |
"[unused7]": 7, | |
"[unused8]": 8, | |
"[unused9]": 9, | |
"[unused10]": 10, | |
"[UNK]": 11, | |
"[CLS]": 12, | |
"[SEP]": 13, | |
"[MASK]": 14, | |
"c": 15, | |
"C": 16, | |
"(": 17, | |
")": 18, | |
"O": 19, | |
"1": 20, | |
"2": 21, | |
"=": 22, | |
"N": 23, | |
".": 24, | |
"n": 25, | |
"3": 26, | |
"F": 27, | |
"Cl": 28, | |
">>": 29, | |
"~": 30, | |
"-": 31, | |
"4": 32, | |
"[C@H]": 33, | |
"S": 34, | |
"[C@@H]": 35, | |
"[O-]": 36, | |
"Br": 37, | |
"#": 38, | |
"/": 39, | |
"[nH]": 40, | |
"[N+]": 41, | |
"s": 42, | |
"5": 43, | |
"o": 44, | |
"P": 45, | |
"[Na+]": 46, | |
"[Si]": 47, | |
"I": 48, | |
"[Na]": 49, | |
"[Pd]": 50, | |
"[K+]": 51, | |
"[K]": 52, | |
"[P]": 53, | |
"B": 54, | |
"[C@]": 55, | |
"[C@@]": 56, | |
"[Cl-]": 57, | |
"6": 58, | |
"[OH-]": 59, | |
"\\": 60, | |
"[N-]": 61, | |
"[Li]": 62, | |
"[H]": 63, | |
"[2H]": 64, | |
"[NH4+]": 65, | |
"[c-]": 66, | |
"[P-]": 67, | |
"[Cs+]": 68, | |
"[Li+]": 69, | |
"[Cs]": 70, | |
"[NaH]": 71, | |
"[H-]": 72, | |
"[O+]": 73, | |
"[BH4-]": 74, | |
"[Cu]": 75, | |
"7": 76, | |
"[Mg]": 77, | |
"[Fe+2]": 78, | |
"[n+]": 79, | |
"[Sn]": 80, | |
"[BH-]": 81, | |
"[Pd+2]": 82, | |
"[CH]": 83, | |
"[I-]": 84, | |
"[Br-]": 85, | |
"[C-]": 86, | |
"[Zn]": 87, | |
"[B-]": 88, | |
"[F-]": 89, | |
"[Al]": 90, | |
"[P+]": 91, | |
"[BH3-]": 92, | |
"[Fe]": 93, | |
"[C]": 94, | |
"[AlH4]": 95, | |
"[Ni]": 96, | |
"[SiH]": 97, | |
"8": 98, | |
"[Cu+2]": 99, | |
"[Mn]": 100, | |
"[AlH]": 101, | |
"[nH+]": 102, | |
"[AlH4-]": 103, | |
"[O-2]": 104, | |
"[Cr]": 105, | |
"[Mg+2]": 106, | |
"[NH3+]": 107, | |
"[S@]": 108, | |
"[Pt]": 109, | |
"[Al+3]": 110, | |
"[S@@]": 111, | |
"[S-]": 112, | |
"[Ti]": 113, | |
"[Zn+2]": 114, | |
"[PH]": 115, | |
"[NH2+]": 116, | |
"[Ru]": 117, | |
"[Ag+]": 118, | |
"[S+]": 119, | |
"[I+3]": 120, | |
"[NH+]": 121, | |
"[Ca+2]": 122, | |
"[Ag]": 123, | |
"9": 124, | |
"[Os]": 125, | |
"[Se]": 126, | |
"[SiH2]": 127, | |
"[Ca]": 128, | |
"[Ti+4]": 129, | |
"[Ac]": 130, | |
"[Cu+]": 131, | |
"[S]": 132, | |
"[Rh]": 133, | |
"[Cl+3]": 134, | |
"[cH-]": 135, | |
"[Zn+]": 136, | |
"[O]": 137, | |
"[Cl+]": 138, | |
"[SH]": 139, | |
"[H+]": 140, | |
"[Pd+]": 141, | |
"[se]": 142, | |
"[PH+]": 143, | |
"[I]": 144, | |
"[Pt+2]": 145, | |
"[C+]": 146, | |
"[Mg+]": 147, | |
"[Hg]": 148, | |
"[W]": 149, | |
"[SnH]": 150, | |
"[SiH3]": 151, | |
"[Fe+3]": 152, | |
"[NH]": 153, | |
"[Mo]": 154, | |
"[CH2+]": 155, | |
"%10": 156, | |
"[CH2-]": 157, | |
"[CH2]": 158, | |
"[n-]": 159, | |
"[Ce+4]": 160, | |
"[NH-]": 161, | |
"[Co]": 162, | |
"[I+]": 163, | |
"[PH2]": 164, | |
"[Pt+4]": 165, | |
"[Ce]": 166, | |
"[B]": 167, | |
"[Sn+2]": 168, | |
"[Ba+2]": 169, | |
"%11": 170, | |
"[Fe-3]": 171, | |
"[18F]": 172, | |
"[SH-]": 173, | |
"[Pb+2]": 174, | |
"[Os-2]": 175, | |
"[Zr+4]": 176, | |
"[N]": 177, | |
"[Ir]": 178, | |
"[Bi]": 179, | |
"[Ni+2]": 180, | |
"[P@]": 181, | |
"[Co+2]": 182, | |
"[s+]": 183, | |
"[As]": 184, | |
"[P+3]": 185, | |
"[Hg+2]": 186, | |
"[Yb+3]": 187, | |
"[CH-]": 188, | |
"[Zr+2]": 189, | |
"[Mn+2]": 190, | |
"[CH+]": 191, | |
"[In]": 192, | |
"[KH]": 193, | |
"[Ce+3]": 194, | |
"[Zr]": 195, | |
"[AlH2-]": 196, | |
"[OH2+]": 197, | |
"[Ti+3]": 198, | |
"[Rh+2]": 199, | |
"[Sb]": 200, | |
"[S-2]": 201, | |
"%12": 202, | |
"[P@@]": 203, | |
"[Si@H]": 204, | |
"[Mn+4]": 205, | |
"p": 206, | |
"[Ba]": 207, | |
"[NH2-]": 208, | |
"[Ge]": 209, | |
"[Pb+4]": 210, | |
"[Cr+3]": 211, | |
"[Au]": 212, | |
"[LiH]": 213, | |
"[Sc+3]": 214, | |
"[o+]": 215, | |
"[Rh-3]": 216, | |
"%13": 217, | |
"[Br]": 218, | |
"[Sb-]": 219, | |
"[S@+]": 220, | |
"[I+2]": 221, | |
"[Ar]": 222, | |
"[V]": 223, | |
"[Cu-]": 224, | |
"[Al-]": 225, | |
"[Te]": 226, | |
"[13c]": 227, | |
"[13C]": 228, | |
"[Cl]": 229, | |
"[PH4+]": 230, | |
"[SiH4]": 231, | |
"[te]": 232, | |
"[CH3-]": 233, | |
"[S@@+]": 234, | |
"[Rh+3]": 235, | |
"[SH+]": 236, | |
"[Bi+3]": 237, | |
"[Br+2]": 238, | |
"[La]": 239, | |
"[La+3]": 240, | |
"[Pt-2]": 241, | |
"[N@@]": 242, | |
"[PH3+]": 243, | |
"[N@]": 244, | |
"[Si+4]": 245, | |
"[Sr+2]": 246, | |
"[Al+]": 247, | |
"[Pb]": 248, | |
"[SeH]": 249, | |
"[Si-]": 250, | |
"[V+5]": 251, | |
"[Y+3]": 252, | |
"[Re]": 253, | |
"[Ru+]": 254, | |
"[Sm]": 255, | |
"*": 256, | |
"[3H]": 257, | |
"[NH2]": 258, | |
"[Ag-]": 259, | |
"[13CH3]": 260, | |
"[OH+]": 261, | |
"[Ru+3]": 262, | |
"[OH]": 263, | |
"[Gd+3]": 264, | |
"[13CH2]": 265, | |
"[In+3]": 266, | |
"[Si@@]": 267, | |
"[Si@]": 268, | |
"[Ti+2]": 269, | |
"[Sn+]": 270, | |
"[Cl+2]": 271, | |
"[AlH-]": 272, | |
"[Pd-2]": 273, | |
"[SnH3]": 274, | |
"[B+3]": 275, | |
"[Cu-2]": 276, | |
"[Nd+3]": 277, | |
"[Pb+3]": 278, | |
"[13cH]": 279, | |
"[Fe-4]": 280, | |
"[Ga]": 281, | |
"[Sn+4]": 282, | |
"[Hg+]": 283, | |
"[11CH3]": 284, | |
"[Hf]": 285, | |
"[Pr]": 286, | |
"[Y]": 287, | |
"[S+2]": 288, | |
"[Cd]": 289, | |
"[Cr+6]": 290, | |
"[Zr+3]": 291, | |
"[Rh+]": 292, | |
"[CH3]": 293, | |
"[N-3]": 294, | |
"[Hf+2]": 295, | |
"[Th]": 296, | |
"[Sb+3]": 297, | |
"%14": 298, | |
"[Cr+2]": 299, | |
"[Ru+2]": 300, | |
"[Hf+4]": 301, | |
"[14C]": 302, | |
"[Ta]": 303, | |
"[Tl+]": 304, | |
"[B+]": 305, | |
"[Os+4]": 306, | |
"[PdH2]": 307, | |
"[Pd-]": 308, | |
"[Cd+2]": 309, | |
"[Co+3]": 310, | |
"[S+4]": 311, | |
"[Nb+5]": 312, | |
"[123I]": 313, | |
"[c+]": 314, | |
"[Rb+]": 315, | |
"[V+2]": 316, | |
"[CH3+]": 317, | |
"[Ag+2]": 318, | |
"[cH+]": 319, | |
"[Mn+3]": 320, | |
"[Se-]": 321, | |
"[As-]": 322, | |
"[Eu+3]": 323, | |
"[SH2]": 324, | |
"[Sm+3]": 325, | |
"[IH+]": 326, | |
"%15": 327, | |
"[OH3+]": 328, | |
"[PH3]": 329, | |
"[IH2+]": 330, | |
"[SH2+]": 331, | |
"[Ir+3]": 332, | |
"[AlH3]": 333, | |
"[Sc]": 334, | |
"[Yb]": 335, | |
"[15NH2]": 336, | |
"[Lu]": 337, | |
"[sH+]": 338, | |
"[Gd]": 339, | |
"[18F-]": 340, | |
"[SH3+]": 341, | |
"[SnH4]": 342, | |
"[TeH]": 343, | |
"[Si@@H]": 344, | |
"[Ga+3]": 345, | |
"[CaH2]": 346, | |
"[Tl]": 347, | |
"[Ta+5]": 348, | |
"[GeH]": 349, | |
"[Br+]": 350, | |
"[Sr]": 351, | |
"[Tl+3]": 352, | |
"[Sm+2]": 353, | |
"[PH5]": 354, | |
"%16": 355, | |
"[N@@+]": 356, | |
"[Au+3]": 357, | |
"[C-4]": 358, | |
"[Nd]": 359, | |
"[Ti+]": 360, | |
"[IH]": 361, | |
"[N@+]": 362, | |
"[125I]": 363, | |
"[Eu]": 364, | |
"[Sn+3]": 365, | |
"[Nb]": 366, | |
"[Er+3]": 367, | |
"[123I-]": 368, | |
"[14c]": 369, | |
"%17": 370, | |
"[SnH2]": 371, | |
"[YH]": 372, | |
"[Sb+5]": 373, | |
"[Pr+3]": 374, | |
"[Ir+]": 375, | |
"[N+3]": 376, | |
"[AlH2]": 377, | |
"[19F]": 378, | |
"%18": 379, | |
"[Tb]": 380, | |
"[14CH]": 381, | |
"[Mo+4]": 382, | |
"[Si+]": 383, | |
"[BH]": 384, | |
"[Be]": 385, | |
"[Rb]": 386, | |
"[pH]": 387, | |
"%19": 388, | |
"%20": 389, | |
"[Xe]": 390, | |
"[Ir-]": 391, | |
"[Be+2]": 392, | |
"[C+4]": 393, | |
"[RuH2]": 394, | |
"[15NH]": 395, | |
"[U+2]": 396, | |
"[Au-]": 397, | |
"%21": 398, | |
"%22": 399, | |
"[Au+]": 400, | |
"[15n]": 401, | |
"[Al+2]": 402, | |
"[Tb+3]": 403, | |
"[15N]": 404, | |
"[V+3]": 405, | |
"[W+6]": 406, | |
"[14CH3]": 407, | |
"[Cr+4]": 408, | |
"[ClH+]": 409, | |
"b": 410, | |
"[Ti+6]": 411, | |
"[Nd+]": 412, | |
"[Zr+]": 413, | |
"[PH2+]": 414, | |
"[Fm]": 415, | |
"[N@H+]": 416, | |
"[RuH]": 417, | |
"[Dy+3]": 418, | |
"%23": 419, | |
"[Hf+3]": 420, | |
"[W+4]": 421, | |
"[11C]": 422, | |
"[13CH]": 423, | |
"[Er]": 424, | |
"[124I]": 425, | |
"[LaH]": 426, | |
"[F]": 427, | |
"[siH]": 428, | |
"[Ga+]": 429, | |
"[Cm]": 430, | |
"[GeH3]": 431, | |
"[IH-]": 432, | |
"[U+6]": 433, | |
"[SeH+]": 434, | |
"[32P]": 435, | |
"[SeH-]": 436, | |
"[Pt-]": 437, | |
"[Ir+2]": 438, | |
"[se+]": 439, | |
"[U]": 440, | |
"[F+]": 441, | |
"[BH2]": 442, | |
"[As+]": 443, | |
"[Cf]": 444, | |
"[ClH2+]": 445, | |
"[Ni+]": 446, | |
"[TeH3]": 447, | |
"[SbH2]": 448, | |
"[Ag+3]": 449, | |
"%24": 450, | |
"[18O]": 451, | |
"[PH4]": 452, | |
"[Os+2]": 453, | |
"[Na-]": 454, | |
"[Sb+2]": 455, | |
"[V+4]": 456, | |
"[Ho+3]": 457, | |
"[68Ga]": 458, | |
"[PH-]": 459, | |
"[Bi+2]": 460, | |
"[Ce+2]": 461, | |
"[Pd+3]": 462, | |
"[99Tc]": 463, | |
"[13C@@H]": 464, | |
"[Fe+6]": 465, | |
"[c]": 466, | |
"[GeH2]": 467, | |
"[10B]": 468, | |
"[Cu+3]": 469, | |
"[Mo+2]": 470, | |
"[Cr+]": 471, | |
"[Pd+4]": 472, | |
"[Dy]": 473, | |
"[AsH]": 474, | |
"[Ba+]": 475, | |
"[SeH2]": 476, | |
"[In+]": 477, | |
"[TeH2]": 478, | |
"[BrH+]": 479, | |
"[14cH]": 480, | |
"[W+]": 481, | |
"[13C@H]": 482, | |
"[AsH2]": 483, | |
"[In+2]": 484, | |
"[N+2]": 485, | |
"[N@@H+]": 486, | |
"[SbH]": 487, | |
"[60Co]": 488, | |
"[AsH4+]": 489, | |
"[AsH3]": 490, | |
"[18OH]": 491, | |
"[Ru-2]": 492, | |
"[Na-2]": 493, | |
"[CuH2]": 494, | |
"[31P]": 495, | |
"[Ti+5]": 496, | |
"[35S]": 497, | |
"[P@@H]": 498, | |
"[ArH]": 499, | |
"[Co+]": 500, | |
"[Zr-2]": 501, | |
"[BH2-]": 502, | |
"[131I]": 503, | |
"[SH5]": 504, | |
"[VH]": 505, | |
"[B+2]": 506, | |
"[Yb+2]": 507, | |
"[14C@H]": 508, | |
"[211At]": 509, | |
"[NH3+2]": 510, | |
"[IrH]": 511, | |
"[IrH2]": 512, | |
"[Rh-]": 513, | |
"[Cr-]": 514, | |
"[Sb+]": 515, | |
"[Ni+3]": 516, | |
"[TaH3]": 517, | |
"[Tl+2]": 518, | |
"[64Cu]": 519, | |
"[Tc]": 520, | |
"[Cd+]": 521, | |
"[1H]": 522, | |
"[15nH]": 523, | |
"[AlH2+]": 524, | |
"[FH+2]": 525, | |
"[BiH3]": 526, | |
"[Ru-]": 527, | |
"[Mo+6]": 528, | |
"[AsH+]": 529, | |
"[BaH2]": 530, | |
"[BaH]": 531, | |
"[Fe+4]": 532, | |
"[229Th]": 533, | |
"[Th+4]": 534, | |
"[As+3]": 535, | |
"[NH+3]": 536, | |
"[P@H]": 537, | |
"[Li-]": 538, | |
"[7NaH]": 539, | |
"[Bi+]": 540, | |
"[PtH+2]": 541, | |
"[p-]": 542, | |
"[Re+5]": 543, | |
"[NiH]": 544, | |
"[Ni-]": 545, | |
"[Xe+]": 546, | |
"[Ca+]": 547, | |
"[11c]": 548, | |
"[Rh+4]": 549, | |
"[AcH]": 550, | |
"[HeH]": 551, | |
"[Sc+2]": 552, | |
"[Mn+]": 553, | |
"[UH]": 554, | |
"[14CH2]": 555, | |
"[SiH4+]": 556, | |
"[18OH2]": 557, | |
"[Ac-]": 558, | |
"[Re+4]": 559, | |
"[118Sn]": 560, | |
"[153Sm]": 561, | |
"[P+2]": 562, | |
"[9CH]": 563, | |
"[9CH3]": 564, | |
"[Y-]": 565, | |
"[NiH2]": 566, | |
"[Si+2]": 567, | |
"[Mn+6]": 568, | |
"[ZrH2]": 569, | |
"[C-2]": 570, | |
"[Bi+5]": 571, | |
"[24NaH]": 572, | |
"[Fr]": 573, | |
"[15CH]": 574, | |
"[Se+]": 575, | |
"[At]": 576, | |
"[P-3]": 577, | |
"[124I-]": 578, | |
"[CuH2-]": 579, | |
"[Nb+4]": 580, | |
"[Nb+3]": 581, | |
"[MgH]": 582, | |
"[Ir+4]": 583, | |
"[67Ga+3]": 584, | |
"[67Ga]": 585, | |
"[13N]": 586, | |
"[15OH2]": 587, | |
"[2NH]": 588, | |
"[Ho]": 589, | |
"[Cn]": 590 | |
}, | |
"merges": [] | |
} | |
} |