commit 6dd5bb7b8d117c82d06993bac2dbbdce921c7bad Author: ModelHub XC Date: Sat May 30 23:22:19 2026 +0800 初始化项目,由ModelHub XC社区提供模型 Model: wudejian789/MolMetaLM-base Source: Original Platform diff --git a/.gitattributes b/.gitattributes new file mode 100644 index 0000000..a6344aa --- /dev/null +++ b/.gitattributes @@ -0,0 +1,35 @@ +*.7z filter=lfs diff=lfs merge=lfs -text +*.arrow filter=lfs diff=lfs merge=lfs -text +*.bin filter=lfs diff=lfs merge=lfs -text +*.bz2 filter=lfs diff=lfs merge=lfs -text +*.ckpt filter=lfs diff=lfs merge=lfs -text +*.ftz filter=lfs diff=lfs merge=lfs -text +*.gz filter=lfs diff=lfs merge=lfs -text +*.h5 filter=lfs diff=lfs merge=lfs -text +*.joblib filter=lfs diff=lfs merge=lfs -text +*.lfs.* filter=lfs diff=lfs merge=lfs -text +*.mlmodel filter=lfs diff=lfs merge=lfs -text +*.model filter=lfs diff=lfs merge=lfs -text +*.msgpack filter=lfs diff=lfs merge=lfs -text +*.npy filter=lfs diff=lfs merge=lfs -text +*.npz filter=lfs diff=lfs merge=lfs -text +*.onnx filter=lfs diff=lfs merge=lfs -text +*.ot filter=lfs diff=lfs merge=lfs -text +*.parquet filter=lfs diff=lfs merge=lfs -text +*.pb filter=lfs diff=lfs merge=lfs -text +*.pickle filter=lfs diff=lfs merge=lfs -text +*.pkl filter=lfs diff=lfs merge=lfs -text +*.pt filter=lfs diff=lfs merge=lfs -text +*.pth filter=lfs diff=lfs merge=lfs -text +*.rar filter=lfs diff=lfs merge=lfs -text +*.safetensors filter=lfs diff=lfs merge=lfs -text +saved_model/**/* filter=lfs diff=lfs merge=lfs -text +*.tar.* filter=lfs diff=lfs merge=lfs -text +*.tar filter=lfs diff=lfs merge=lfs -text +*.tflite filter=lfs diff=lfs merge=lfs -text +*.tgz filter=lfs diff=lfs merge=lfs -text +*.wasm filter=lfs diff=lfs merge=lfs -text +*.xz filter=lfs diff=lfs merge=lfs -text +*.zip filter=lfs diff=lfs merge=lfs -text +*.zst filter=lfs diff=lfs merge=lfs -text +*tfevents* filter=lfs diff=lfs merge=lfs -text diff --git a/README.md b/README.md new file mode 100644 index 0000000..a4b9539 --- /dev/null +++ b/README.md @@ -0,0 +1,26 @@ +--- +pipeline_tag: text-generation +tags: +- Molecule Language Model +- Physicochemical Knowledge +--- + +refer to https://github.com/CSUBioGroup/MolMetaLM for more details. + +# Usage + +## Prepare tokenizer and model +```python +from transformers import AutoTokenizer, AutoModel +tokenizer = AutoTokenizer.from_pretrained('wudejian789/MolMetaLM-base') +model = AutoModel.from_pretrained('wudejian789/MolMetaLM-base') +``` + +## Obtain molecular representations from SMILES +```python +smi = "COc1cc2c(cc1OC)CC([NH3+])C2" +tokenized_smi = tokenizer(" ".join(list(smi)), return_token_type_ids=False, + return_tensors='pt', max_length=512, padding='longest', truncation=True) +emb_smi = model(**tokenized_smi).last_hidden_state +print(emb_smi.shape) # batch size, seq length, embedding size +``` diff --git a/added_tokens.json b/added_tokens.json new file mode 100644 index 0000000..9662eac --- /dev/null +++ b/added_tokens.json @@ -0,0 +1,782 @@ +{ + ",": 489, + ";": 488, + "[(AAD)ATOM:Ac]": 638, + "[(AAD)ATOM:Ag]": 639, + "[(AAD)ATOM:Al]": 640, + "[(AAD)ATOM:Am]": 641, + "[(AAD)ATOM:Ar]": 642, + "[(AAD)ATOM:As]": 643, + "[(AAD)ATOM:At]": 644, + "[(AAD)ATOM:Au]": 645, + "[(AAD)ATOM:B]": 646, + "[(AAD)ATOM:Ba]": 647, + "[(AAD)ATOM:Be]": 648, + "[(AAD)ATOM:Bi]": 649, + "[(AAD)ATOM:Bk]": 650, + "[(AAD)ATOM:Br]": 651, + "[(AAD)ATOM:C]": 652, + "[(AAD)ATOM:Ca]": 653, + "[(AAD)ATOM:Cd]": 654, + "[(AAD)ATOM:Ce]": 655, + "[(AAD)ATOM:Cf]": 656, + "[(AAD)ATOM:Cl]": 657, + "[(AAD)ATOM:Cm]": 658, + "[(AAD)ATOM:Co]": 659, + "[(AAD)ATOM:Cr]": 660, + "[(AAD)ATOM:Cs]": 661, + "[(AAD)ATOM:Cu]": 662, + "[(AAD)ATOM:Dy]": 663, + "[(AAD)ATOM:Er]": 664, + "[(AAD)ATOM:Es]": 665, + "[(AAD)ATOM:Eu]": 666, + "[(AAD)ATOM:F]": 667, + "[(AAD)ATOM:Fe]": 668, + "[(AAD)ATOM:Fm]": 669, + "[(AAD)ATOM:Ga]": 670, + "[(AAD)ATOM:Gd]": 671, + "[(AAD)ATOM:Ge]": 672, + "[(AAD)ATOM:He]": 673, + "[(AAD)ATOM:Hf]": 674, + "[(AAD)ATOM:Hg]": 675, + "[(AAD)ATOM:Ho]": 676, + "[(AAD)ATOM:I]": 677, + "[(AAD)ATOM:In]": 678, + "[(AAD)ATOM:Ir]": 679, + "[(AAD)ATOM:K]": 680, + "[(AAD)ATOM:Kr]": 681, + "[(AAD)ATOM:La]": 682, + "[(AAD)ATOM:Li]": 683, + "[(AAD)ATOM:Lr]": 684, + "[(AAD)ATOM:Lu]": 685, + "[(AAD)ATOM:Md]": 686, + "[(AAD)ATOM:Mg]": 687, + "[(AAD)ATOM:Mn]": 688, + "[(AAD)ATOM:Mo]": 689, + "[(AAD)ATOM:N]": 690, + "[(AAD)ATOM:Na]": 691, + "[(AAD)ATOM:Nb]": 692, + "[(AAD)ATOM:Nd]": 693, + "[(AAD)ATOM:Ne]": 694, + "[(AAD)ATOM:Ni]": 695, + "[(AAD)ATOM:No]": 696, + "[(AAD)ATOM:Np]": 697, + "[(AAD)ATOM:O]": 698, + "[(AAD)ATOM:Os]": 699, + "[(AAD)ATOM:P]": 700, + "[(AAD)ATOM:Pa]": 701, + "[(AAD)ATOM:Pb]": 702, + "[(AAD)ATOM:Pd]": 703, + "[(AAD)ATOM:Pm]": 704, + "[(AAD)ATOM:Po]": 705, + "[(AAD)ATOM:Pr]": 706, + "[(AAD)ATOM:Pt]": 707, + "[(AAD)ATOM:Pu]": 708, + "[(AAD)ATOM:Rb]": 709, + "[(AAD)ATOM:Re]": 710, + "[(AAD)ATOM:Rh]": 711, + "[(AAD)ATOM:Rn]": 712, + "[(AAD)ATOM:Ru]": 713, + "[(AAD)ATOM:S]": 714, + "[(AAD)ATOM:Sb]": 715, + "[(AAD)ATOM:Sc]": 716, + "[(AAD)ATOM:Se]": 717, + "[(AAD)ATOM:Si]": 718, + "[(AAD)ATOM:Sm]": 719, + "[(AAD)ATOM:Sn]": 720, + "[(AAD)ATOM:Sr]": 721, + "[(AAD)ATOM:Ta]": 722, + "[(AAD)ATOM:Tb]": 723, + "[(AAD)ATOM:Tc]": 724, + "[(AAD)ATOM:Te]": 725, + "[(AAD)ATOM:Th]": 726, + "[(AAD)ATOM:Ti]": 727, + "[(AAD)ATOM:Tl]": 728, + "[(AAD)ATOM:Tm]": 729, + "[(AAD)ATOM:U]": 730, + "[(AAD)ATOM:V]": 731, + "[(AAD)ATOM:W]": 732, + "[(AAD)ATOM:Xe]": 733, + "[(AAD)ATOM:Y]": 734, + "[(AAD)ATOM:Yb]": 735, + "[(AAD)ATOM:Zn]": 736, + "[(AAD)ATOM:Zr]": 737, + "[(DDD)ATOM:Ac]": 538, + "[(DDD)ATOM:Ag]": 539, + "[(DDD)ATOM:Al]": 540, + "[(DDD)ATOM:Am]": 541, + "[(DDD)ATOM:Ar]": 542, + "[(DDD)ATOM:As]": 543, + "[(DDD)ATOM:At]": 544, + "[(DDD)ATOM:Au]": 545, + "[(DDD)ATOM:B]": 546, + "[(DDD)ATOM:Ba]": 547, + "[(DDD)ATOM:Be]": 548, + "[(DDD)ATOM:Bi]": 549, + "[(DDD)ATOM:Bk]": 550, + "[(DDD)ATOM:Br]": 551, + "[(DDD)ATOM:C]": 552, + "[(DDD)ATOM:Ca]": 553, + "[(DDD)ATOM:Cd]": 554, + "[(DDD)ATOM:Ce]": 555, + "[(DDD)ATOM:Cf]": 556, + "[(DDD)ATOM:Cl]": 557, + "[(DDD)ATOM:Cm]": 558, + "[(DDD)ATOM:Co]": 559, + "[(DDD)ATOM:Cr]": 560, + "[(DDD)ATOM:Cs]": 561, + "[(DDD)ATOM:Cu]": 562, + "[(DDD)ATOM:Dy]": 563, + "[(DDD)ATOM:Er]": 564, + "[(DDD)ATOM:Es]": 565, + "[(DDD)ATOM:Eu]": 566, + "[(DDD)ATOM:F]": 567, + "[(DDD)ATOM:Fe]": 568, + "[(DDD)ATOM:Fm]": 569, + "[(DDD)ATOM:Ga]": 570, + "[(DDD)ATOM:Gd]": 571, + "[(DDD)ATOM:Ge]": 572, + "[(DDD)ATOM:He]": 573, + "[(DDD)ATOM:Hf]": 574, + "[(DDD)ATOM:Hg]": 575, + "[(DDD)ATOM:Ho]": 576, + "[(DDD)ATOM:I]": 577, + "[(DDD)ATOM:In]": 578, + "[(DDD)ATOM:Ir]": 579, + "[(DDD)ATOM:K]": 580, + "[(DDD)ATOM:Kr]": 581, + "[(DDD)ATOM:La]": 582, + "[(DDD)ATOM:Li]": 583, + "[(DDD)ATOM:Lr]": 584, + "[(DDD)ATOM:Lu]": 585, + "[(DDD)ATOM:Md]": 586, + "[(DDD)ATOM:Mg]": 587, + "[(DDD)ATOM:Mn]": 588, + "[(DDD)ATOM:Mo]": 589, + "[(DDD)ATOM:N]": 590, + "[(DDD)ATOM:Na]": 591, + "[(DDD)ATOM:Nb]": 592, + "[(DDD)ATOM:Nd]": 593, + "[(DDD)ATOM:Ne]": 594, + "[(DDD)ATOM:Ni]": 595, + "[(DDD)ATOM:No]": 596, + "[(DDD)ATOM:Np]": 597, + "[(DDD)ATOM:O]": 598, + "[(DDD)ATOM:Os]": 599, + "[(DDD)ATOM:P]": 600, + "[(DDD)ATOM:Pa]": 601, + "[(DDD)ATOM:Pb]": 602, + "[(DDD)ATOM:Pd]": 603, + "[(DDD)ATOM:Pm]": 604, + "[(DDD)ATOM:Po]": 605, + "[(DDD)ATOM:Pr]": 606, + "[(DDD)ATOM:Pt]": 607, + "[(DDD)ATOM:Pu]": 608, + "[(DDD)ATOM:Rb]": 609, + "[(DDD)ATOM:Re]": 610, + "[(DDD)ATOM:Rh]": 611, + "[(DDD)ATOM:Rn]": 612, + "[(DDD)ATOM:Ru]": 613, + "[(DDD)ATOM:S]": 614, + "[(DDD)ATOM:Sb]": 615, + "[(DDD)ATOM:Sc]": 616, + "[(DDD)ATOM:Se]": 617, + "[(DDD)ATOM:Si]": 618, + "[(DDD)ATOM:Sm]": 619, + "[(DDD)ATOM:Sn]": 620, + "[(DDD)ATOM:Sr]": 621, + "[(DDD)ATOM:Ta]": 622, + "[(DDD)ATOM:Tb]": 623, + "[(DDD)ATOM:Tc]": 624, + "[(DDD)ATOM:Te]": 625, + "[(DDD)ATOM:Th]": 626, + "[(DDD)ATOM:Ti]": 627, + "[(DDD)ATOM:Tl]": 628, + "[(DDD)ATOM:Tm]": 629, + "[(DDD)ATOM:U]": 630, + "[(DDD)ATOM:V]": 631, + "[(DDD)ATOM:W]": 632, + "[(DDD)ATOM:Xe]": 633, + "[(DDD)ATOM:Y]": 634, + "[(DDD)ATOM:Yb]": 635, + "[(DDD)ATOM:Zn]": 636, + "[(DDD)ATOM:Zr]": 637, + "[(XYZ)ATOM:Ac]": 738, + "[(XYZ)ATOM:Ag]": 739, + "[(XYZ)ATOM:Al]": 740, + "[(XYZ)ATOM:Am]": 741, + "[(XYZ)ATOM:Ar]": 742, + "[(XYZ)ATOM:As]": 743, + "[(XYZ)ATOM:At]": 744, + "[(XYZ)ATOM:Au]": 745, + "[(XYZ)ATOM:B]": 746, + "[(XYZ)ATOM:Ba]": 747, + "[(XYZ)ATOM:Be]": 748, + "[(XYZ)ATOM:Bi]": 749, + "[(XYZ)ATOM:Bk]": 750, + "[(XYZ)ATOM:Br]": 751, + "[(XYZ)ATOM:C]": 752, + "[(XYZ)ATOM:Ca]": 753, + "[(XYZ)ATOM:Cd]": 754, + "[(XYZ)ATOM:Ce]": 755, + "[(XYZ)ATOM:Cf]": 756, + "[(XYZ)ATOM:Cl]": 757, + "[(XYZ)ATOM:Cm]": 758, + "[(XYZ)ATOM:Co]": 759, + "[(XYZ)ATOM:Cr]": 760, + "[(XYZ)ATOM:Cs]": 761, + "[(XYZ)ATOM:Cu]": 762, + "[(XYZ)ATOM:Dy]": 763, + "[(XYZ)ATOM:Er]": 764, + "[(XYZ)ATOM:Es]": 765, + "[(XYZ)ATOM:Eu]": 766, + "[(XYZ)ATOM:F]": 767, + "[(XYZ)ATOM:Fe]": 768, + "[(XYZ)ATOM:Fm]": 769, + "[(XYZ)ATOM:Ga]": 770, + "[(XYZ)ATOM:Gd]": 771, + "[(XYZ)ATOM:Ge]": 772, + "[(XYZ)ATOM:He]": 773, + "[(XYZ)ATOM:Hf]": 774, + "[(XYZ)ATOM:Hg]": 775, + "[(XYZ)ATOM:Ho]": 776, + "[(XYZ)ATOM:I]": 777, + "[(XYZ)ATOM:In]": 778, + "[(XYZ)ATOM:Ir]": 779, + "[(XYZ)ATOM:K]": 780, + "[(XYZ)ATOM:Kr]": 781, + "[(XYZ)ATOM:La]": 782, + "[(XYZ)ATOM:Li]": 783, + "[(XYZ)ATOM:Lr]": 784, + "[(XYZ)ATOM:Lu]": 785, + "[(XYZ)ATOM:Md]": 786, + "[(XYZ)ATOM:Mg]": 787, + "[(XYZ)ATOM:Mn]": 788, + "[(XYZ)ATOM:Mo]": 789, + "[(XYZ)ATOM:N]": 790, + "[(XYZ)ATOM:Na]": 791, + "[(XYZ)ATOM:Nb]": 792, + "[(XYZ)ATOM:Nd]": 793, + "[(XYZ)ATOM:Ne]": 794, + "[(XYZ)ATOM:Ni]": 795, + "[(XYZ)ATOM:No]": 796, + "[(XYZ)ATOM:Np]": 797, + "[(XYZ)ATOM:O]": 798, + "[(XYZ)ATOM:Os]": 799, + "[(XYZ)ATOM:P]": 800, + "[(XYZ)ATOM:Pa]": 801, + "[(XYZ)ATOM:Pb]": 802, + "[(XYZ)ATOM:Pd]": 803, + "[(XYZ)ATOM:Pm]": 804, + "[(XYZ)ATOM:Po]": 805, + "[(XYZ)ATOM:Pr]": 806, + "[(XYZ)ATOM:Pt]": 807, + "[(XYZ)ATOM:Pu]": 808, + "[(XYZ)ATOM:Rb]": 809, + "[(XYZ)ATOM:Re]": 810, + "[(XYZ)ATOM:Rh]": 811, + "[(XYZ)ATOM:Rn]": 812, + "[(XYZ)ATOM:Ru]": 813, + "[(XYZ)ATOM:S]": 814, + "[(XYZ)ATOM:Sb]": 815, + "[(XYZ)ATOM:Sc]": 816, + "[(XYZ)ATOM:Se]": 817, + "[(XYZ)ATOM:Si]": 818, + "[(XYZ)ATOM:Sm]": 819, + "[(XYZ)ATOM:Sn]": 820, + "[(XYZ)ATOM:Sr]": 821, + "[(XYZ)ATOM:Ta]": 822, + "[(XYZ)ATOM:Tb]": 823, + "[(XYZ)ATOM:Tc]": 824, + "[(XYZ)ATOM:Te]": 825, + "[(XYZ)ATOM:Th]": 826, + "[(XYZ)ATOM:Ti]": 827, + "[(XYZ)ATOM:Tl]": 828, + "[(XYZ)ATOM:Tm]": 829, + "[(XYZ)ATOM:U]": 830, + "[(XYZ)ATOM:V]": 831, + "[(XYZ)ATOM:W]": 832, + "[(XYZ)ATOM:Xe]": 833, + "[(XYZ)ATOM:Y]": 834, + "[(XYZ)ATOM:Yb]": 835, + "[(XYZ)ATOM:Zn]": 836, + "[(XYZ)ATOM:Zr]": 837, + "[BITS]": 847, + "[CLS]": 850, + "[CUSPRO]": 848, + "[FPR:Avalon]": 842, + "[FPR:ECFP]": 840, + "[FPR:FCFP]": 841, + "[FPR:MACCS]": 838, + "[FPR:Toplogical]": 839, + "[QM9:A_RC]": 71, + "[QM9:B_RC]": 72, + "[QM9:C_RC]": 73, + "[QM9:Cv_HCat298.15K]": 85, + "[QM9:G_FEat298.15K]": 84, + "[QM9:H_Eat298.15K]": 83, + "[QM9:R2_ESE]": 79, + "[QM9:U_IEat298.15K]": 82, + "[QM9:Uo_IEat0K]": 81, + "[QM9:alpha_IP]": 75, + "[QM9:epsE_HOMO]": 76, + "[QM9:epsE_LUMO]": 77, + "[QM9:eps_GAP]": 78, + "[QM9:miu_DM]": 74, + "[QM9:zpve_ZPVE]": 80, + "[RDKit:AUTOCORR2D_100]": 106, + "[RDKit:AUTOCORR2D_101]": 107, + "[RDKit:AUTOCORR2D_102]": 108, + "[RDKit:AUTOCORR2D_103]": 109, + "[RDKit:AUTOCORR2D_104]": 110, + "[RDKit:AUTOCORR2D_105]": 111, + "[RDKit:AUTOCORR2D_106]": 112, + "[RDKit:AUTOCORR2D_107]": 113, + "[RDKit:AUTOCORR2D_108]": 114, + "[RDKit:AUTOCORR2D_109]": 115, + "[RDKit:AUTOCORR2D_10]": 105, + "[RDKit:AUTOCORR2D_110]": 117, + "[RDKit:AUTOCORR2D_111]": 118, + "[RDKit:AUTOCORR2D_112]": 119, + "[RDKit:AUTOCORR2D_113]": 120, + "[RDKit:AUTOCORR2D_114]": 121, + "[RDKit:AUTOCORR2D_115]": 122, + "[RDKit:AUTOCORR2D_116]": 123, + "[RDKit:AUTOCORR2D_117]": 124, + "[RDKit:AUTOCORR2D_118]": 125, + "[RDKit:AUTOCORR2D_119]": 126, + "[RDKit:AUTOCORR2D_11]": 116, + "[RDKit:AUTOCORR2D_120]": 128, + "[RDKit:AUTOCORR2D_121]": 129, + "[RDKit:AUTOCORR2D_122]": 130, + "[RDKit:AUTOCORR2D_123]": 131, + "[RDKit:AUTOCORR2D_124]": 132, + "[RDKit:AUTOCORR2D_125]": 133, + "[RDKit:AUTOCORR2D_126]": 134, + "[RDKit:AUTOCORR2D_127]": 135, + "[RDKit:AUTOCORR2D_128]": 136, + "[RDKit:AUTOCORR2D_129]": 137, + "[RDKit:AUTOCORR2D_12]": 127, + "[RDKit:AUTOCORR2D_130]": 139, + "[RDKit:AUTOCORR2D_131]": 140, + "[RDKit:AUTOCORR2D_132]": 141, + "[RDKit:AUTOCORR2D_133]": 142, + "[RDKit:AUTOCORR2D_134]": 143, + "[RDKit:AUTOCORR2D_135]": 144, + "[RDKit:AUTOCORR2D_136]": 145, + "[RDKit:AUTOCORR2D_137]": 146, + "[RDKit:AUTOCORR2D_138]": 147, + "[RDKit:AUTOCORR2D_139]": 148, + "[RDKit:AUTOCORR2D_13]": 138, + "[RDKit:AUTOCORR2D_140]": 150, + "[RDKit:AUTOCORR2D_141]": 151, + "[RDKit:AUTOCORR2D_142]": 152, + "[RDKit:AUTOCORR2D_143]": 153, + "[RDKit:AUTOCORR2D_144]": 154, + "[RDKit:AUTOCORR2D_145]": 155, + "[RDKit:AUTOCORR2D_146]": 156, + "[RDKit:AUTOCORR2D_147]": 157, + "[RDKit:AUTOCORR2D_148]": 158, + "[RDKit:AUTOCORR2D_149]": 159, + "[RDKit:AUTOCORR2D_14]": 149, + "[RDKit:AUTOCORR2D_150]": 161, + "[RDKit:AUTOCORR2D_151]": 162, + "[RDKit:AUTOCORR2D_152]": 163, + "[RDKit:AUTOCORR2D_153]": 164, + "[RDKit:AUTOCORR2D_154]": 165, + "[RDKit:AUTOCORR2D_155]": 166, + "[RDKit:AUTOCORR2D_156]": 167, + "[RDKit:AUTOCORR2D_157]": 168, + "[RDKit:AUTOCORR2D_158]": 169, + "[RDKit:AUTOCORR2D_159]": 170, + "[RDKit:AUTOCORR2D_15]": 160, + "[RDKit:AUTOCORR2D_160]": 172, + "[RDKit:AUTOCORR2D_161]": 173, + "[RDKit:AUTOCORR2D_162]": 174, + "[RDKit:AUTOCORR2D_163]": 175, + "[RDKit:AUTOCORR2D_164]": 176, + "[RDKit:AUTOCORR2D_165]": 177, + "[RDKit:AUTOCORR2D_166]": 178, + "[RDKit:AUTOCORR2D_167]": 179, + "[RDKit:AUTOCORR2D_168]": 180, + "[RDKit:AUTOCORR2D_169]": 181, + "[RDKit:AUTOCORR2D_16]": 171, + "[RDKit:AUTOCORR2D_170]": 183, + "[RDKit:AUTOCORR2D_171]": 184, + "[RDKit:AUTOCORR2D_172]": 185, + "[RDKit:AUTOCORR2D_173]": 186, + "[RDKit:AUTOCORR2D_174]": 187, + "[RDKit:AUTOCORR2D_175]": 188, + "[RDKit:AUTOCORR2D_176]": 189, + "[RDKit:AUTOCORR2D_177]": 190, + "[RDKit:AUTOCORR2D_178]": 191, + "[RDKit:AUTOCORR2D_179]": 192, + "[RDKit:AUTOCORR2D_17]": 182, + "[RDKit:AUTOCORR2D_180]": 194, + "[RDKit:AUTOCORR2D_181]": 195, + "[RDKit:AUTOCORR2D_182]": 196, + "[RDKit:AUTOCORR2D_183]": 197, + "[RDKit:AUTOCORR2D_184]": 198, + "[RDKit:AUTOCORR2D_185]": 199, + "[RDKit:AUTOCORR2D_186]": 200, + "[RDKit:AUTOCORR2D_187]": 201, + "[RDKit:AUTOCORR2D_188]": 202, + "[RDKit:AUTOCORR2D_189]": 203, + "[RDKit:AUTOCORR2D_18]": 193, + "[RDKit:AUTOCORR2D_190]": 205, + "[RDKit:AUTOCORR2D_191]": 206, + "[RDKit:AUTOCORR2D_192]": 207, + "[RDKit:AUTOCORR2D_19]": 204, + "[RDKit:AUTOCORR2D_1]": 104, + "[RDKit:AUTOCORR2D_20]": 209, + "[RDKit:AUTOCORR2D_21]": 210, + "[RDKit:AUTOCORR2D_22]": 211, + "[RDKit:AUTOCORR2D_23]": 212, + "[RDKit:AUTOCORR2D_24]": 213, + "[RDKit:AUTOCORR2D_25]": 214, + "[RDKit:AUTOCORR2D_26]": 215, + "[RDKit:AUTOCORR2D_27]": 216, + "[RDKit:AUTOCORR2D_28]": 217, + "[RDKit:AUTOCORR2D_29]": 218, + "[RDKit:AUTOCORR2D_2]": 208, + "[RDKit:AUTOCORR2D_30]": 220, + "[RDKit:AUTOCORR2D_31]": 221, + "[RDKit:AUTOCORR2D_32]": 222, + "[RDKit:AUTOCORR2D_33]": 223, + "[RDKit:AUTOCORR2D_34]": 224, + "[RDKit:AUTOCORR2D_35]": 225, + "[RDKit:AUTOCORR2D_36]": 226, + "[RDKit:AUTOCORR2D_37]": 227, + "[RDKit:AUTOCORR2D_38]": 228, + "[RDKit:AUTOCORR2D_39]": 229, + "[RDKit:AUTOCORR2D_3]": 219, + "[RDKit:AUTOCORR2D_40]": 231, + "[RDKit:AUTOCORR2D_41]": 232, + "[RDKit:AUTOCORR2D_42]": 233, + "[RDKit:AUTOCORR2D_43]": 234, + "[RDKit:AUTOCORR2D_44]": 235, + "[RDKit:AUTOCORR2D_45]": 236, + "[RDKit:AUTOCORR2D_46]": 237, + "[RDKit:AUTOCORR2D_47]": 238, + "[RDKit:AUTOCORR2D_48]": 239, + "[RDKit:AUTOCORR2D_49]": 240, + "[RDKit:AUTOCORR2D_4]": 230, + "[RDKit:AUTOCORR2D_50]": 242, + "[RDKit:AUTOCORR2D_51]": 243, + "[RDKit:AUTOCORR2D_52]": 244, + "[RDKit:AUTOCORR2D_53]": 245, + "[RDKit:AUTOCORR2D_54]": 246, + "[RDKit:AUTOCORR2D_55]": 247, + "[RDKit:AUTOCORR2D_56]": 248, + "[RDKit:AUTOCORR2D_57]": 249, + "[RDKit:AUTOCORR2D_58]": 250, + "[RDKit:AUTOCORR2D_59]": 251, + "[RDKit:AUTOCORR2D_5]": 241, + "[RDKit:AUTOCORR2D_60]": 253, + "[RDKit:AUTOCORR2D_61]": 254, + "[RDKit:AUTOCORR2D_62]": 255, + "[RDKit:AUTOCORR2D_63]": 256, + "[RDKit:AUTOCORR2D_64]": 257, + "[RDKit:AUTOCORR2D_65]": 258, + "[RDKit:AUTOCORR2D_66]": 259, + "[RDKit:AUTOCORR2D_67]": 260, + "[RDKit:AUTOCORR2D_68]": 261, + "[RDKit:AUTOCORR2D_69]": 262, + "[RDKit:AUTOCORR2D_6]": 252, + "[RDKit:AUTOCORR2D_70]": 264, + "[RDKit:AUTOCORR2D_71]": 265, + "[RDKit:AUTOCORR2D_72]": 266, + "[RDKit:AUTOCORR2D_73]": 267, + "[RDKit:AUTOCORR2D_74]": 268, + "[RDKit:AUTOCORR2D_75]": 269, + "[RDKit:AUTOCORR2D_76]": 270, + "[RDKit:AUTOCORR2D_77]": 271, + "[RDKit:AUTOCORR2D_78]": 272, + "[RDKit:AUTOCORR2D_79]": 273, + "[RDKit:AUTOCORR2D_7]": 263, + "[RDKit:AUTOCORR2D_80]": 275, + "[RDKit:AUTOCORR2D_81]": 276, + "[RDKit:AUTOCORR2D_82]": 277, + "[RDKit:AUTOCORR2D_83]": 278, + "[RDKit:AUTOCORR2D_84]": 279, + "[RDKit:AUTOCORR2D_85]": 280, + "[RDKit:AUTOCORR2D_86]": 281, + "[RDKit:AUTOCORR2D_87]": 282, + "[RDKit:AUTOCORR2D_88]": 283, + "[RDKit:AUTOCORR2D_89]": 284, + "[RDKit:AUTOCORR2D_8]": 274, + "[RDKit:AUTOCORR2D_90]": 286, + "[RDKit:AUTOCORR2D_91]": 287, + "[RDKit:AUTOCORR2D_92]": 288, + "[RDKit:AUTOCORR2D_93]": 289, + "[RDKit:AUTOCORR2D_94]": 290, + "[RDKit:AUTOCORR2D_95]": 291, + "[RDKit:AUTOCORR2D_96]": 292, + "[RDKit:AUTOCORR2D_97]": 293, + "[RDKit:AUTOCORR2D_98]": 294, + "[RDKit:AUTOCORR2D_99]": 295, + "[RDKit:AUTOCORR2D_9]": 285, + "[RDKit:AvgIpc]": 296, + "[RDKit:BCUT2D_CHGHI]": 297, + "[RDKit:BCUT2D_CHGLO]": 298, + "[RDKit:BCUT2D_LOGPHI]": 299, + "[RDKit:BCUT2D_LOGPLOW]": 300, + "[RDKit:BCUT2D_MRHI]": 301, + "[RDKit:BCUT2D_MRLOW]": 302, + "[RDKit:BCUT2D_MWHI]": 303, + "[RDKit:BCUT2D_MWLOW]": 304, + "[RDKit:BalabanJ]": 305, + "[RDKit:BertzCT]": 306, + "[RDKit:Chi0]": 307, + "[RDKit:Chi0n]": 308, + "[RDKit:Chi0v]": 309, + "[RDKit:Chi1]": 310, + "[RDKit:Chi1n]": 311, + "[RDKit:Chi1v]": 312, + "[RDKit:Chi2n]": 313, + "[RDKit:Chi2v]": 314, + "[RDKit:Chi3n]": 315, + "[RDKit:Chi3v]": 316, + "[RDKit:Chi4n]": 317, + "[RDKit:Chi4v]": 318, + "[RDKit:EState_VSA10]": 320, + "[RDKit:EState_VSA11]": 321, + "[RDKit:EState_VSA1]": 319, + "[RDKit:EState_VSA2]": 322, + "[RDKit:EState_VSA3]": 323, + "[RDKit:EState_VSA4]": 324, + "[RDKit:EState_VSA5]": 325, + "[RDKit:EState_VSA6]": 326, + "[RDKit:EState_VSA7]": 327, + "[RDKit:EState_VSA8]": 328, + "[RDKit:EState_VSA9]": 329, + "[RDKit:ExactMolWt]": 330, + "[RDKit:FpDensityMorgan1]": 331, + "[RDKit:FpDensityMorgan2]": 332, + "[RDKit:FpDensityMorgan3]": 333, + "[RDKit:FractionCSP3]": 86, + "[RDKit:HallKierAlpha]": 334, + "[RDKit:HeavyAtomCount]": 87, + "[RDKit:HeavyAtomMolWt]": 335, + "[RDKit:Ipc]": 336, + "[RDKit:Kappa1]": 337, + "[RDKit:Kappa2]": 338, + "[RDKit:Kappa3]": 339, + "[RDKit:LabuteASA]": 340, + "[RDKit:MaxAbsEStateIndex]": 341, + "[RDKit:MaxAbsPartialCharge]": 342, + "[RDKit:MaxEStateIndex]": 343, + "[RDKit:MaxPartialCharge]": 344, + "[RDKit:MinAbsEStateIndex]": 345, + "[RDKit:MinAbsPartialCharge]": 346, + "[RDKit:MinEStateIndex]": 347, + "[RDKit:MinPartialCharge]": 348, + "[RDKit:MolLogP]": 349, + "[RDKit:MolMR]": 350, + "[RDKit:MolWt]": 351, + "[RDKit:NHOHCount]": 88, + "[RDKit:NOCount]": 89, + "[RDKit:NumAliphaticCarbocycles]": 90, + "[RDKit:NumAliphaticHeterocycles]": 91, + "[RDKit:NumAliphaticRings]": 92, + "[RDKit:NumAromaticCarbocycles]": 93, + "[RDKit:NumAromaticHeterocycles]": 94, + "[RDKit:NumAromaticRings]": 95, + "[RDKit:NumHAcceptors]": 96, + "[RDKit:NumHDonors]": 97, + "[RDKit:NumHeteroatoms]": 98, + "[RDKit:NumRadicalElectrons]": 352, + "[RDKit:NumRotatableBonds]": 99, + "[RDKit:NumSaturatedCarbocycles]": 100, + "[RDKit:NumSaturatedHeterocycles]": 101, + "[RDKit:NumSaturatedRings]": 102, + "[RDKit:NumValenceElectrons]": 353, + "[RDKit:PEOE_VSA10]": 355, + "[RDKit:PEOE_VSA11]": 356, + "[RDKit:PEOE_VSA12]": 357, + "[RDKit:PEOE_VSA13]": 358, + "[RDKit:PEOE_VSA14]": 359, + "[RDKit:PEOE_VSA1]": 354, + "[RDKit:PEOE_VSA2]": 360, + "[RDKit:PEOE_VSA3]": 361, + "[RDKit:PEOE_VSA4]": 362, + "[RDKit:PEOE_VSA5]": 363, + "[RDKit:PEOE_VSA6]": 364, + "[RDKit:PEOE_VSA7]": 365, + "[RDKit:PEOE_VSA8]": 366, + "[RDKit:PEOE_VSA9]": 367, + "[RDKit:RingCount]": 103, + "[RDKit:SMR_VSA10]": 369, + "[RDKit:SMR_VSA1]": 368, + "[RDKit:SMR_VSA2]": 370, + "[RDKit:SMR_VSA3]": 371, + "[RDKit:SMR_VSA4]": 372, + "[RDKit:SMR_VSA5]": 373, + "[RDKit:SMR_VSA6]": 374, + "[RDKit:SMR_VSA7]": 375, + "[RDKit:SMR_VSA8]": 376, + "[RDKit:SMR_VSA9]": 377, + "[RDKit:SPS]": 378, + "[RDKit:SlogP_VSA10]": 380, + "[RDKit:SlogP_VSA11]": 381, + "[RDKit:SlogP_VSA12]": 382, + "[RDKit:SlogP_VSA1]": 379, + "[RDKit:SlogP_VSA2]": 383, + "[RDKit:SlogP_VSA3]": 384, + "[RDKit:SlogP_VSA4]": 385, + "[RDKit:SlogP_VSA5]": 386, + "[RDKit:SlogP_VSA6]": 387, + "[RDKit:SlogP_VSA7]": 388, + "[RDKit:SlogP_VSA8]": 389, + "[RDKit:SlogP_VSA9]": 390, + "[RDKit:TPSA]": 391, + "[RDKit:VSA_EState10]": 393, + "[RDKit:VSA_EState1]": 392, + "[RDKit:VSA_EState2]": 394, + "[RDKit:VSA_EState3]": 395, + "[RDKit:VSA_EState4]": 396, + "[RDKit:VSA_EState5]": 397, + "[RDKit:VSA_EState6]": 398, + "[RDKit:VSA_EState7]": 399, + "[RDKit:VSA_EState8]": 400, + "[RDKit:VSA_EState9]": 401, + "[RDKit:fr_Al_COO]": 402, + "[RDKit:fr_Al_OH]": 403, + "[RDKit:fr_Al_OH_noTert]": 404, + "[RDKit:fr_ArN]": 405, + "[RDKit:fr_Ar_COO]": 406, + "[RDKit:fr_Ar_NH]": 408, + "[RDKit:fr_Ar_N]": 407, + "[RDKit:fr_Ar_OH]": 409, + "[RDKit:fr_COO2]": 411, + "[RDKit:fr_COO]": 410, + "[RDKit:fr_C_O]": 412, + "[RDKit:fr_C_O_noCOO]": 413, + "[RDKit:fr_C_S]": 414, + "[RDKit:fr_HOCCN]": 415, + "[RDKit:fr_Imine]": 416, + "[RDKit:fr_NH0]": 417, + "[RDKit:fr_NH1]": 418, + "[RDKit:fr_NH2]": 419, + "[RDKit:fr_N_O]": 420, + "[RDKit:fr_Ndealkylation1]": 421, + "[RDKit:fr_Ndealkylation2]": 422, + "[RDKit:fr_Nhpyrrole]": 423, + "[RDKit:fr_SH]": 424, + "[RDKit:fr_aldehyde]": 425, + "[RDKit:fr_alkyl_carbamate]": 426, + "[RDKit:fr_alkyl_halide]": 427, + "[RDKit:fr_allylic_oxid]": 428, + "[RDKit:fr_amide]": 429, + "[RDKit:fr_amidine]": 430, + "[RDKit:fr_aniline]": 431, + "[RDKit:fr_aryl_methyl]": 432, + "[RDKit:fr_azide]": 433, + "[RDKit:fr_azo]": 434, + "[RDKit:fr_barbitur]": 435, + "[RDKit:fr_benzene]": 436, + "[RDKit:fr_benzodiazepine]": 437, + "[RDKit:fr_bicyclic]": 438, + "[RDKit:fr_diazo]": 439, + "[RDKit:fr_dihydropyridine]": 440, + "[RDKit:fr_epoxide]": 441, + "[RDKit:fr_ester]": 442, + "[RDKit:fr_ether]": 443, + "[RDKit:fr_furan]": 444, + "[RDKit:fr_guanido]": 445, + "[RDKit:fr_halogen]": 446, + "[RDKit:fr_hdrzine]": 447, + "[RDKit:fr_hdrzone]": 448, + "[RDKit:fr_imidazole]": 449, + "[RDKit:fr_imide]": 450, + "[RDKit:fr_isocyan]": 451, + "[RDKit:fr_isothiocyan]": 452, + "[RDKit:fr_ketone]": 453, + "[RDKit:fr_ketone_Topliss]": 454, + "[RDKit:fr_lactam]": 455, + "[RDKit:fr_lactone]": 456, + "[RDKit:fr_methoxy]": 457, + "[RDKit:fr_morpholine]": 458, + "[RDKit:fr_nitrile]": 459, + "[RDKit:fr_nitro]": 460, + "[RDKit:fr_nitro_arom]": 461, + "[RDKit:fr_nitro_arom_nonortho]": 462, + "[RDKit:fr_nitroso]": 463, + "[RDKit:fr_oxazole]": 464, + "[RDKit:fr_oxime]": 465, + "[RDKit:fr_para_hydroxylation]": 466, + "[RDKit:fr_phenol]": 467, + "[RDKit:fr_phenol_noOrthoHbond]": 468, + "[RDKit:fr_phos_acid]": 469, + "[RDKit:fr_phos_ester]": 470, + "[RDKit:fr_piperdine]": 471, + "[RDKit:fr_piperzine]": 472, + "[RDKit:fr_priamide]": 473, + "[RDKit:fr_prisulfonamd]": 474, + "[RDKit:fr_pyridine]": 475, + "[RDKit:fr_quatN]": 476, + "[RDKit:fr_sulfide]": 477, + "[RDKit:fr_sulfonamd]": 478, + "[RDKit:fr_sulfone]": 479, + "[RDKit:fr_term_acetylene]": 480, + "[RDKit:fr_tetrazole]": 481, + "[RDKit:fr_thiazole]": 482, + "[RDKit:fr_thiocyan]": 483, + "[RDKit:fr_thiophene]": 484, + "[RDKit:fr_unbrch_alkane]": 485, + "[RDKit:fr_urea]": 486, + "[RDKit:qed]": 487, + "[SEP]": 843, + "[SPAN]": 844, + "[SPM_AAD(PAIR)]": 536, + "[SPM_AAD]": 512, + "[SPM_DDD(PAIR)]": 535, + "[SPM_DDD]": 511, + "[SPM_XYZ(PAIR)]": 537, + "[SPM_XYZ]": 513, + "[SUB]": 849, + "[VALUE]": 845, + "[XYZ]": 846, + "[mGLM_pro_val(PAIR)]": 527, + "[mGLM_pro_val]": 503, + "[mMLM(PAIR)]": 517, + "[mMLM]": 493, + "[mPGLM_smi_pro(PAIR)]": 531, + "[mPGLM_smi_pro]": 507, + "[mPGLM_smi_val(PAIR)]": 532, + "[mPGLM_smi_val]": 508, + "[mPLM(PAIR)]": 520, + "[mPLM]": 496, + "[mPPLM(PAIR)]": 523, + "[mPPLM]": 499, + "[mPPM(PAIR)]": 534, + "[mPPM]": 510, + "[sGLM_pro(PAIR)]": 525, + "[sGLM_pro]": 501, + "[sGLM_smi(PAIR)]": 524, + "[sGLM_smi]": 500, + "[sGLM_val(PAIR)]": 526, + "[sGLM_val]": 502, + "[sMLM_pro(PAIR)]": 515, + "[sMLM_pro]": 491, + "[sMLM_smi(PAIR)]": 514, + "[sMLM_smi]": 490, + "[sMLM_val(PAIR)]": 516, + "[sMLM_val]": 492, + "[sPGLM_pro(PAIR)]": 529, + "[sPGLM_pro]": 505, + "[sPGLM_smi(PAIR)]": 528, + "[sPGLM_smi]": 504, + "[sPGLM_val(PAIR)]": 530, + "[sPGLM_val]": 506, + "[sPLM_pro_val(PAIR)]": 519, + "[sPLM_pro_val]": 495, + "[sPLM_smi(PAIR)]": 518, + "[sPLM_smi]": 494, + "[sPPLM_pro_val(PAIR)]": 522, + "[sPPLM_pro_val]": 498, + "[sPPLM_smi(PAIR)]": 521, + "[sPPLM_smi]": 497, + "[sPPM(PAIR)]": 533, + "[sPPM]": 509 +} diff --git a/config.json b/config.json new file mode 100644 index 0000000..cded515 --- /dev/null +++ b/config.json @@ -0,0 +1,33 @@ +{ + "_name_or_path": "./bertModel/cus-llama2-base", + "architectures": [ + "LlamaForCausalLM" + ], + "attention_bias": false, + "attention_dropout": 0.0, + "bos_token_id": 1, + "decoder_start_token_id": 1, + "eos_token_id": 2, + "forced_eos_token_id": 2, + "hidden_act": "silu", + "hidden_size": 768, + "initializer_range": 0.02, + "intermediate_size": 2560, + "mask_token_id": 4, + "max_position_embeddings": 4096, + "model_type": "llama", + "num_attention_heads": 12, + "num_hidden_layers": 12, + "num_key_value_heads": 12, + "pad_token_id": 0, + "position_encoding_2d": false, + "pretraining_tp": 1, + "rms_norm_eps": 1e-05, + "rope_scaling": null, + "rope_theta": 5000000.0, + "tie_word_embeddings": false, + "torch_dtype": "float32", + "transformers_version": "4.38.2", + "use_cache": true, + "vocab_size": 851 +} diff --git a/generation_config.json b/generation_config.json new file mode 100644 index 0000000..1de33b9 --- /dev/null +++ b/generation_config.json @@ -0,0 +1,12 @@ +{ + "bos_token_id": 1, + "decoder_start_token_id": 1, + "eos_token_id": 2, + "forced_eos_token_id": 2, + "length_penalty": 0, + "mask_token_id": 4, + "no_repeat_ngram_size": 9, + "num_beams": 3, + "pad_token_id": 0, + "transformers_version": "4.38.2" +} diff --git a/model.safetensors b/model.safetensors new file mode 100644 index 0000000..79b54ed --- /dev/null +++ b/model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:40dcda5fb361c0533b07393d71d940be41792a1ff96ebeed89bf4ba2ef503d24 +size 401679328 diff --git a/special_tokens_map.json b/special_tokens_map.json new file mode 100644 index 0000000..a8b3208 --- /dev/null +++ b/special_tokens_map.json @@ -0,0 +1,7 @@ +{ + "cls_token": "[CLS]", + "mask_token": "[MASK]", + "pad_token": "[PAD]", + "sep_token": "[SEP]", + "unk_token": "[UNK]" +} diff --git a/tokenizer.json b/tokenizer.json new file mode 100644 index 0000000..2f7187e --- /dev/null +++ b/tokenizer.json @@ -0,0 +1,7275 @@ +{ + "version": "1.0", + "truncation": null, + "padding": null, + "added_tokens": [ + { + "id": 0, + "content": "[PAD]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 1, + "content": "[SOS]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 2, + "content": "[EOS]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 3, + "content": "[UNK]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 4, + "content": "[MASK]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 9, + "content": "-", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 10, + "content": ".", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 12, + "content": "0", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 13, + "content": "1", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 14, + "content": "2", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 15, + "content": "3", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 16, + "content": "4", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 17, + "content": "5", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 18, + "content": "6", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 19, + "content": "7", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 20, + "content": "8", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 21, + "content": "9", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 71, + "content": "[QM9:A_RC]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 72, + "content": "[QM9:B_RC]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 73, + "content": "[QM9:C_RC]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 74, + "content": "[QM9:miu_DM]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 75, + "content": "[QM9:alpha_IP]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 76, + "content": "[QM9:epsE_HOMO]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 77, + "content": "[QM9:epsE_LUMO]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 78, + "content": "[QM9:eps_GAP]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 79, + "content": "[QM9:R2_ESE]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 80, + "content": "[QM9:zpve_ZPVE]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 81, + "content": "[QM9:Uo_IEat0K]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 82, + "content": "[QM9:U_IEat298.15K]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 83, + "content": "[QM9:H_Eat298.15K]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 84, + "content": "[QM9:G_FEat298.15K]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 85, + "content": "[QM9:Cv_HCat298.15K]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 86, + "content": "[RDKit:FractionCSP3]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 87, + "content": "[RDKit:HeavyAtomCount]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 88, + "content": "[RDKit:NHOHCount]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 89, + "content": "[RDKit:NOCount]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 90, + "content": "[RDKit:NumAliphaticCarbocycles]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 91, + "content": "[RDKit:NumAliphaticHeterocycles]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 92, + "content": "[RDKit:NumAliphaticRings]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 93, + "content": "[RDKit:NumAromaticCarbocycles]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 94, + "content": "[RDKit:NumAromaticHeterocycles]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 95, + "content": "[RDKit:NumAromaticRings]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 96, + "content": "[RDKit:NumHAcceptors]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 97, + "content": "[RDKit:NumHDonors]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 98, + "content": "[RDKit:NumHeteroatoms]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 99, + "content": "[RDKit:NumRotatableBonds]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 100, + "content": "[RDKit:NumSaturatedCarbocycles]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 101, + "content": "[RDKit:NumSaturatedHeterocycles]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 102, + "content": "[RDKit:NumSaturatedRings]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 103, + "content": "[RDKit:RingCount]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 104, + "content": "[RDKit:AUTOCORR2D_1]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 105, + "content": "[RDKit:AUTOCORR2D_10]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 106, + "content": "[RDKit:AUTOCORR2D_100]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 107, + "content": "[RDKit:AUTOCORR2D_101]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 108, + "content": "[RDKit:AUTOCORR2D_102]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 109, + "content": "[RDKit:AUTOCORR2D_103]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 110, + "content": "[RDKit:AUTOCORR2D_104]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 111, + "content": "[RDKit:AUTOCORR2D_105]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 112, + "content": "[RDKit:AUTOCORR2D_106]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 113, + "content": "[RDKit:AUTOCORR2D_107]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 114, + "content": "[RDKit:AUTOCORR2D_108]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 115, + "content": "[RDKit:AUTOCORR2D_109]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 116, + "content": "[RDKit:AUTOCORR2D_11]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 117, + "content": "[RDKit:AUTOCORR2D_110]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 118, + "content": "[RDKit:AUTOCORR2D_111]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 119, + "content": "[RDKit:AUTOCORR2D_112]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 120, + "content": "[RDKit:AUTOCORR2D_113]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 121, + "content": "[RDKit:AUTOCORR2D_114]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 122, + "content": "[RDKit:AUTOCORR2D_115]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 123, + "content": "[RDKit:AUTOCORR2D_116]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 124, + "content": "[RDKit:AUTOCORR2D_117]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 125, + "content": "[RDKit:AUTOCORR2D_118]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 126, + "content": "[RDKit:AUTOCORR2D_119]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 127, + "content": "[RDKit:AUTOCORR2D_12]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 128, + "content": "[RDKit:AUTOCORR2D_120]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 129, + "content": "[RDKit:AUTOCORR2D_121]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 130, + "content": "[RDKit:AUTOCORR2D_122]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 131, + "content": "[RDKit:AUTOCORR2D_123]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 132, + "content": "[RDKit:AUTOCORR2D_124]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 133, + "content": "[RDKit:AUTOCORR2D_125]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 134, + "content": "[RDKit:AUTOCORR2D_126]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 135, + "content": "[RDKit:AUTOCORR2D_127]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 136, + "content": "[RDKit:AUTOCORR2D_128]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 137, + "content": "[RDKit:AUTOCORR2D_129]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 138, + "content": "[RDKit:AUTOCORR2D_13]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 139, + "content": "[RDKit:AUTOCORR2D_130]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 140, + "content": "[RDKit:AUTOCORR2D_131]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 141, + "content": "[RDKit:AUTOCORR2D_132]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 142, + "content": "[RDKit:AUTOCORR2D_133]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 143, + "content": "[RDKit:AUTOCORR2D_134]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 144, + "content": "[RDKit:AUTOCORR2D_135]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 145, + "content": "[RDKit:AUTOCORR2D_136]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 146, + "content": "[RDKit:AUTOCORR2D_137]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 147, + "content": "[RDKit:AUTOCORR2D_138]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 148, + "content": "[RDKit:AUTOCORR2D_139]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 149, + "content": "[RDKit:AUTOCORR2D_14]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 150, + "content": "[RDKit:AUTOCORR2D_140]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 151, + "content": "[RDKit:AUTOCORR2D_141]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 152, + "content": "[RDKit:AUTOCORR2D_142]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 153, + "content": "[RDKit:AUTOCORR2D_143]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 154, + "content": "[RDKit:AUTOCORR2D_144]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 155, + "content": "[RDKit:AUTOCORR2D_145]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 156, + "content": "[RDKit:AUTOCORR2D_146]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 157, + "content": "[RDKit:AUTOCORR2D_147]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 158, + "content": "[RDKit:AUTOCORR2D_148]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 159, + "content": "[RDKit:AUTOCORR2D_149]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 160, + "content": "[RDKit:AUTOCORR2D_15]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 161, + "content": "[RDKit:AUTOCORR2D_150]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 162, + "content": "[RDKit:AUTOCORR2D_151]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 163, + "content": "[RDKit:AUTOCORR2D_152]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 164, + "content": "[RDKit:AUTOCORR2D_153]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 165, + "content": "[RDKit:AUTOCORR2D_154]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 166, + "content": "[RDKit:AUTOCORR2D_155]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 167, + "content": "[RDKit:AUTOCORR2D_156]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 168, + "content": "[RDKit:AUTOCORR2D_157]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 169, + "content": "[RDKit:AUTOCORR2D_158]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 170, + "content": "[RDKit:AUTOCORR2D_159]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 171, + "content": "[RDKit:AUTOCORR2D_16]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 172, + "content": "[RDKit:AUTOCORR2D_160]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 173, + "content": "[RDKit:AUTOCORR2D_161]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 174, + "content": "[RDKit:AUTOCORR2D_162]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 175, + "content": "[RDKit:AUTOCORR2D_163]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 176, + "content": "[RDKit:AUTOCORR2D_164]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 177, + "content": "[RDKit:AUTOCORR2D_165]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 178, + "content": "[RDKit:AUTOCORR2D_166]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 179, + "content": "[RDKit:AUTOCORR2D_167]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 180, + "content": "[RDKit:AUTOCORR2D_168]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 181, + "content": "[RDKit:AUTOCORR2D_169]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 182, + "content": "[RDKit:AUTOCORR2D_17]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 183, + "content": "[RDKit:AUTOCORR2D_170]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 184, + "content": "[RDKit:AUTOCORR2D_171]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 185, + "content": "[RDKit:AUTOCORR2D_172]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 186, + "content": "[RDKit:AUTOCORR2D_173]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 187, + "content": "[RDKit:AUTOCORR2D_174]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 188, + "content": "[RDKit:AUTOCORR2D_175]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 189, + "content": "[RDKit:AUTOCORR2D_176]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 190, + "content": "[RDKit:AUTOCORR2D_177]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 191, + "content": "[RDKit:AUTOCORR2D_178]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 192, + "content": "[RDKit:AUTOCORR2D_179]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 193, + "content": "[RDKit:AUTOCORR2D_18]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 194, + "content": "[RDKit:AUTOCORR2D_180]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 195, + "content": "[RDKit:AUTOCORR2D_181]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 196, + "content": "[RDKit:AUTOCORR2D_182]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 197, + "content": "[RDKit:AUTOCORR2D_183]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 198, + "content": "[RDKit:AUTOCORR2D_184]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 199, + "content": "[RDKit:AUTOCORR2D_185]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 200, + "content": "[RDKit:AUTOCORR2D_186]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 201, + "content": "[RDKit:AUTOCORR2D_187]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 202, + "content": "[RDKit:AUTOCORR2D_188]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 203, + "content": "[RDKit:AUTOCORR2D_189]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 204, + "content": "[RDKit:AUTOCORR2D_19]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 205, + "content": "[RDKit:AUTOCORR2D_190]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 206, + "content": "[RDKit:AUTOCORR2D_191]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 207, + "content": "[RDKit:AUTOCORR2D_192]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 208, + "content": "[RDKit:AUTOCORR2D_2]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 209, + "content": "[RDKit:AUTOCORR2D_20]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 210, + "content": "[RDKit:AUTOCORR2D_21]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 211, + "content": "[RDKit:AUTOCORR2D_22]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 212, + "content": "[RDKit:AUTOCORR2D_23]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 213, + "content": "[RDKit:AUTOCORR2D_24]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 214, + "content": "[RDKit:AUTOCORR2D_25]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 215, + "content": "[RDKit:AUTOCORR2D_26]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 216, + "content": "[RDKit:AUTOCORR2D_27]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 217, + "content": "[RDKit:AUTOCORR2D_28]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 218, + "content": "[RDKit:AUTOCORR2D_29]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 219, + "content": "[RDKit:AUTOCORR2D_3]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 220, + "content": "[RDKit:AUTOCORR2D_30]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 221, + "content": "[RDKit:AUTOCORR2D_31]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 222, + "content": "[RDKit:AUTOCORR2D_32]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 223, + "content": "[RDKit:AUTOCORR2D_33]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 224, + "content": "[RDKit:AUTOCORR2D_34]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 225, + "content": "[RDKit:AUTOCORR2D_35]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 226, + "content": "[RDKit:AUTOCORR2D_36]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 227, + "content": "[RDKit:AUTOCORR2D_37]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 228, + "content": "[RDKit:AUTOCORR2D_38]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 229, + "content": "[RDKit:AUTOCORR2D_39]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 230, + "content": "[RDKit:AUTOCORR2D_4]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 231, + "content": "[RDKit:AUTOCORR2D_40]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 232, + "content": "[RDKit:AUTOCORR2D_41]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 233, + "content": "[RDKit:AUTOCORR2D_42]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 234, + "content": "[RDKit:AUTOCORR2D_43]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 235, + "content": "[RDKit:AUTOCORR2D_44]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 236, + "content": "[RDKit:AUTOCORR2D_45]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 237, + "content": "[RDKit:AUTOCORR2D_46]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 238, + "content": "[RDKit:AUTOCORR2D_47]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 239, + "content": "[RDKit:AUTOCORR2D_48]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 240, + "content": "[RDKit:AUTOCORR2D_49]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 241, + "content": "[RDKit:AUTOCORR2D_5]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 242, + "content": "[RDKit:AUTOCORR2D_50]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 243, + "content": "[RDKit:AUTOCORR2D_51]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 244, + "content": "[RDKit:AUTOCORR2D_52]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 245, + "content": "[RDKit:AUTOCORR2D_53]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 246, + "content": "[RDKit:AUTOCORR2D_54]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 247, + "content": "[RDKit:AUTOCORR2D_55]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 248, + "content": "[RDKit:AUTOCORR2D_56]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 249, + "content": "[RDKit:AUTOCORR2D_57]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 250, + "content": "[RDKit:AUTOCORR2D_58]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 251, + "content": "[RDKit:AUTOCORR2D_59]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 252, + "content": "[RDKit:AUTOCORR2D_6]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 253, + "content": "[RDKit:AUTOCORR2D_60]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 254, + "content": "[RDKit:AUTOCORR2D_61]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 255, + "content": "[RDKit:AUTOCORR2D_62]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 256, + "content": "[RDKit:AUTOCORR2D_63]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 257, + "content": "[RDKit:AUTOCORR2D_64]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 258, + "content": "[RDKit:AUTOCORR2D_65]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 259, + "content": "[RDKit:AUTOCORR2D_66]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 260, + "content": "[RDKit:AUTOCORR2D_67]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 261, + "content": "[RDKit:AUTOCORR2D_68]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 262, + "content": "[RDKit:AUTOCORR2D_69]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 263, + "content": "[RDKit:AUTOCORR2D_7]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 264, + "content": "[RDKit:AUTOCORR2D_70]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 265, + "content": "[RDKit:AUTOCORR2D_71]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 266, + "content": "[RDKit:AUTOCORR2D_72]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 267, + "content": "[RDKit:AUTOCORR2D_73]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 268, + "content": "[RDKit:AUTOCORR2D_74]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 269, + "content": "[RDKit:AUTOCORR2D_75]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 270, + "content": "[RDKit:AUTOCORR2D_76]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 271, + "content": "[RDKit:AUTOCORR2D_77]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 272, + "content": "[RDKit:AUTOCORR2D_78]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 273, + "content": "[RDKit:AUTOCORR2D_79]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 274, + "content": "[RDKit:AUTOCORR2D_8]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 275, + "content": "[RDKit:AUTOCORR2D_80]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 276, + "content": "[RDKit:AUTOCORR2D_81]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 277, + "content": "[RDKit:AUTOCORR2D_82]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 278, + "content": "[RDKit:AUTOCORR2D_83]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 279, + "content": "[RDKit:AUTOCORR2D_84]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 280, + "content": "[RDKit:AUTOCORR2D_85]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 281, + "content": "[RDKit:AUTOCORR2D_86]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 282, + "content": "[RDKit:AUTOCORR2D_87]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 283, + "content": "[RDKit:AUTOCORR2D_88]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 284, + "content": "[RDKit:AUTOCORR2D_89]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 285, + "content": "[RDKit:AUTOCORR2D_9]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 286, + "content": "[RDKit:AUTOCORR2D_90]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 287, + "content": "[RDKit:AUTOCORR2D_91]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 288, + "content": "[RDKit:AUTOCORR2D_92]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 289, + "content": "[RDKit:AUTOCORR2D_93]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 290, + "content": "[RDKit:AUTOCORR2D_94]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 291, + "content": "[RDKit:AUTOCORR2D_95]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 292, + "content": "[RDKit:AUTOCORR2D_96]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 293, + "content": "[RDKit:AUTOCORR2D_97]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 294, + "content": "[RDKit:AUTOCORR2D_98]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 295, + "content": "[RDKit:AUTOCORR2D_99]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 296, + "content": "[RDKit:AvgIpc]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 297, + "content": "[RDKit:BCUT2D_CHGHI]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 298, + "content": "[RDKit:BCUT2D_CHGLO]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 299, + "content": "[RDKit:BCUT2D_LOGPHI]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 300, + "content": "[RDKit:BCUT2D_LOGPLOW]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 301, + "content": "[RDKit:BCUT2D_MRHI]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 302, + "content": "[RDKit:BCUT2D_MRLOW]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 303, + "content": "[RDKit:BCUT2D_MWHI]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 304, + "content": "[RDKit:BCUT2D_MWLOW]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 305, + "content": "[RDKit:BalabanJ]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 306, + "content": "[RDKit:BertzCT]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 307, + "content": "[RDKit:Chi0]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 308, + "content": "[RDKit:Chi0n]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 309, + "content": "[RDKit:Chi0v]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 310, + "content": "[RDKit:Chi1]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 311, + "content": "[RDKit:Chi1n]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 312, + "content": "[RDKit:Chi1v]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 313, + "content": "[RDKit:Chi2n]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 314, + "content": "[RDKit:Chi2v]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 315, + "content": "[RDKit:Chi3n]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 316, + "content": "[RDKit:Chi3v]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 317, + "content": "[RDKit:Chi4n]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 318, + "content": "[RDKit:Chi4v]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 319, + "content": "[RDKit:EState_VSA1]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 320, + "content": "[RDKit:EState_VSA10]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 321, + "content": "[RDKit:EState_VSA11]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 322, + "content": "[RDKit:EState_VSA2]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 323, + "content": "[RDKit:EState_VSA3]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 324, + "content": "[RDKit:EState_VSA4]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 325, + "content": "[RDKit:EState_VSA5]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 326, + "content": "[RDKit:EState_VSA6]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 327, + "content": "[RDKit:EState_VSA7]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 328, + "content": "[RDKit:EState_VSA8]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 329, + "content": "[RDKit:EState_VSA9]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 330, + "content": "[RDKit:ExactMolWt]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 331, + "content": "[RDKit:FpDensityMorgan1]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 332, + "content": "[RDKit:FpDensityMorgan2]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 333, + "content": "[RDKit:FpDensityMorgan3]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 334, + "content": "[RDKit:HallKierAlpha]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 335, + "content": "[RDKit:HeavyAtomMolWt]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 336, + "content": "[RDKit:Ipc]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 337, + "content": "[RDKit:Kappa1]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 338, + "content": "[RDKit:Kappa2]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 339, + "content": "[RDKit:Kappa3]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 340, + "content": "[RDKit:LabuteASA]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 341, + "content": "[RDKit:MaxAbsEStateIndex]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 342, + "content": "[RDKit:MaxAbsPartialCharge]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 343, + "content": "[RDKit:MaxEStateIndex]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 344, + "content": "[RDKit:MaxPartialCharge]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 345, + "content": "[RDKit:MinAbsEStateIndex]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 346, + "content": "[RDKit:MinAbsPartialCharge]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 347, + "content": "[RDKit:MinEStateIndex]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 348, + "content": "[RDKit:MinPartialCharge]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 349, + "content": "[RDKit:MolLogP]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 350, + "content": "[RDKit:MolMR]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 351, + "content": "[RDKit:MolWt]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 352, + "content": "[RDKit:NumRadicalElectrons]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 353, + "content": "[RDKit:NumValenceElectrons]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 354, + "content": "[RDKit:PEOE_VSA1]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 355, + "content": "[RDKit:PEOE_VSA10]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 356, + "content": "[RDKit:PEOE_VSA11]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 357, + "content": "[RDKit:PEOE_VSA12]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 358, + "content": "[RDKit:PEOE_VSA13]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 359, + "content": "[RDKit:PEOE_VSA14]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 360, + "content": "[RDKit:PEOE_VSA2]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 361, + "content": "[RDKit:PEOE_VSA3]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 362, + "content": "[RDKit:PEOE_VSA4]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 363, + "content": "[RDKit:PEOE_VSA5]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 364, + "content": "[RDKit:PEOE_VSA6]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 365, + "content": "[RDKit:PEOE_VSA7]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 366, + "content": "[RDKit:PEOE_VSA8]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 367, + "content": "[RDKit:PEOE_VSA9]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 368, + "content": "[RDKit:SMR_VSA1]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 369, + "content": "[RDKit:SMR_VSA10]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 370, + "content": "[RDKit:SMR_VSA2]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 371, + "content": "[RDKit:SMR_VSA3]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 372, + "content": "[RDKit:SMR_VSA4]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 373, + "content": "[RDKit:SMR_VSA5]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 374, + "content": "[RDKit:SMR_VSA6]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 375, + "content": "[RDKit:SMR_VSA7]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 376, + "content": "[RDKit:SMR_VSA8]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 377, + "content": "[RDKit:SMR_VSA9]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 378, + "content": "[RDKit:SPS]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 379, + "content": "[RDKit:SlogP_VSA1]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 380, + "content": "[RDKit:SlogP_VSA10]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 381, + "content": "[RDKit:SlogP_VSA11]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 382, + "content": "[RDKit:SlogP_VSA12]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 383, + "content": "[RDKit:SlogP_VSA2]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 384, + "content": "[RDKit:SlogP_VSA3]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 385, + "content": "[RDKit:SlogP_VSA4]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 386, + "content": "[RDKit:SlogP_VSA5]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 387, + "content": "[RDKit:SlogP_VSA6]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 388, + "content": "[RDKit:SlogP_VSA7]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 389, + "content": "[RDKit:SlogP_VSA8]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 390, + "content": "[RDKit:SlogP_VSA9]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 391, + "content": "[RDKit:TPSA]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 392, + "content": "[RDKit:VSA_EState1]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 393, + "content": "[RDKit:VSA_EState10]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 394, + "content": "[RDKit:VSA_EState2]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 395, + "content": "[RDKit:VSA_EState3]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 396, + "content": "[RDKit:VSA_EState4]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 397, + "content": "[RDKit:VSA_EState5]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 398, + "content": "[RDKit:VSA_EState6]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 399, + "content": "[RDKit:VSA_EState7]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 400, + "content": "[RDKit:VSA_EState8]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 401, + "content": "[RDKit:VSA_EState9]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 402, + "content": "[RDKit:fr_Al_COO]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 403, + "content": "[RDKit:fr_Al_OH]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 404, + "content": "[RDKit:fr_Al_OH_noTert]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 405, + "content": "[RDKit:fr_ArN]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 406, + "content": "[RDKit:fr_Ar_COO]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 407, + "content": "[RDKit:fr_Ar_N]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 408, + "content": "[RDKit:fr_Ar_NH]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 409, + "content": "[RDKit:fr_Ar_OH]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 410, + "content": "[RDKit:fr_COO]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 411, + "content": "[RDKit:fr_COO2]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 412, + "content": "[RDKit:fr_C_O]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 413, + "content": "[RDKit:fr_C_O_noCOO]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 414, + "content": "[RDKit:fr_C_S]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 415, + "content": "[RDKit:fr_HOCCN]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 416, + "content": "[RDKit:fr_Imine]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 417, + "content": "[RDKit:fr_NH0]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 418, + "content": "[RDKit:fr_NH1]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 419, + "content": "[RDKit:fr_NH2]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 420, + "content": "[RDKit:fr_N_O]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 421, + "content": "[RDKit:fr_Ndealkylation1]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 422, + "content": "[RDKit:fr_Ndealkylation2]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 423, + "content": "[RDKit:fr_Nhpyrrole]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 424, + "content": "[RDKit:fr_SH]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 425, + "content": "[RDKit:fr_aldehyde]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 426, + "content": "[RDKit:fr_alkyl_carbamate]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 427, + "content": "[RDKit:fr_alkyl_halide]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 428, + "content": "[RDKit:fr_allylic_oxid]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 429, + "content": "[RDKit:fr_amide]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 430, + "content": "[RDKit:fr_amidine]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 431, + "content": "[RDKit:fr_aniline]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 432, + "content": "[RDKit:fr_aryl_methyl]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 433, + "content": "[RDKit:fr_azide]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 434, + "content": "[RDKit:fr_azo]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 435, + "content": "[RDKit:fr_barbitur]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 436, + "content": "[RDKit:fr_benzene]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 437, + "content": "[RDKit:fr_benzodiazepine]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 438, + "content": "[RDKit:fr_bicyclic]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 439, + "content": "[RDKit:fr_diazo]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 440, + "content": "[RDKit:fr_dihydropyridine]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 441, + "content": "[RDKit:fr_epoxide]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 442, + "content": "[RDKit:fr_ester]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 443, + "content": "[RDKit:fr_ether]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 444, + "content": "[RDKit:fr_furan]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 445, + "content": "[RDKit:fr_guanido]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 446, + "content": "[RDKit:fr_halogen]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 447, + "content": "[RDKit:fr_hdrzine]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 448, + "content": "[RDKit:fr_hdrzone]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 449, + "content": "[RDKit:fr_imidazole]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 450, + "content": "[RDKit:fr_imide]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 451, + "content": "[RDKit:fr_isocyan]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 452, + "content": "[RDKit:fr_isothiocyan]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 453, + "content": "[RDKit:fr_ketone]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 454, + "content": "[RDKit:fr_ketone_Topliss]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 455, + "content": "[RDKit:fr_lactam]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 456, + "content": "[RDKit:fr_lactone]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 457, + "content": "[RDKit:fr_methoxy]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 458, + "content": "[RDKit:fr_morpholine]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 459, + "content": "[RDKit:fr_nitrile]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 460, + "content": "[RDKit:fr_nitro]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 461, + "content": "[RDKit:fr_nitro_arom]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 462, + "content": "[RDKit:fr_nitro_arom_nonortho]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 463, + "content": "[RDKit:fr_nitroso]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 464, + "content": "[RDKit:fr_oxazole]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 465, + "content": "[RDKit:fr_oxime]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 466, + "content": "[RDKit:fr_para_hydroxylation]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 467, + "content": "[RDKit:fr_phenol]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 468, + "content": "[RDKit:fr_phenol_noOrthoHbond]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 469, + "content": "[RDKit:fr_phos_acid]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 470, + "content": "[RDKit:fr_phos_ester]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 471, + "content": "[RDKit:fr_piperdine]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 472, + "content": "[RDKit:fr_piperzine]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 473, + "content": "[RDKit:fr_priamide]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 474, + "content": "[RDKit:fr_prisulfonamd]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 475, + "content": "[RDKit:fr_pyridine]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 476, + "content": "[RDKit:fr_quatN]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 477, + "content": "[RDKit:fr_sulfide]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 478, + "content": "[RDKit:fr_sulfonamd]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 479, + "content": "[RDKit:fr_sulfone]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 480, + "content": "[RDKit:fr_term_acetylene]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 481, + "content": "[RDKit:fr_tetrazole]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 482, + "content": "[RDKit:fr_thiazole]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 483, + "content": "[RDKit:fr_thiocyan]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 484, + "content": "[RDKit:fr_thiophene]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 485, + "content": "[RDKit:fr_unbrch_alkane]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 486, + "content": "[RDKit:fr_urea]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 487, + "content": "[RDKit:qed]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 488, + "content": ";", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 489, + "content": ",", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 490, + "content": "[sMLM_smi]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 491, + "content": "[sMLM_pro]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 492, + "content": "[sMLM_val]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 493, + "content": "[mMLM]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 494, + "content": "[sPLM_smi]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 495, + "content": "[sPLM_pro_val]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 496, + "content": "[mPLM]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 497, + "content": "[sPPLM_smi]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 498, + "content": "[sPPLM_pro_val]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 499, + "content": "[mPPLM]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 500, + "content": "[sGLM_smi]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 501, + "content": "[sGLM_pro]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 502, + "content": "[sGLM_val]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 503, + "content": "[mGLM_pro_val]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 504, + "content": "[sPGLM_smi]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 505, + "content": "[sPGLM_pro]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 506, + "content": "[sPGLM_val]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 507, + "content": "[mPGLM_smi_pro]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 508, + "content": "[mPGLM_smi_val]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 509, + "content": "[sPPM]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 510, + "content": "[mPPM]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 511, + "content": "[SPM_DDD]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 512, + "content": "[SPM_AAD]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 513, + "content": "[SPM_XYZ]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 514, + "content": "[sMLM_smi(PAIR)]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 515, + "content": "[sMLM_pro(PAIR)]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 516, + "content": "[sMLM_val(PAIR)]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 517, + "content": "[mMLM(PAIR)]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 518, + "content": "[sPLM_smi(PAIR)]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 519, + "content": "[sPLM_pro_val(PAIR)]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 520, + "content": "[mPLM(PAIR)]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 521, + "content": "[sPPLM_smi(PAIR)]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 522, + "content": "[sPPLM_pro_val(PAIR)]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 523, + "content": "[mPPLM(PAIR)]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 524, + "content": "[sGLM_smi(PAIR)]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 525, + "content": "[sGLM_pro(PAIR)]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 526, + "content": "[sGLM_val(PAIR)]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 527, + "content": "[mGLM_pro_val(PAIR)]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 528, + "content": "[sPGLM_smi(PAIR)]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 529, + "content": "[sPGLM_pro(PAIR)]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 530, + "content": "[sPGLM_val(PAIR)]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 531, + "content": "[mPGLM_smi_pro(PAIR)]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 532, + "content": "[mPGLM_smi_val(PAIR)]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 533, + "content": "[sPPM(PAIR)]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 534, + "content": "[mPPM(PAIR)]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 535, + "content": "[SPM_DDD(PAIR)]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 536, + "content": "[SPM_AAD(PAIR)]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 537, + "content": "[SPM_XYZ(PAIR)]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 538, + "content": "[(DDD)ATOM:Ac]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 539, + "content": "[(DDD)ATOM:Ag]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 540, + "content": "[(DDD)ATOM:Al]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 541, + "content": "[(DDD)ATOM:Am]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 542, + "content": "[(DDD)ATOM:Ar]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 543, + "content": "[(DDD)ATOM:As]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 544, + "content": "[(DDD)ATOM:At]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 545, + "content": "[(DDD)ATOM:Au]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 546, + "content": "[(DDD)ATOM:B]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 547, + "content": "[(DDD)ATOM:Ba]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 548, + "content": "[(DDD)ATOM:Be]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 549, + "content": "[(DDD)ATOM:Bi]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 550, + "content": "[(DDD)ATOM:Bk]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 551, + "content": "[(DDD)ATOM:Br]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 552, + "content": "[(DDD)ATOM:C]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 553, + "content": "[(DDD)ATOM:Ca]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 554, + "content": "[(DDD)ATOM:Cd]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 555, + "content": "[(DDD)ATOM:Ce]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 556, + "content": "[(DDD)ATOM:Cf]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 557, + "content": "[(DDD)ATOM:Cl]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 558, + "content": "[(DDD)ATOM:Cm]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 559, + "content": "[(DDD)ATOM:Co]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 560, + "content": "[(DDD)ATOM:Cr]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 561, + "content": "[(DDD)ATOM:Cs]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 562, + "content": "[(DDD)ATOM:Cu]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 563, + "content": "[(DDD)ATOM:Dy]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 564, + "content": "[(DDD)ATOM:Er]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 565, + "content": "[(DDD)ATOM:Es]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 566, + "content": "[(DDD)ATOM:Eu]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 567, + "content": "[(DDD)ATOM:F]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 568, + "content": "[(DDD)ATOM:Fe]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 569, + "content": "[(DDD)ATOM:Fm]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 570, + "content": "[(DDD)ATOM:Ga]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 571, + "content": "[(DDD)ATOM:Gd]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 572, + "content": "[(DDD)ATOM:Ge]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 573, + "content": "[(DDD)ATOM:He]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 574, + "content": "[(DDD)ATOM:Hf]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 575, + "content": "[(DDD)ATOM:Hg]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 576, + "content": "[(DDD)ATOM:Ho]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 577, + "content": "[(DDD)ATOM:I]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 578, + "content": "[(DDD)ATOM:In]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 579, + "content": "[(DDD)ATOM:Ir]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 580, + "content": "[(DDD)ATOM:K]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 581, + "content": "[(DDD)ATOM:Kr]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 582, + "content": "[(DDD)ATOM:La]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 583, + "content": "[(DDD)ATOM:Li]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 584, + "content": "[(DDD)ATOM:Lr]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 585, + "content": "[(DDD)ATOM:Lu]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 586, + "content": "[(DDD)ATOM:Md]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 587, + "content": "[(DDD)ATOM:Mg]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 588, + "content": "[(DDD)ATOM:Mn]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 589, + "content": "[(DDD)ATOM:Mo]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 590, + "content": "[(DDD)ATOM:N]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 591, + "content": "[(DDD)ATOM:Na]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 592, + "content": "[(DDD)ATOM:Nb]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 593, + "content": "[(DDD)ATOM:Nd]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 594, + "content": "[(DDD)ATOM:Ne]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 595, + "content": "[(DDD)ATOM:Ni]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 596, + "content": "[(DDD)ATOM:No]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 597, + "content": "[(DDD)ATOM:Np]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 598, + "content": "[(DDD)ATOM:O]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 599, + "content": "[(DDD)ATOM:Os]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 600, + "content": "[(DDD)ATOM:P]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 601, + "content": "[(DDD)ATOM:Pa]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 602, + "content": "[(DDD)ATOM:Pb]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 603, + "content": "[(DDD)ATOM:Pd]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 604, + "content": "[(DDD)ATOM:Pm]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 605, + "content": "[(DDD)ATOM:Po]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 606, + "content": "[(DDD)ATOM:Pr]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 607, + "content": "[(DDD)ATOM:Pt]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 608, + "content": "[(DDD)ATOM:Pu]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 609, + "content": "[(DDD)ATOM:Rb]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 610, + "content": "[(DDD)ATOM:Re]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 611, + "content": "[(DDD)ATOM:Rh]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 612, + "content": "[(DDD)ATOM:Rn]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 613, + "content": "[(DDD)ATOM:Ru]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 614, + "content": "[(DDD)ATOM:S]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 615, + "content": "[(DDD)ATOM:Sb]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 616, + "content": "[(DDD)ATOM:Sc]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 617, + "content": "[(DDD)ATOM:Se]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 618, + "content": "[(DDD)ATOM:Si]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 619, + "content": "[(DDD)ATOM:Sm]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 620, + "content": "[(DDD)ATOM:Sn]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 621, + "content": "[(DDD)ATOM:Sr]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 622, + "content": "[(DDD)ATOM:Ta]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 623, + "content": "[(DDD)ATOM:Tb]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 624, + "content": "[(DDD)ATOM:Tc]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 625, + "content": "[(DDD)ATOM:Te]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 626, + "content": "[(DDD)ATOM:Th]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 627, + "content": "[(DDD)ATOM:Ti]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 628, + "content": "[(DDD)ATOM:Tl]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 629, + "content": "[(DDD)ATOM:Tm]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 630, + "content": "[(DDD)ATOM:U]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 631, + "content": "[(DDD)ATOM:V]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 632, + "content": "[(DDD)ATOM:W]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 633, + "content": "[(DDD)ATOM:Xe]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 634, + "content": "[(DDD)ATOM:Y]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 635, + "content": "[(DDD)ATOM:Yb]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 636, + "content": "[(DDD)ATOM:Zn]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 637, + "content": "[(DDD)ATOM:Zr]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 638, + "content": "[(AAD)ATOM:Ac]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 639, + "content": "[(AAD)ATOM:Ag]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 640, + "content": "[(AAD)ATOM:Al]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 641, + "content": "[(AAD)ATOM:Am]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 642, + "content": "[(AAD)ATOM:Ar]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 643, + "content": "[(AAD)ATOM:As]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 644, + "content": "[(AAD)ATOM:At]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 645, + "content": "[(AAD)ATOM:Au]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 646, + "content": "[(AAD)ATOM:B]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 647, + "content": "[(AAD)ATOM:Ba]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 648, + "content": "[(AAD)ATOM:Be]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 649, + "content": "[(AAD)ATOM:Bi]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 650, + "content": "[(AAD)ATOM:Bk]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 651, + "content": "[(AAD)ATOM:Br]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 652, + "content": "[(AAD)ATOM:C]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 653, + "content": "[(AAD)ATOM:Ca]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 654, + "content": "[(AAD)ATOM:Cd]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 655, + "content": "[(AAD)ATOM:Ce]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 656, + "content": "[(AAD)ATOM:Cf]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 657, + "content": "[(AAD)ATOM:Cl]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 658, + "content": "[(AAD)ATOM:Cm]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 659, + "content": "[(AAD)ATOM:Co]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 660, + "content": "[(AAD)ATOM:Cr]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 661, + "content": "[(AAD)ATOM:Cs]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 662, + "content": "[(AAD)ATOM:Cu]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 663, + "content": "[(AAD)ATOM:Dy]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 664, + "content": "[(AAD)ATOM:Er]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 665, + "content": "[(AAD)ATOM:Es]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 666, + "content": "[(AAD)ATOM:Eu]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 667, + "content": "[(AAD)ATOM:F]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 668, + "content": "[(AAD)ATOM:Fe]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 669, + "content": "[(AAD)ATOM:Fm]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 670, + "content": "[(AAD)ATOM:Ga]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 671, + "content": "[(AAD)ATOM:Gd]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 672, + "content": "[(AAD)ATOM:Ge]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 673, + "content": "[(AAD)ATOM:He]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 674, + "content": "[(AAD)ATOM:Hf]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 675, + "content": "[(AAD)ATOM:Hg]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 676, + "content": "[(AAD)ATOM:Ho]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 677, + "content": "[(AAD)ATOM:I]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 678, + "content": "[(AAD)ATOM:In]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 679, + "content": "[(AAD)ATOM:Ir]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 680, + "content": "[(AAD)ATOM:K]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 681, + "content": "[(AAD)ATOM:Kr]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 682, + "content": "[(AAD)ATOM:La]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 683, + "content": "[(AAD)ATOM:Li]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 684, + "content": "[(AAD)ATOM:Lr]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 685, + "content": "[(AAD)ATOM:Lu]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 686, + "content": "[(AAD)ATOM:Md]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 687, + "content": "[(AAD)ATOM:Mg]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 688, + "content": "[(AAD)ATOM:Mn]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 689, + "content": "[(AAD)ATOM:Mo]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 690, + "content": "[(AAD)ATOM:N]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 691, + "content": "[(AAD)ATOM:Na]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 692, + "content": "[(AAD)ATOM:Nb]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 693, + "content": "[(AAD)ATOM:Nd]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 694, + "content": "[(AAD)ATOM:Ne]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 695, + "content": "[(AAD)ATOM:Ni]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 696, + "content": "[(AAD)ATOM:No]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 697, + "content": "[(AAD)ATOM:Np]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 698, + "content": "[(AAD)ATOM:O]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 699, + "content": "[(AAD)ATOM:Os]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 700, + "content": "[(AAD)ATOM:P]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 701, + "content": "[(AAD)ATOM:Pa]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 702, + "content": "[(AAD)ATOM:Pb]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 703, + "content": "[(AAD)ATOM:Pd]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 704, + "content": "[(AAD)ATOM:Pm]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 705, + "content": "[(AAD)ATOM:Po]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 706, + "content": "[(AAD)ATOM:Pr]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 707, + "content": "[(AAD)ATOM:Pt]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 708, + "content": "[(AAD)ATOM:Pu]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 709, + "content": "[(AAD)ATOM:Rb]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 710, + "content": "[(AAD)ATOM:Re]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 711, + "content": "[(AAD)ATOM:Rh]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 712, + "content": "[(AAD)ATOM:Rn]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 713, + "content": "[(AAD)ATOM:Ru]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 714, + "content": "[(AAD)ATOM:S]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 715, + "content": "[(AAD)ATOM:Sb]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 716, + "content": "[(AAD)ATOM:Sc]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 717, + "content": "[(AAD)ATOM:Se]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 718, + "content": "[(AAD)ATOM:Si]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 719, + "content": "[(AAD)ATOM:Sm]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 720, + "content": "[(AAD)ATOM:Sn]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 721, + "content": "[(AAD)ATOM:Sr]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 722, + "content": "[(AAD)ATOM:Ta]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 723, + "content": "[(AAD)ATOM:Tb]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 724, + "content": "[(AAD)ATOM:Tc]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 725, + "content": "[(AAD)ATOM:Te]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 726, + "content": "[(AAD)ATOM:Th]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 727, + "content": "[(AAD)ATOM:Ti]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 728, + "content": "[(AAD)ATOM:Tl]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 729, + "content": "[(AAD)ATOM:Tm]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 730, + "content": "[(AAD)ATOM:U]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 731, + "content": "[(AAD)ATOM:V]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 732, + "content": "[(AAD)ATOM:W]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 733, + "content": "[(AAD)ATOM:Xe]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 734, + "content": "[(AAD)ATOM:Y]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 735, + "content": "[(AAD)ATOM:Yb]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 736, + "content": "[(AAD)ATOM:Zn]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 737, + "content": "[(AAD)ATOM:Zr]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 738, + "content": "[(XYZ)ATOM:Ac]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 739, + "content": "[(XYZ)ATOM:Ag]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 740, + "content": "[(XYZ)ATOM:Al]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 741, + "content": "[(XYZ)ATOM:Am]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 742, + "content": "[(XYZ)ATOM:Ar]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 743, + "content": "[(XYZ)ATOM:As]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 744, + "content": "[(XYZ)ATOM:At]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 745, + "content": "[(XYZ)ATOM:Au]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 746, + "content": "[(XYZ)ATOM:B]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 747, + "content": "[(XYZ)ATOM:Ba]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 748, + "content": "[(XYZ)ATOM:Be]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 749, + "content": "[(XYZ)ATOM:Bi]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 750, + "content": "[(XYZ)ATOM:Bk]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 751, + "content": "[(XYZ)ATOM:Br]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 752, + "content": "[(XYZ)ATOM:C]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 753, + "content": "[(XYZ)ATOM:Ca]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 754, + "content": "[(XYZ)ATOM:Cd]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 755, + "content": "[(XYZ)ATOM:Ce]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 756, + "content": "[(XYZ)ATOM:Cf]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 757, + "content": "[(XYZ)ATOM:Cl]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 758, + "content": "[(XYZ)ATOM:Cm]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 759, + "content": "[(XYZ)ATOM:Co]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 760, + "content": "[(XYZ)ATOM:Cr]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 761, + "content": "[(XYZ)ATOM:Cs]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 762, + "content": "[(XYZ)ATOM:Cu]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 763, + "content": "[(XYZ)ATOM:Dy]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 764, + "content": "[(XYZ)ATOM:Er]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 765, + "content": "[(XYZ)ATOM:Es]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 766, + "content": "[(XYZ)ATOM:Eu]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 767, + "content": "[(XYZ)ATOM:F]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 768, + "content": "[(XYZ)ATOM:Fe]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 769, + "content": "[(XYZ)ATOM:Fm]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 770, + "content": "[(XYZ)ATOM:Ga]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 771, + "content": "[(XYZ)ATOM:Gd]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 772, + "content": "[(XYZ)ATOM:Ge]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 773, + "content": "[(XYZ)ATOM:He]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 774, + "content": "[(XYZ)ATOM:Hf]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 775, + "content": "[(XYZ)ATOM:Hg]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 776, + "content": "[(XYZ)ATOM:Ho]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 777, + "content": "[(XYZ)ATOM:I]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 778, + "content": "[(XYZ)ATOM:In]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 779, + "content": "[(XYZ)ATOM:Ir]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 780, + "content": "[(XYZ)ATOM:K]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 781, + "content": "[(XYZ)ATOM:Kr]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 782, + "content": "[(XYZ)ATOM:La]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 783, + "content": "[(XYZ)ATOM:Li]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 784, + "content": "[(XYZ)ATOM:Lr]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 785, + "content": "[(XYZ)ATOM:Lu]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 786, + "content": "[(XYZ)ATOM:Md]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 787, + "content": "[(XYZ)ATOM:Mg]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 788, + "content": "[(XYZ)ATOM:Mn]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 789, + "content": "[(XYZ)ATOM:Mo]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 790, + "content": "[(XYZ)ATOM:N]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 791, + "content": "[(XYZ)ATOM:Na]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 792, + "content": "[(XYZ)ATOM:Nb]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 793, + "content": "[(XYZ)ATOM:Nd]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 794, + "content": "[(XYZ)ATOM:Ne]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 795, + "content": "[(XYZ)ATOM:Ni]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 796, + "content": "[(XYZ)ATOM:No]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 797, + "content": "[(XYZ)ATOM:Np]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 798, + "content": "[(XYZ)ATOM:O]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 799, + "content": "[(XYZ)ATOM:Os]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 800, + "content": "[(XYZ)ATOM:P]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 801, + "content": "[(XYZ)ATOM:Pa]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 802, + "content": "[(XYZ)ATOM:Pb]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 803, + "content": "[(XYZ)ATOM:Pd]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 804, + "content": "[(XYZ)ATOM:Pm]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 805, + "content": "[(XYZ)ATOM:Po]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 806, + "content": "[(XYZ)ATOM:Pr]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 807, + "content": "[(XYZ)ATOM:Pt]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 808, + "content": "[(XYZ)ATOM:Pu]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 809, + "content": "[(XYZ)ATOM:Rb]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 810, + "content": "[(XYZ)ATOM:Re]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 811, + "content": "[(XYZ)ATOM:Rh]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 812, + "content": "[(XYZ)ATOM:Rn]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 813, + "content": "[(XYZ)ATOM:Ru]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 814, + "content": "[(XYZ)ATOM:S]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 815, + "content": "[(XYZ)ATOM:Sb]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 816, + "content": "[(XYZ)ATOM:Sc]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 817, + "content": "[(XYZ)ATOM:Se]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 818, + "content": "[(XYZ)ATOM:Si]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 819, + "content": "[(XYZ)ATOM:Sm]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 820, + "content": "[(XYZ)ATOM:Sn]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 821, + "content": "[(XYZ)ATOM:Sr]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 822, + "content": "[(XYZ)ATOM:Ta]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 823, + "content": "[(XYZ)ATOM:Tb]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 824, + "content": "[(XYZ)ATOM:Tc]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 825, + "content": "[(XYZ)ATOM:Te]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 826, + "content": "[(XYZ)ATOM:Th]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 827, + "content": "[(XYZ)ATOM:Ti]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 828, + "content": "[(XYZ)ATOM:Tl]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 829, + "content": "[(XYZ)ATOM:Tm]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 830, + "content": "[(XYZ)ATOM:U]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 831, + "content": "[(XYZ)ATOM:V]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 832, + "content": "[(XYZ)ATOM:W]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 833, + "content": "[(XYZ)ATOM:Xe]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 834, + "content": "[(XYZ)ATOM:Y]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 835, + "content": "[(XYZ)ATOM:Yb]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 836, + "content": "[(XYZ)ATOM:Zn]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 837, + "content": "[(XYZ)ATOM:Zr]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 838, + "content": "[FPR:MACCS]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 839, + "content": "[FPR:Toplogical]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 840, + "content": "[FPR:ECFP]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 841, + "content": "[FPR:FCFP]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 842, + "content": "[FPR:Avalon]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 843, + "content": "[SEP]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": true + }, + { + "id": 844, + "content": "[SPAN]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 845, + "content": "[VALUE]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 846, + "content": "[XYZ]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 847, + "content": "[BITS]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 848, + "content": "[CUSPRO]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 849, + "content": "[SUB]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": true, + "special": false + }, + { + "id": 850, + "content": "[CLS]", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + } + ], + "normalizer": { + "type": "BertNormalizer", + "clean_text": true, + "handle_chinese_chars": true, + "strip_accents": null, + "lowercase": false + }, + "pre_tokenizer": { + "type": "BertPreTokenizer" + }, + "post_processor": null, + "decoder": { + "type": "WordPiece", + "prefix": "##", + "cleanup": true + }, + "model": { + "type": "WordPiece", + "unk_token": "[UNK]", + "continuing_subword_prefix": "##", + "max_input_chars_per_word": 100, + "vocab": { + "[PAD]": 0, + "[SOS]": 1, + "[EOS]": 2, + "[UNK]": 3, + "[MASK]": 4, + "#": 5, + "(": 6, + ")": 7, + "+": 8, + "-": 9, + ".": 10, + "/": 11, + "0": 12, + "1": 13, + "2": 14, + "3": 15, + "4": 16, + "5": 17, + "6": 18, + "7": 19, + "8": 20, + "9": 21, + "=": 22, + "@": 23, + "A": 24, + "B": 25, + "C": 26, + "D": 27, + "E": 28, + "F": 29, + "G": 30, + "H": 31, + "I": 32, + "K": 33, + "L": 34, + "M": 35, + "N": 36, + "O": 37, + "P": 38, + "R": 39, + "S": 40, + "T": 41, + "U": 42, + "V": 43, + "W": 44, + "X": 45, + "Y": 46, + "Z": 47, + "[": 48, + "\\": 49, + "]": 50, + "a": 51, + "b": 52, + "c": 53, + "d": 54, + "e": 55, + "f": 56, + "g": 57, + "h": 58, + "i": 59, + "k": 60, + "l": 61, + "m": 62, + "n": 63, + "o": 64, + "p": 65, + "r": 66, + "s": 67, + "t": 68, + "u": 69, + "y": 70 + } + } +} \ No newline at end of file diff --git a/tokenizer_config.json b/tokenizer_config.json new file mode 100644 index 0000000..0a84df5 --- /dev/null +++ b/tokenizer_config.json @@ -0,0 +1,6391 @@ +{ + "added_tokens_decoder": { + "0": { + "content": "[PAD]", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "1": { + "content": "[SOS]", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "2": { + "content": "[EOS]", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "3": { + "content": "[UNK]", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "4": { + "content": "[MASK]", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "9": { + "content": "-", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "10": { + "content": ".", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "12": { + "content": "0", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "13": { + "content": "1", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "14": { + "content": "2", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "15": { + "content": "3", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "16": { + "content": "4", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "17": { + "content": "5", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "18": { + "content": "6", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "19": { + "content": "7", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "20": { + "content": "8", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "21": { + "content": "9", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "71": { + "content": "[QM9:A_RC]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "72": { + "content": "[QM9:B_RC]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "73": { + "content": "[QM9:C_RC]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "74": { + "content": "[QM9:miu_DM]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "75": { + "content": "[QM9:alpha_IP]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "76": { + "content": "[QM9:epsE_HOMO]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "77": { + "content": "[QM9:epsE_LUMO]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "78": { + "content": "[QM9:eps_GAP]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "79": { + "content": "[QM9:R2_ESE]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "80": { + "content": "[QM9:zpve_ZPVE]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "81": { + "content": "[QM9:Uo_IEat0K]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "82": { + "content": "[QM9:U_IEat298.15K]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "83": { + "content": "[QM9:H_Eat298.15K]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "84": { + "content": "[QM9:G_FEat298.15K]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "85": { + "content": "[QM9:Cv_HCat298.15K]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "86": { + "content": "[RDKit:FractionCSP3]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "87": { + "content": "[RDKit:HeavyAtomCount]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "88": { + "content": "[RDKit:NHOHCount]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "89": { + "content": "[RDKit:NOCount]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "90": { + "content": "[RDKit:NumAliphaticCarbocycles]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "91": { + "content": "[RDKit:NumAliphaticHeterocycles]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "92": { + "content": "[RDKit:NumAliphaticRings]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "93": { + "content": "[RDKit:NumAromaticCarbocycles]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "94": { + "content": "[RDKit:NumAromaticHeterocycles]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "95": { + "content": "[RDKit:NumAromaticRings]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "96": { + "content": "[RDKit:NumHAcceptors]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "97": { + "content": "[RDKit:NumHDonors]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "98": { + "content": "[RDKit:NumHeteroatoms]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "99": { + "content": "[RDKit:NumRotatableBonds]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "100": { + "content": "[RDKit:NumSaturatedCarbocycles]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "101": { + "content": "[RDKit:NumSaturatedHeterocycles]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "102": { + "content": "[RDKit:NumSaturatedRings]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "103": { + "content": "[RDKit:RingCount]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "104": { + "content": "[RDKit:AUTOCORR2D_1]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "105": { + "content": "[RDKit:AUTOCORR2D_10]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "106": { + "content": "[RDKit:AUTOCORR2D_100]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "107": { + "content": "[RDKit:AUTOCORR2D_101]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "108": { + "content": "[RDKit:AUTOCORR2D_102]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "109": { + "content": "[RDKit:AUTOCORR2D_103]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "110": { + "content": "[RDKit:AUTOCORR2D_104]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "111": { + "content": "[RDKit:AUTOCORR2D_105]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "112": { + "content": "[RDKit:AUTOCORR2D_106]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "113": { + "content": "[RDKit:AUTOCORR2D_107]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "114": { + "content": "[RDKit:AUTOCORR2D_108]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "115": { + "content": "[RDKit:AUTOCORR2D_109]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "116": { + "content": "[RDKit:AUTOCORR2D_11]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "117": { + "content": "[RDKit:AUTOCORR2D_110]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "118": { + "content": "[RDKit:AUTOCORR2D_111]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "119": { + "content": "[RDKit:AUTOCORR2D_112]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "120": { + "content": "[RDKit:AUTOCORR2D_113]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "121": { + "content": "[RDKit:AUTOCORR2D_114]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "122": { + "content": "[RDKit:AUTOCORR2D_115]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "123": { + "content": "[RDKit:AUTOCORR2D_116]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "124": { + "content": "[RDKit:AUTOCORR2D_117]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "125": { + "content": "[RDKit:AUTOCORR2D_118]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "126": { + "content": "[RDKit:AUTOCORR2D_119]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "127": { + "content": "[RDKit:AUTOCORR2D_12]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "128": { + "content": "[RDKit:AUTOCORR2D_120]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "129": { + "content": "[RDKit:AUTOCORR2D_121]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "130": { + "content": "[RDKit:AUTOCORR2D_122]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "131": { + "content": "[RDKit:AUTOCORR2D_123]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "132": { + "content": "[RDKit:AUTOCORR2D_124]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "133": { + "content": "[RDKit:AUTOCORR2D_125]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "134": { + "content": "[RDKit:AUTOCORR2D_126]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "135": { + "content": "[RDKit:AUTOCORR2D_127]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "136": { + "content": "[RDKit:AUTOCORR2D_128]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "137": { + "content": "[RDKit:AUTOCORR2D_129]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "138": { + "content": "[RDKit:AUTOCORR2D_13]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "139": { + "content": "[RDKit:AUTOCORR2D_130]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "140": { + "content": "[RDKit:AUTOCORR2D_131]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "141": { + "content": "[RDKit:AUTOCORR2D_132]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "142": { + "content": "[RDKit:AUTOCORR2D_133]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "143": { + "content": "[RDKit:AUTOCORR2D_134]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "144": { + "content": "[RDKit:AUTOCORR2D_135]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "145": { + "content": "[RDKit:AUTOCORR2D_136]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "146": { + "content": "[RDKit:AUTOCORR2D_137]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "147": { + "content": "[RDKit:AUTOCORR2D_138]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "148": { + "content": "[RDKit:AUTOCORR2D_139]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "149": { + "content": "[RDKit:AUTOCORR2D_14]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "150": { + "content": "[RDKit:AUTOCORR2D_140]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "151": { + "content": "[RDKit:AUTOCORR2D_141]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "152": { + "content": "[RDKit:AUTOCORR2D_142]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "153": { + "content": "[RDKit:AUTOCORR2D_143]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "154": { + "content": "[RDKit:AUTOCORR2D_144]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "155": { + "content": "[RDKit:AUTOCORR2D_145]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "156": { + "content": "[RDKit:AUTOCORR2D_146]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "157": { + "content": "[RDKit:AUTOCORR2D_147]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "158": { + "content": "[RDKit:AUTOCORR2D_148]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "159": { + "content": "[RDKit:AUTOCORR2D_149]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "160": { + "content": "[RDKit:AUTOCORR2D_15]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "161": { + "content": "[RDKit:AUTOCORR2D_150]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "162": { + "content": "[RDKit:AUTOCORR2D_151]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "163": { + "content": "[RDKit:AUTOCORR2D_152]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "164": { + "content": "[RDKit:AUTOCORR2D_153]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "165": { + "content": "[RDKit:AUTOCORR2D_154]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "166": { + "content": "[RDKit:AUTOCORR2D_155]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "167": { + "content": "[RDKit:AUTOCORR2D_156]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "168": { + "content": "[RDKit:AUTOCORR2D_157]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "169": { + "content": "[RDKit:AUTOCORR2D_158]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "170": { + "content": "[RDKit:AUTOCORR2D_159]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "171": { + "content": "[RDKit:AUTOCORR2D_16]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "172": { + "content": "[RDKit:AUTOCORR2D_160]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "173": { + "content": "[RDKit:AUTOCORR2D_161]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "174": { + "content": "[RDKit:AUTOCORR2D_162]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "175": { + "content": "[RDKit:AUTOCORR2D_163]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "176": { + "content": "[RDKit:AUTOCORR2D_164]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "177": { + "content": "[RDKit:AUTOCORR2D_165]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "178": { + "content": "[RDKit:AUTOCORR2D_166]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "179": { + "content": "[RDKit:AUTOCORR2D_167]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "180": { + "content": "[RDKit:AUTOCORR2D_168]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "181": { + "content": "[RDKit:AUTOCORR2D_169]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "182": { + "content": "[RDKit:AUTOCORR2D_17]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "183": { + "content": "[RDKit:AUTOCORR2D_170]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "184": { + "content": "[RDKit:AUTOCORR2D_171]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "185": { + "content": "[RDKit:AUTOCORR2D_172]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "186": { + "content": "[RDKit:AUTOCORR2D_173]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "187": { + "content": "[RDKit:AUTOCORR2D_174]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "188": { + "content": "[RDKit:AUTOCORR2D_175]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "189": { + "content": "[RDKit:AUTOCORR2D_176]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "190": { + "content": "[RDKit:AUTOCORR2D_177]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "191": { + "content": "[RDKit:AUTOCORR2D_178]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "192": { + "content": "[RDKit:AUTOCORR2D_179]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "193": { + "content": "[RDKit:AUTOCORR2D_18]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "194": { + "content": "[RDKit:AUTOCORR2D_180]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "195": { + "content": "[RDKit:AUTOCORR2D_181]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "196": { + "content": "[RDKit:AUTOCORR2D_182]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "197": { + "content": "[RDKit:AUTOCORR2D_183]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "198": { + "content": "[RDKit:AUTOCORR2D_184]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "199": { + "content": "[RDKit:AUTOCORR2D_185]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "200": { + "content": "[RDKit:AUTOCORR2D_186]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "201": { + "content": "[RDKit:AUTOCORR2D_187]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "202": { + "content": "[RDKit:AUTOCORR2D_188]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "203": { + "content": "[RDKit:AUTOCORR2D_189]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "204": { + "content": "[RDKit:AUTOCORR2D_19]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "205": { + "content": "[RDKit:AUTOCORR2D_190]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "206": { + "content": "[RDKit:AUTOCORR2D_191]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "207": { + "content": "[RDKit:AUTOCORR2D_192]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "208": { + "content": "[RDKit:AUTOCORR2D_2]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "209": { + "content": "[RDKit:AUTOCORR2D_20]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "210": { + "content": "[RDKit:AUTOCORR2D_21]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "211": { + "content": "[RDKit:AUTOCORR2D_22]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "212": { + "content": "[RDKit:AUTOCORR2D_23]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "213": { + "content": "[RDKit:AUTOCORR2D_24]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "214": { + "content": "[RDKit:AUTOCORR2D_25]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "215": { + "content": "[RDKit:AUTOCORR2D_26]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "216": { + "content": "[RDKit:AUTOCORR2D_27]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "217": { + "content": "[RDKit:AUTOCORR2D_28]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "218": { + "content": "[RDKit:AUTOCORR2D_29]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "219": { + "content": "[RDKit:AUTOCORR2D_3]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "220": { + "content": "[RDKit:AUTOCORR2D_30]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "221": { + "content": "[RDKit:AUTOCORR2D_31]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "222": { + "content": "[RDKit:AUTOCORR2D_32]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "223": { + "content": "[RDKit:AUTOCORR2D_33]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "224": { + "content": "[RDKit:AUTOCORR2D_34]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "225": { + "content": "[RDKit:AUTOCORR2D_35]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "226": { + "content": "[RDKit:AUTOCORR2D_36]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "227": { + "content": "[RDKit:AUTOCORR2D_37]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "228": { + "content": "[RDKit:AUTOCORR2D_38]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "229": { + "content": "[RDKit:AUTOCORR2D_39]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "230": { + "content": "[RDKit:AUTOCORR2D_4]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "231": { + "content": "[RDKit:AUTOCORR2D_40]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "232": { + "content": "[RDKit:AUTOCORR2D_41]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "233": { + "content": "[RDKit:AUTOCORR2D_42]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "234": { + "content": "[RDKit:AUTOCORR2D_43]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "235": { + "content": "[RDKit:AUTOCORR2D_44]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "236": { + "content": "[RDKit:AUTOCORR2D_45]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "237": { + "content": "[RDKit:AUTOCORR2D_46]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "238": { + "content": "[RDKit:AUTOCORR2D_47]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "239": { + "content": "[RDKit:AUTOCORR2D_48]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "240": { + "content": "[RDKit:AUTOCORR2D_49]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "241": { + "content": "[RDKit:AUTOCORR2D_5]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "242": { + "content": "[RDKit:AUTOCORR2D_50]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "243": { + "content": "[RDKit:AUTOCORR2D_51]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "244": { + "content": "[RDKit:AUTOCORR2D_52]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "245": { + "content": "[RDKit:AUTOCORR2D_53]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "246": { + "content": "[RDKit:AUTOCORR2D_54]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "247": { + "content": "[RDKit:AUTOCORR2D_55]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "248": { + "content": "[RDKit:AUTOCORR2D_56]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "249": { + "content": "[RDKit:AUTOCORR2D_57]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "250": { + "content": "[RDKit:AUTOCORR2D_58]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "251": { + "content": "[RDKit:AUTOCORR2D_59]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "252": { + "content": "[RDKit:AUTOCORR2D_6]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "253": { + "content": "[RDKit:AUTOCORR2D_60]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "254": { + "content": "[RDKit:AUTOCORR2D_61]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "255": { + "content": "[RDKit:AUTOCORR2D_62]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "256": { + "content": "[RDKit:AUTOCORR2D_63]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "257": { + "content": "[RDKit:AUTOCORR2D_64]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "258": { + "content": "[RDKit:AUTOCORR2D_65]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "259": { + "content": "[RDKit:AUTOCORR2D_66]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "260": { + "content": "[RDKit:AUTOCORR2D_67]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "261": { + "content": "[RDKit:AUTOCORR2D_68]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "262": { + "content": "[RDKit:AUTOCORR2D_69]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "263": { + "content": "[RDKit:AUTOCORR2D_7]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "264": { + "content": "[RDKit:AUTOCORR2D_70]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "265": { + "content": "[RDKit:AUTOCORR2D_71]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "266": { + "content": "[RDKit:AUTOCORR2D_72]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "267": { + "content": "[RDKit:AUTOCORR2D_73]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "268": { + "content": "[RDKit:AUTOCORR2D_74]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "269": { + "content": "[RDKit:AUTOCORR2D_75]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "270": { + "content": "[RDKit:AUTOCORR2D_76]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "271": { + "content": "[RDKit:AUTOCORR2D_77]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "272": { + "content": "[RDKit:AUTOCORR2D_78]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "273": { + "content": "[RDKit:AUTOCORR2D_79]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "274": { + "content": "[RDKit:AUTOCORR2D_8]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "275": { + "content": "[RDKit:AUTOCORR2D_80]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "276": { + "content": "[RDKit:AUTOCORR2D_81]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "277": { + "content": "[RDKit:AUTOCORR2D_82]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "278": { + "content": "[RDKit:AUTOCORR2D_83]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "279": { + "content": "[RDKit:AUTOCORR2D_84]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "280": { + "content": "[RDKit:AUTOCORR2D_85]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "281": { + "content": "[RDKit:AUTOCORR2D_86]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "282": { + "content": "[RDKit:AUTOCORR2D_87]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "283": { + "content": "[RDKit:AUTOCORR2D_88]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "284": { + "content": "[RDKit:AUTOCORR2D_89]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "285": { + "content": "[RDKit:AUTOCORR2D_9]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "286": { + "content": "[RDKit:AUTOCORR2D_90]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "287": { + "content": "[RDKit:AUTOCORR2D_91]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "288": { + "content": "[RDKit:AUTOCORR2D_92]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "289": { + "content": "[RDKit:AUTOCORR2D_93]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "290": { + "content": "[RDKit:AUTOCORR2D_94]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "291": { + "content": "[RDKit:AUTOCORR2D_95]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "292": { + "content": "[RDKit:AUTOCORR2D_96]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "293": { + "content": "[RDKit:AUTOCORR2D_97]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "294": { + "content": "[RDKit:AUTOCORR2D_98]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "295": { + "content": "[RDKit:AUTOCORR2D_99]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "296": { + "content": "[RDKit:AvgIpc]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "297": { + "content": "[RDKit:BCUT2D_CHGHI]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "298": { + "content": "[RDKit:BCUT2D_CHGLO]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "299": { + "content": "[RDKit:BCUT2D_LOGPHI]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "300": { + "content": "[RDKit:BCUT2D_LOGPLOW]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "301": { + "content": "[RDKit:BCUT2D_MRHI]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "302": { + "content": "[RDKit:BCUT2D_MRLOW]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "303": { + "content": "[RDKit:BCUT2D_MWHI]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "304": { + "content": "[RDKit:BCUT2D_MWLOW]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "305": { + "content": "[RDKit:BalabanJ]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "306": { + "content": "[RDKit:BertzCT]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "307": { + "content": "[RDKit:Chi0]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "308": { + "content": "[RDKit:Chi0n]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "309": { + "content": "[RDKit:Chi0v]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "310": { + "content": "[RDKit:Chi1]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "311": { + "content": "[RDKit:Chi1n]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "312": { + "content": "[RDKit:Chi1v]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "313": { + "content": "[RDKit:Chi2n]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "314": { + "content": "[RDKit:Chi2v]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "315": { + "content": "[RDKit:Chi3n]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "316": { + "content": "[RDKit:Chi3v]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "317": { + "content": "[RDKit:Chi4n]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "318": { + "content": "[RDKit:Chi4v]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "319": { + "content": "[RDKit:EState_VSA1]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "320": { + "content": "[RDKit:EState_VSA10]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "321": { + "content": "[RDKit:EState_VSA11]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "322": { + "content": "[RDKit:EState_VSA2]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "323": { + "content": "[RDKit:EState_VSA3]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "324": { + "content": "[RDKit:EState_VSA4]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "325": { + "content": "[RDKit:EState_VSA5]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "326": { + "content": "[RDKit:EState_VSA6]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "327": { + "content": "[RDKit:EState_VSA7]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "328": { + "content": "[RDKit:EState_VSA8]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "329": { + "content": "[RDKit:EState_VSA9]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "330": { + "content": "[RDKit:ExactMolWt]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "331": { + "content": "[RDKit:FpDensityMorgan1]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "332": { + "content": "[RDKit:FpDensityMorgan2]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "333": { + "content": "[RDKit:FpDensityMorgan3]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "334": { + "content": "[RDKit:HallKierAlpha]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "335": { + "content": "[RDKit:HeavyAtomMolWt]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "336": { + "content": "[RDKit:Ipc]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "337": { + "content": "[RDKit:Kappa1]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "338": { + "content": "[RDKit:Kappa2]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "339": { + "content": "[RDKit:Kappa3]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "340": { + "content": "[RDKit:LabuteASA]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "341": { + "content": "[RDKit:MaxAbsEStateIndex]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "342": { + "content": "[RDKit:MaxAbsPartialCharge]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "343": { + "content": "[RDKit:MaxEStateIndex]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "344": { + "content": "[RDKit:MaxPartialCharge]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "345": { + "content": "[RDKit:MinAbsEStateIndex]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "346": { + "content": "[RDKit:MinAbsPartialCharge]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "347": { + "content": "[RDKit:MinEStateIndex]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "348": { + "content": "[RDKit:MinPartialCharge]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "349": { + "content": "[RDKit:MolLogP]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "350": { + "content": "[RDKit:MolMR]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "351": { + "content": "[RDKit:MolWt]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "352": { + "content": "[RDKit:NumRadicalElectrons]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "353": { + "content": "[RDKit:NumValenceElectrons]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "354": { + "content": "[RDKit:PEOE_VSA1]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "355": { + "content": "[RDKit:PEOE_VSA10]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "356": { + "content": "[RDKit:PEOE_VSA11]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "357": { + "content": "[RDKit:PEOE_VSA12]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "358": { + "content": "[RDKit:PEOE_VSA13]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "359": { + "content": "[RDKit:PEOE_VSA14]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "360": { + "content": "[RDKit:PEOE_VSA2]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "361": { + "content": "[RDKit:PEOE_VSA3]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "362": { + "content": "[RDKit:PEOE_VSA4]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "363": { + "content": "[RDKit:PEOE_VSA5]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "364": { + "content": "[RDKit:PEOE_VSA6]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "365": { + "content": "[RDKit:PEOE_VSA7]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "366": { + "content": "[RDKit:PEOE_VSA8]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "367": { + "content": "[RDKit:PEOE_VSA9]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "368": { + "content": "[RDKit:SMR_VSA1]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "369": { + "content": "[RDKit:SMR_VSA10]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "370": { + "content": "[RDKit:SMR_VSA2]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "371": { + "content": "[RDKit:SMR_VSA3]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "372": { + "content": "[RDKit:SMR_VSA4]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "373": { + "content": "[RDKit:SMR_VSA5]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "374": { + "content": "[RDKit:SMR_VSA6]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "375": { + "content": "[RDKit:SMR_VSA7]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "376": { + "content": "[RDKit:SMR_VSA8]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "377": { + "content": "[RDKit:SMR_VSA9]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "378": { + "content": "[RDKit:SPS]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "379": { + "content": "[RDKit:SlogP_VSA1]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "380": { + "content": "[RDKit:SlogP_VSA10]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "381": { + "content": "[RDKit:SlogP_VSA11]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "382": { + "content": "[RDKit:SlogP_VSA12]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "383": { + "content": "[RDKit:SlogP_VSA2]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "384": { + "content": "[RDKit:SlogP_VSA3]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "385": { + "content": "[RDKit:SlogP_VSA4]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "386": { + "content": "[RDKit:SlogP_VSA5]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "387": { + "content": "[RDKit:SlogP_VSA6]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "388": { + "content": "[RDKit:SlogP_VSA7]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "389": { + "content": "[RDKit:SlogP_VSA8]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "390": { + "content": "[RDKit:SlogP_VSA9]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "391": { + "content": "[RDKit:TPSA]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "392": { + "content": "[RDKit:VSA_EState1]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "393": { + "content": "[RDKit:VSA_EState10]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "394": { + "content": "[RDKit:VSA_EState2]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "395": { + "content": "[RDKit:VSA_EState3]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "396": { + "content": "[RDKit:VSA_EState4]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "397": { + "content": "[RDKit:VSA_EState5]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "398": { + "content": "[RDKit:VSA_EState6]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "399": { + "content": "[RDKit:VSA_EState7]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "400": { + "content": "[RDKit:VSA_EState8]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "401": { + "content": "[RDKit:VSA_EState9]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "402": { + "content": "[RDKit:fr_Al_COO]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "403": { + "content": "[RDKit:fr_Al_OH]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "404": { + "content": "[RDKit:fr_Al_OH_noTert]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "405": { + "content": "[RDKit:fr_ArN]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "406": { + "content": "[RDKit:fr_Ar_COO]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "407": { + "content": "[RDKit:fr_Ar_N]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "408": { + "content": "[RDKit:fr_Ar_NH]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "409": { + "content": "[RDKit:fr_Ar_OH]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "410": { + "content": "[RDKit:fr_COO]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "411": { + "content": "[RDKit:fr_COO2]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "412": { + "content": "[RDKit:fr_C_O]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "413": { + "content": "[RDKit:fr_C_O_noCOO]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "414": { + "content": "[RDKit:fr_C_S]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "415": { + "content": "[RDKit:fr_HOCCN]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "416": { + "content": "[RDKit:fr_Imine]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "417": { + "content": "[RDKit:fr_NH0]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "418": { + "content": "[RDKit:fr_NH1]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "419": { + "content": "[RDKit:fr_NH2]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "420": { + "content": "[RDKit:fr_N_O]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "421": { + "content": "[RDKit:fr_Ndealkylation1]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "422": { + "content": "[RDKit:fr_Ndealkylation2]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "423": { + "content": "[RDKit:fr_Nhpyrrole]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "424": { + "content": "[RDKit:fr_SH]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "425": { + "content": "[RDKit:fr_aldehyde]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "426": { + "content": "[RDKit:fr_alkyl_carbamate]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "427": { + "content": "[RDKit:fr_alkyl_halide]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "428": { + "content": "[RDKit:fr_allylic_oxid]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "429": { + "content": "[RDKit:fr_amide]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "430": { + "content": "[RDKit:fr_amidine]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "431": { + "content": "[RDKit:fr_aniline]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "432": { + "content": "[RDKit:fr_aryl_methyl]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "433": { + "content": "[RDKit:fr_azide]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "434": { + "content": "[RDKit:fr_azo]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "435": { + "content": "[RDKit:fr_barbitur]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "436": { + "content": "[RDKit:fr_benzene]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "437": { + "content": "[RDKit:fr_benzodiazepine]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "438": { + "content": "[RDKit:fr_bicyclic]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "439": { + "content": "[RDKit:fr_diazo]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "440": { + "content": "[RDKit:fr_dihydropyridine]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "441": { + "content": "[RDKit:fr_epoxide]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "442": { + "content": "[RDKit:fr_ester]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "443": { + "content": "[RDKit:fr_ether]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "444": { + "content": "[RDKit:fr_furan]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "445": { + "content": "[RDKit:fr_guanido]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "446": { + "content": "[RDKit:fr_halogen]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "447": { + "content": "[RDKit:fr_hdrzine]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "448": { + "content": "[RDKit:fr_hdrzone]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "449": { + "content": "[RDKit:fr_imidazole]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "450": { + "content": "[RDKit:fr_imide]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "451": { + "content": "[RDKit:fr_isocyan]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "452": { + "content": "[RDKit:fr_isothiocyan]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "453": { + "content": "[RDKit:fr_ketone]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "454": { + "content": "[RDKit:fr_ketone_Topliss]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "455": { + "content": "[RDKit:fr_lactam]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "456": { + "content": "[RDKit:fr_lactone]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "457": { + "content": "[RDKit:fr_methoxy]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "458": { + "content": "[RDKit:fr_morpholine]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "459": { + "content": "[RDKit:fr_nitrile]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "460": { + "content": "[RDKit:fr_nitro]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "461": { + "content": "[RDKit:fr_nitro_arom]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "462": { + "content": "[RDKit:fr_nitro_arom_nonortho]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "463": { + "content": "[RDKit:fr_nitroso]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "464": { + "content": "[RDKit:fr_oxazole]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "465": { + "content": "[RDKit:fr_oxime]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "466": { + "content": "[RDKit:fr_para_hydroxylation]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "467": { + "content": "[RDKit:fr_phenol]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "468": { + "content": "[RDKit:fr_phenol_noOrthoHbond]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "469": { + "content": "[RDKit:fr_phos_acid]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "470": { + "content": "[RDKit:fr_phos_ester]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "471": { + "content": "[RDKit:fr_piperdine]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "472": { + "content": "[RDKit:fr_piperzine]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "473": { + "content": "[RDKit:fr_priamide]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "474": { + "content": "[RDKit:fr_prisulfonamd]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "475": { + "content": "[RDKit:fr_pyridine]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "476": { + "content": "[RDKit:fr_quatN]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "477": { + "content": "[RDKit:fr_sulfide]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "478": { + "content": "[RDKit:fr_sulfonamd]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "479": { + "content": "[RDKit:fr_sulfone]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "480": { + "content": "[RDKit:fr_term_acetylene]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "481": { + "content": "[RDKit:fr_tetrazole]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "482": { + "content": "[RDKit:fr_thiazole]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "483": { + "content": "[RDKit:fr_thiocyan]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "484": { + "content": "[RDKit:fr_thiophene]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "485": { + "content": "[RDKit:fr_unbrch_alkane]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "486": { + "content": "[RDKit:fr_urea]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "487": { + "content": "[RDKit:qed]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "488": { + "content": ";", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "489": { + "content": ",", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "490": { + "content": "[sMLM_smi]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "491": { + "content": "[sMLM_pro]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "492": { + "content": "[sMLM_val]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "493": { + "content": "[mMLM]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "494": { + "content": "[sPLM_smi]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "495": { + "content": "[sPLM_pro_val]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "496": { + "content": "[mPLM]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "497": { + "content": "[sPPLM_smi]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "498": { + "content": "[sPPLM_pro_val]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "499": { + "content": "[mPPLM]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "500": { + "content": "[sGLM_smi]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "501": { + "content": "[sGLM_pro]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "502": { + "content": "[sGLM_val]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "503": { + "content": "[mGLM_pro_val]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "504": { + "content": "[sPGLM_smi]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "505": { + "content": "[sPGLM_pro]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "506": { + "content": "[sPGLM_val]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "507": { + "content": "[mPGLM_smi_pro]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "508": { + "content": "[mPGLM_smi_val]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "509": { + "content": "[sPPM]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "510": { + "content": "[mPPM]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "511": { + "content": "[SPM_DDD]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "512": { + "content": "[SPM_AAD]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "513": { + "content": "[SPM_XYZ]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "514": { + "content": "[sMLM_smi(PAIR)]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "515": { + "content": "[sMLM_pro(PAIR)]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "516": { + "content": "[sMLM_val(PAIR)]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "517": { + "content": "[mMLM(PAIR)]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "518": { + "content": "[sPLM_smi(PAIR)]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "519": { + "content": "[sPLM_pro_val(PAIR)]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "520": { + "content": "[mPLM(PAIR)]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "521": { + "content": "[sPPLM_smi(PAIR)]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "522": { + "content": "[sPPLM_pro_val(PAIR)]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "523": { + "content": "[mPPLM(PAIR)]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "524": { + "content": "[sGLM_smi(PAIR)]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "525": { + "content": "[sGLM_pro(PAIR)]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "526": { + "content": "[sGLM_val(PAIR)]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "527": { + "content": "[mGLM_pro_val(PAIR)]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "528": { + "content": "[sPGLM_smi(PAIR)]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "529": { + "content": "[sPGLM_pro(PAIR)]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "530": { + "content": "[sPGLM_val(PAIR)]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "531": { + "content": "[mPGLM_smi_pro(PAIR)]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "532": { + "content": "[mPGLM_smi_val(PAIR)]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "533": { + "content": "[sPPM(PAIR)]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "534": { + "content": "[mPPM(PAIR)]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "535": { + "content": "[SPM_DDD(PAIR)]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "536": { + "content": "[SPM_AAD(PAIR)]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "537": { + "content": "[SPM_XYZ(PAIR)]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "538": { + "content": "[(DDD)ATOM:Ac]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "539": { + "content": "[(DDD)ATOM:Ag]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "540": { + "content": "[(DDD)ATOM:Al]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "541": { + "content": "[(DDD)ATOM:Am]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "542": { + "content": "[(DDD)ATOM:Ar]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "543": { + "content": "[(DDD)ATOM:As]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "544": { + "content": "[(DDD)ATOM:At]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "545": { + "content": "[(DDD)ATOM:Au]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "546": { + "content": "[(DDD)ATOM:B]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "547": { + "content": "[(DDD)ATOM:Ba]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "548": { + "content": "[(DDD)ATOM:Be]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "549": { + "content": "[(DDD)ATOM:Bi]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "550": { + "content": "[(DDD)ATOM:Bk]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "551": { + "content": "[(DDD)ATOM:Br]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "552": { + "content": "[(DDD)ATOM:C]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "553": { + "content": "[(DDD)ATOM:Ca]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "554": { + "content": "[(DDD)ATOM:Cd]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "555": { + "content": "[(DDD)ATOM:Ce]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "556": { + "content": "[(DDD)ATOM:Cf]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "557": { + "content": "[(DDD)ATOM:Cl]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "558": { + "content": "[(DDD)ATOM:Cm]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "559": { + "content": "[(DDD)ATOM:Co]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "560": { + "content": "[(DDD)ATOM:Cr]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "561": { + "content": "[(DDD)ATOM:Cs]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "562": { + "content": "[(DDD)ATOM:Cu]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "563": { + "content": "[(DDD)ATOM:Dy]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "564": { + "content": "[(DDD)ATOM:Er]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "565": { + "content": "[(DDD)ATOM:Es]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "566": { + "content": "[(DDD)ATOM:Eu]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "567": { + "content": "[(DDD)ATOM:F]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "568": { + "content": "[(DDD)ATOM:Fe]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "569": { + "content": "[(DDD)ATOM:Fm]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "570": { + "content": "[(DDD)ATOM:Ga]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "571": { + "content": "[(DDD)ATOM:Gd]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "572": { + "content": "[(DDD)ATOM:Ge]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "573": { + "content": "[(DDD)ATOM:He]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "574": { + "content": "[(DDD)ATOM:Hf]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "575": { + "content": "[(DDD)ATOM:Hg]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "576": { + "content": "[(DDD)ATOM:Ho]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "577": { + "content": "[(DDD)ATOM:I]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "578": { + "content": "[(DDD)ATOM:In]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "579": { + "content": "[(DDD)ATOM:Ir]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "580": { + "content": "[(DDD)ATOM:K]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "581": { + "content": "[(DDD)ATOM:Kr]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "582": { + "content": "[(DDD)ATOM:La]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "583": { + "content": "[(DDD)ATOM:Li]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "584": { + "content": "[(DDD)ATOM:Lr]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "585": { + "content": "[(DDD)ATOM:Lu]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "586": { + "content": "[(DDD)ATOM:Md]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "587": { + "content": "[(DDD)ATOM:Mg]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "588": { + "content": "[(DDD)ATOM:Mn]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "589": { + "content": "[(DDD)ATOM:Mo]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "590": { + "content": "[(DDD)ATOM:N]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "591": { + "content": "[(DDD)ATOM:Na]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "592": { + "content": "[(DDD)ATOM:Nb]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "593": { + "content": "[(DDD)ATOM:Nd]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "594": { + "content": "[(DDD)ATOM:Ne]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "595": { + "content": "[(DDD)ATOM:Ni]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "596": { + "content": "[(DDD)ATOM:No]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "597": { + "content": "[(DDD)ATOM:Np]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "598": { + "content": "[(DDD)ATOM:O]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "599": { + "content": "[(DDD)ATOM:Os]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "600": { + "content": "[(DDD)ATOM:P]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "601": { + "content": "[(DDD)ATOM:Pa]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "602": { + "content": "[(DDD)ATOM:Pb]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "603": { + "content": "[(DDD)ATOM:Pd]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "604": { + "content": "[(DDD)ATOM:Pm]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "605": { + "content": "[(DDD)ATOM:Po]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "606": { + "content": "[(DDD)ATOM:Pr]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "607": { + "content": "[(DDD)ATOM:Pt]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "608": { + "content": "[(DDD)ATOM:Pu]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "609": { + "content": "[(DDD)ATOM:Rb]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "610": { + "content": "[(DDD)ATOM:Re]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "611": { + "content": "[(DDD)ATOM:Rh]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "612": { + "content": "[(DDD)ATOM:Rn]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "613": { + "content": "[(DDD)ATOM:Ru]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "614": { + "content": "[(DDD)ATOM:S]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "615": { + "content": "[(DDD)ATOM:Sb]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "616": { + "content": "[(DDD)ATOM:Sc]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "617": { + "content": "[(DDD)ATOM:Se]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "618": { + "content": "[(DDD)ATOM:Si]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "619": { + "content": "[(DDD)ATOM:Sm]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "620": { + "content": "[(DDD)ATOM:Sn]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "621": { + "content": "[(DDD)ATOM:Sr]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "622": { + "content": "[(DDD)ATOM:Ta]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "623": { + "content": "[(DDD)ATOM:Tb]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "624": { + "content": "[(DDD)ATOM:Tc]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "625": { + "content": "[(DDD)ATOM:Te]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "626": { + "content": "[(DDD)ATOM:Th]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "627": { + "content": "[(DDD)ATOM:Ti]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "628": { + "content": "[(DDD)ATOM:Tl]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "629": { + "content": "[(DDD)ATOM:Tm]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "630": { + "content": "[(DDD)ATOM:U]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "631": { + "content": "[(DDD)ATOM:V]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "632": { + "content": "[(DDD)ATOM:W]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "633": { + "content": "[(DDD)ATOM:Xe]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "634": { + "content": "[(DDD)ATOM:Y]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "635": { + "content": "[(DDD)ATOM:Yb]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "636": { + "content": "[(DDD)ATOM:Zn]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "637": { + "content": "[(DDD)ATOM:Zr]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "638": { + "content": "[(AAD)ATOM:Ac]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "639": { + "content": "[(AAD)ATOM:Ag]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "640": { + "content": "[(AAD)ATOM:Al]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "641": { + "content": "[(AAD)ATOM:Am]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "642": { + "content": "[(AAD)ATOM:Ar]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "643": { + "content": "[(AAD)ATOM:As]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "644": { + "content": "[(AAD)ATOM:At]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "645": { + "content": "[(AAD)ATOM:Au]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "646": { + "content": "[(AAD)ATOM:B]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "647": { + "content": "[(AAD)ATOM:Ba]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "648": { + "content": "[(AAD)ATOM:Be]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "649": { + "content": "[(AAD)ATOM:Bi]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "650": { + "content": "[(AAD)ATOM:Bk]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "651": { + "content": "[(AAD)ATOM:Br]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "652": { + "content": "[(AAD)ATOM:C]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "653": { + "content": "[(AAD)ATOM:Ca]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "654": { + "content": "[(AAD)ATOM:Cd]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "655": { + "content": "[(AAD)ATOM:Ce]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "656": { + "content": "[(AAD)ATOM:Cf]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "657": { + "content": "[(AAD)ATOM:Cl]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "658": { + "content": "[(AAD)ATOM:Cm]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "659": { + "content": "[(AAD)ATOM:Co]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "660": { + "content": "[(AAD)ATOM:Cr]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "661": { + "content": "[(AAD)ATOM:Cs]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "662": { + "content": "[(AAD)ATOM:Cu]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "663": { + "content": "[(AAD)ATOM:Dy]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "664": { + "content": "[(AAD)ATOM:Er]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "665": { + "content": "[(AAD)ATOM:Es]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "666": { + "content": "[(AAD)ATOM:Eu]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "667": { + "content": "[(AAD)ATOM:F]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "668": { + "content": "[(AAD)ATOM:Fe]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "669": { + "content": "[(AAD)ATOM:Fm]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "670": { + "content": "[(AAD)ATOM:Ga]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "671": { + "content": "[(AAD)ATOM:Gd]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "672": { + "content": "[(AAD)ATOM:Ge]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "673": { + "content": "[(AAD)ATOM:He]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "674": { + "content": "[(AAD)ATOM:Hf]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "675": { + "content": "[(AAD)ATOM:Hg]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "676": { + "content": "[(AAD)ATOM:Ho]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "677": { + "content": "[(AAD)ATOM:I]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "678": { + "content": "[(AAD)ATOM:In]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "679": { + "content": "[(AAD)ATOM:Ir]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "680": { + "content": "[(AAD)ATOM:K]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "681": { + "content": "[(AAD)ATOM:Kr]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "682": { + "content": "[(AAD)ATOM:La]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "683": { + "content": "[(AAD)ATOM:Li]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "684": { + "content": "[(AAD)ATOM:Lr]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "685": { + "content": "[(AAD)ATOM:Lu]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "686": { + "content": "[(AAD)ATOM:Md]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "687": { + "content": "[(AAD)ATOM:Mg]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "688": { + "content": "[(AAD)ATOM:Mn]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "689": { + "content": "[(AAD)ATOM:Mo]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "690": { + "content": "[(AAD)ATOM:N]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "691": { + "content": "[(AAD)ATOM:Na]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "692": { + "content": "[(AAD)ATOM:Nb]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "693": { + "content": "[(AAD)ATOM:Nd]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "694": { + "content": "[(AAD)ATOM:Ne]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "695": { + "content": "[(AAD)ATOM:Ni]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "696": { + "content": "[(AAD)ATOM:No]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "697": { + "content": "[(AAD)ATOM:Np]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "698": { + "content": "[(AAD)ATOM:O]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "699": { + "content": "[(AAD)ATOM:Os]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "700": { + "content": "[(AAD)ATOM:P]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "701": { + "content": "[(AAD)ATOM:Pa]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "702": { + "content": "[(AAD)ATOM:Pb]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "703": { + "content": "[(AAD)ATOM:Pd]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "704": { + "content": "[(AAD)ATOM:Pm]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "705": { + "content": "[(AAD)ATOM:Po]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "706": { + "content": "[(AAD)ATOM:Pr]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "707": { + "content": "[(AAD)ATOM:Pt]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "708": { + "content": "[(AAD)ATOM:Pu]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "709": { + "content": "[(AAD)ATOM:Rb]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "710": { + "content": "[(AAD)ATOM:Re]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "711": { + "content": "[(AAD)ATOM:Rh]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "712": { + "content": "[(AAD)ATOM:Rn]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "713": { + "content": "[(AAD)ATOM:Ru]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "714": { + "content": "[(AAD)ATOM:S]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "715": { + "content": "[(AAD)ATOM:Sb]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "716": { + "content": "[(AAD)ATOM:Sc]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "717": { + "content": "[(AAD)ATOM:Se]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "718": { + "content": "[(AAD)ATOM:Si]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "719": { + "content": "[(AAD)ATOM:Sm]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "720": { + "content": "[(AAD)ATOM:Sn]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "721": { + "content": "[(AAD)ATOM:Sr]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "722": { + "content": "[(AAD)ATOM:Ta]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "723": { + "content": "[(AAD)ATOM:Tb]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "724": { + "content": "[(AAD)ATOM:Tc]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "725": { + "content": "[(AAD)ATOM:Te]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "726": { + "content": "[(AAD)ATOM:Th]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "727": { + "content": "[(AAD)ATOM:Ti]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "728": { + "content": "[(AAD)ATOM:Tl]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "729": { + "content": "[(AAD)ATOM:Tm]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "730": { + "content": "[(AAD)ATOM:U]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "731": { + "content": "[(AAD)ATOM:V]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "732": { + "content": "[(AAD)ATOM:W]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "733": { + "content": "[(AAD)ATOM:Xe]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "734": { + "content": "[(AAD)ATOM:Y]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "735": { + "content": "[(AAD)ATOM:Yb]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "736": { + "content": "[(AAD)ATOM:Zn]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "737": { + "content": "[(AAD)ATOM:Zr]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "738": { + "content": "[(XYZ)ATOM:Ac]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "739": { + "content": "[(XYZ)ATOM:Ag]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "740": { + "content": "[(XYZ)ATOM:Al]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "741": { + "content": "[(XYZ)ATOM:Am]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "742": { + "content": "[(XYZ)ATOM:Ar]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "743": { + "content": "[(XYZ)ATOM:As]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "744": { + "content": "[(XYZ)ATOM:At]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "745": { + "content": "[(XYZ)ATOM:Au]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "746": { + "content": "[(XYZ)ATOM:B]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "747": { + "content": "[(XYZ)ATOM:Ba]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "748": { + "content": "[(XYZ)ATOM:Be]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "749": { + "content": "[(XYZ)ATOM:Bi]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "750": { + "content": "[(XYZ)ATOM:Bk]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "751": { + "content": "[(XYZ)ATOM:Br]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "752": { + "content": "[(XYZ)ATOM:C]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "753": { + "content": "[(XYZ)ATOM:Ca]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "754": { + "content": "[(XYZ)ATOM:Cd]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "755": { + "content": "[(XYZ)ATOM:Ce]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "756": { + "content": "[(XYZ)ATOM:Cf]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "757": { + "content": "[(XYZ)ATOM:Cl]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "758": { + "content": "[(XYZ)ATOM:Cm]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "759": { + "content": "[(XYZ)ATOM:Co]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "760": { + "content": "[(XYZ)ATOM:Cr]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "761": { + "content": "[(XYZ)ATOM:Cs]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "762": { + "content": "[(XYZ)ATOM:Cu]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "763": { + "content": "[(XYZ)ATOM:Dy]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "764": { + "content": "[(XYZ)ATOM:Er]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "765": { + "content": "[(XYZ)ATOM:Es]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "766": { + "content": "[(XYZ)ATOM:Eu]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "767": { + "content": "[(XYZ)ATOM:F]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "768": { + "content": "[(XYZ)ATOM:Fe]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "769": { + "content": "[(XYZ)ATOM:Fm]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "770": { + "content": "[(XYZ)ATOM:Ga]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "771": { + "content": "[(XYZ)ATOM:Gd]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "772": { + "content": "[(XYZ)ATOM:Ge]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "773": { + "content": "[(XYZ)ATOM:He]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "774": { + "content": "[(XYZ)ATOM:Hf]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "775": { + "content": "[(XYZ)ATOM:Hg]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "776": { + "content": "[(XYZ)ATOM:Ho]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "777": { + "content": "[(XYZ)ATOM:I]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "778": { + "content": "[(XYZ)ATOM:In]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "779": { + "content": "[(XYZ)ATOM:Ir]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "780": { + "content": "[(XYZ)ATOM:K]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "781": { + "content": "[(XYZ)ATOM:Kr]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "782": { + "content": "[(XYZ)ATOM:La]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "783": { + "content": "[(XYZ)ATOM:Li]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "784": { + "content": "[(XYZ)ATOM:Lr]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "785": { + "content": "[(XYZ)ATOM:Lu]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "786": { + "content": "[(XYZ)ATOM:Md]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "787": { + "content": "[(XYZ)ATOM:Mg]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "788": { + "content": "[(XYZ)ATOM:Mn]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "789": { + "content": "[(XYZ)ATOM:Mo]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "790": { + "content": "[(XYZ)ATOM:N]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "791": { + "content": "[(XYZ)ATOM:Na]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "792": { + "content": "[(XYZ)ATOM:Nb]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "793": { + "content": "[(XYZ)ATOM:Nd]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "794": { + "content": "[(XYZ)ATOM:Ne]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "795": { + "content": "[(XYZ)ATOM:Ni]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "796": { + "content": "[(XYZ)ATOM:No]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "797": { + "content": "[(XYZ)ATOM:Np]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "798": { + "content": "[(XYZ)ATOM:O]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "799": { + "content": "[(XYZ)ATOM:Os]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "800": { + "content": "[(XYZ)ATOM:P]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "801": { + "content": "[(XYZ)ATOM:Pa]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "802": { + "content": "[(XYZ)ATOM:Pb]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "803": { + "content": "[(XYZ)ATOM:Pd]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "804": { + "content": "[(XYZ)ATOM:Pm]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "805": { + "content": "[(XYZ)ATOM:Po]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "806": { + "content": "[(XYZ)ATOM:Pr]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "807": { + "content": "[(XYZ)ATOM:Pt]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "808": { + "content": "[(XYZ)ATOM:Pu]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "809": { + "content": "[(XYZ)ATOM:Rb]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "810": { + "content": "[(XYZ)ATOM:Re]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "811": { + "content": "[(XYZ)ATOM:Rh]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "812": { + "content": "[(XYZ)ATOM:Rn]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "813": { + "content": "[(XYZ)ATOM:Ru]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "814": { + "content": "[(XYZ)ATOM:S]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "815": { + "content": "[(XYZ)ATOM:Sb]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "816": { + "content": "[(XYZ)ATOM:Sc]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "817": { + "content": "[(XYZ)ATOM:Se]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "818": { + "content": "[(XYZ)ATOM:Si]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "819": { + "content": "[(XYZ)ATOM:Sm]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "820": { + "content": "[(XYZ)ATOM:Sn]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "821": { + "content": "[(XYZ)ATOM:Sr]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "822": { + "content": "[(XYZ)ATOM:Ta]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "823": { + "content": "[(XYZ)ATOM:Tb]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "824": { + "content": "[(XYZ)ATOM:Tc]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "825": { + "content": "[(XYZ)ATOM:Te]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "826": { + "content": "[(XYZ)ATOM:Th]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "827": { + "content": "[(XYZ)ATOM:Ti]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "828": { + "content": "[(XYZ)ATOM:Tl]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "829": { + "content": "[(XYZ)ATOM:Tm]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "830": { + "content": "[(XYZ)ATOM:U]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "831": { + "content": "[(XYZ)ATOM:V]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "832": { + "content": "[(XYZ)ATOM:W]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "833": { + "content": "[(XYZ)ATOM:Xe]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "834": { + "content": "[(XYZ)ATOM:Y]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "835": { + "content": "[(XYZ)ATOM:Yb]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "836": { + "content": "[(XYZ)ATOM:Zn]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "837": { + "content": "[(XYZ)ATOM:Zr]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "838": { + "content": "[FPR:MACCS]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "839": { + "content": "[FPR:Toplogical]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "840": { + "content": "[FPR:ECFP]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "841": { + "content": "[FPR:FCFP]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "842": { + "content": "[FPR:Avalon]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "843": { + "content": "[SEP]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": true + }, + "844": { + "content": "[SPAN]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "845": { + "content": "[VALUE]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "846": { + "content": "[XYZ]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "847": { + "content": "[BITS]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "848": { + "content": "[CUSPRO]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "849": { + "content": "[SUB]", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": false + }, + "850": { + "content": "[CLS]", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + } + }, + "clean_up_tokenization_spaces": true, + "cls_token": "[CLS]", + "do_lower_case": false, + "mask_token": "[MASK]", + "model_max_length": 1000000000000000019884624838656, + "pad_token": "[PAD]", + "sep_token": "[SEP]", + "strip_accents": null, + "tokenize_chinese_chars": true, + "tokenizer_class": "BertTokenizer", + "unk_token": "[UNK]" +} diff --git a/vocab.txt b/vocab.txt new file mode 100644 index 0000000..8958bd7 --- /dev/null +++ b/vocab.txt @@ -0,0 +1,71 @@ +[PAD] +[SOS] +[EOS] +[UNK] +[MASK] +# +( +) ++ +- +. +/ +0 +1 +2 +3 +4 +5 +6 +7 +8 +9 += +@ +A +B +C +D +E +F +G +H +I +K +L +M +N +O +P +R +S +T +U +V +W +X +Y +Z +[ +\ +] +a +b +c +d +e +f +g +h +i +k +l +m +n +o +p +r +s +t +u +y