molSimplify 1.7.4__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- docs/source/conf.py +224 -0
- molSimplify/Classes/__init__.py +6 -0
- molSimplify/Classes/atom3D.py +235 -0
- molSimplify/Classes/dft_obs.py +130 -0
- molSimplify/Classes/globalvars.py +827 -0
- molSimplify/Classes/helpers.py +161 -0
- molSimplify/Classes/ligand.py +2330 -0
- molSimplify/Classes/mGUI.py +2493 -0
- molSimplify/Classes/mWidgets.py +438 -0
- molSimplify/Classes/miniGUI.py +41 -0
- molSimplify/Classes/mol2D.py +260 -0
- molSimplify/Classes/mol3D.py +5846 -0
- molSimplify/Classes/monomer3D.py +253 -0
- molSimplify/Classes/partialcharges.py +226 -0
- molSimplify/Classes/protein3D.py +1178 -0
- molSimplify/Classes/rundiag.py +151 -0
- molSimplify/Data/ML.dat +212 -0
- molSimplify/Data/MLS_FSR_for_inter.dat +23 -0
- molSimplify/Data/MLS_FSR_for_inter2.dat +23 -0
- molSimplify/Data/MLS_angle_for_click.dat +8 -0
- molSimplify/Data/MLS_angle_for_inter.dat +23 -0
- molSimplify/Data/MLS_angle_for_inter2.dat +48 -0
- molSimplify/Data/MLS_angle_for_intra.dat +10 -0
- molSimplify/Data/MLS_angle_for_intra2.dat +6 -0
- molSimplify/Data/MLS_angle_for_oa.dat +18 -0
- molSimplify/Data/ML_FSR_for_inter.dat +112 -0
- molSimplify/Data/ML_FSR_for_inter2.dat +110 -0
- molSimplify/Data/ML_bond_for_cat.dat +8 -0
- molSimplify/Data/ML_bond_for_click.dat +8 -0
- molSimplify/Data/ML_bond_for_inter.dat +48 -0
- molSimplify/Data/ML_bond_for_inter2.dat +48 -0
- molSimplify/Data/ML_bond_for_intra.dat +10 -0
- molSimplify/Data/ML_bond_for_intra2.dat +6 -0
- molSimplify/Data/ML_bond_for_oa.dat +18 -0
- molSimplify/Data/bp1.dat +21 -0
- molSimplify/Data/li.dat +3 -0
- molSimplify/Data/no.dat +2 -0
- molSimplify/Data/oct.dat +7 -0
- molSimplify/Data/pbp.dat +8 -0
- molSimplify/Data/spy.dat +6 -0
- molSimplify/Data/sqap.dat +9 -0
- molSimplify/Data/sqp.dat +5 -0
- molSimplify/Data/tbp.dat +6 -0
- molSimplify/Data/tdhd.dat +9 -0
- molSimplify/Data/thd.dat +5 -0
- molSimplify/Data/tpl.dat +4 -0
- molSimplify/Data/tpr.dat +7 -0
- molSimplify/Informatics/HFXsensitivity/__init__.py +0 -0
- molSimplify/Informatics/HFXsensitivity/measure_HFX_sensitivity_oxo_hat_reb_rel.py +443 -0
- molSimplify/Informatics/HFXsensitivity/measure_HFX_stable.py +346 -0
- molSimplify/Informatics/MOF/Linker_rotation.py +179 -0
- molSimplify/Informatics/MOF/MOF_descriptors.py +1299 -0
- molSimplify/Informatics/MOF/MOF_descriptors_alternate_functional.py +589 -0
- molSimplify/Informatics/MOF/MOF_functionalizer.py +1648 -0
- molSimplify/Informatics/MOF/PBC_functions.py +1347 -0
- molSimplify/Informatics/MOF/__init__.py +0 -0
- molSimplify/Informatics/MOF/atomic.py +267 -0
- molSimplify/Informatics/MOF/cluster_extraction.py +388 -0
- molSimplify/Informatics/MOF/fragment_MOFs_for_pormake.py +895 -0
- molSimplify/Informatics/MOF/monofunctionalized_BDC/index_information.py +10 -0
- molSimplify/Informatics/Mol2Parser.py +46 -0
- molSimplify/Informatics/RACassemble.py +408 -0
- molSimplify/Informatics/__init__.py +0 -0
- molSimplify/Informatics/active_learning/__init__.py +0 -0
- molSimplify/Informatics/active_learning/expected_improvement.py +269 -0
- molSimplify/Informatics/autocorrelation.py +1930 -0
- molSimplify/Informatics/clean_autocorrelation.py +778 -0
- molSimplify/Informatics/coulomb_analyze.py +67 -0
- molSimplify/Informatics/decoration_manager.py +193 -0
- molSimplify/Informatics/geo_analyze.py +88 -0
- molSimplify/Informatics/geometrics.py +56 -0
- molSimplify/Informatics/graph_analyze.py +163 -0
- molSimplify/Informatics/graph_racs.py +288 -0
- molSimplify/Informatics/jupyter_vis.py +172 -0
- molSimplify/Informatics/lacRACAssemble.py +2192 -0
- molSimplify/Informatics/lacRACAssemble_bisdithiolenes.py +236 -0
- molSimplify/Informatics/misc_descriptors.py +198 -0
- molSimplify/Informatics/organic_fingerprints.py +61 -0
- molSimplify/Informatics/partialcharges.py +345 -0
- molSimplify/Informatics/protein/activesite.py +53 -0
- molSimplify/Informatics/protein/pymol_add_hs.py +33 -0
- molSimplify/Informatics/rac155_geo.py +48 -0
- molSimplify/Ligands/(1_methylbenzimidazol_2_yl)pyridine.xyz +45 -0
- molSimplify/Ligands/1-4-dimethyl-1-2-3-triazole.xyz +15 -0
- molSimplify/Ligands/12crown4.mol +62 -0
- molSimplify/Ligands/Antipyrine.mol +58 -0
- molSimplify/Ligands/BPAbipy.mol +106 -0
- molSimplify/Ligands/Hpyrrole.mol +26 -0
- molSimplify/Ligands/N-quinolinylbutyramidate.xyz +31 -0
- molSimplify/Ligands/N-quinolinylmethylmethinylacetamidate.xyz +30 -0
- molSimplify/Ligands/NMe2_-1.xyz +11 -0
- molSimplify/Ligands/PCy3.mol +111 -0
- molSimplify/Ligands/PMe3.xyz +15 -0
- molSimplify/Ligands/PPh3.mol +76 -0
- molSimplify/Ligands/Propyphenazone.mol +77 -0
- molSimplify/Ligands/acac.mol +33 -0
- molSimplify/Ligands/acacen.mol +76 -0
- molSimplify/Ligands/acetate.smi +1 -0
- molSimplify/Ligands/acetate.xyz +9 -0
- molSimplify/Ligands/aceticacidbipyridine.mol +70 -0
- molSimplify/Ligands/acetonitrile.mol +17 -0
- molSimplify/Ligands/alanine.mol +30 -0
- molSimplify/Ligands/alphabetizer.py +21 -0
- molSimplify/Ligands/amine.mol +11 -0
- molSimplify/Ligands/ammonia.mol +12 -0
- molSimplify/Ligands/arginine.mol +58 -0
- molSimplify/Ligands/asparagine.mol +38 -0
- molSimplify/Ligands/aspartic_acid.mol +35 -0
- molSimplify/Ligands/azide.mol +11 -0
- molSimplify/Ligands/benzene.mol +28 -0
- molSimplify/Ligands/benzene_pi.mol +30 -0
- molSimplify/Ligands/benzenedithiol.mol +30 -0
- molSimplify/Ligands/benzenethiol.mol +30 -0
- molSimplify/Ligands/benzylisocy.mol +38 -0
- molSimplify/Ligands/bidiazine.mol +42 -0
- molSimplify/Ligands/bidiazole.mol +38 -0
- molSimplify/Ligands/bifuran.mol +38 -0
- molSimplify/Ligands/bihydrodiazine.mol +58 -0
- molSimplify/Ligands/bihydrodiazole.mol +46 -0
- molSimplify/Ligands/bihydrooxazine.mol +54 -0
- molSimplify/Ligands/bihydrooxazole.mol +42 -0
- molSimplify/Ligands/bihydrothiazine.mol +54 -0
- molSimplify/Ligands/bihydrothiazole.mol +42 -0
- molSimplify/Ligands/biimidazole.mol +38 -0
- molSimplify/Ligands/bioxazole.mol +34 -0
- molSimplify/Ligands/bipy.mol +46 -0
- molSimplify/Ligands/bipyrazine.xyz +20 -0
- molSimplify/Ligands/bipyrimidine.mol +42 -0
- molSimplify/Ligands/bipyrrole.mol +42 -0
- molSimplify/Ligands/bisnapthyridylpyridine.mol +111 -0
- molSimplify/Ligands/bithiazole.mol +34 -0
- molSimplify/Ligands/bromide.mol +7 -0
- molSimplify/Ligands/bromide.smi +1 -0
- molSimplify/Ligands/c2.mol +9 -0
- molSimplify/Ligands/caprolactone.mol +41 -0
- molSimplify/Ligands/carbonyl.mol +8 -0
- molSimplify/Ligands/carboxyl.mol +13 -0
- molSimplify/Ligands/cat.mol +30 -0
- molSimplify/Ligands/chloride.mol +7 -0
- molSimplify/Ligands/chloride.smi +1 -0
- molSimplify/Ligands/chloropyridine.mol +27 -0
- molSimplify/Ligands/co2.mol +10 -0
- molSimplify/Ligands/corrolazine.mol +72 -0
- molSimplify/Ligands/cs.mol +8 -0
- molSimplify/Ligands/cyanate.xyz +5 -0
- molSimplify/Ligands/cyanide.mol +9 -0
- molSimplify/Ligands/cyanoaceticporphyrin.mol +114 -0
- molSimplify/Ligands/cyanopyridine.mol +29 -0
- molSimplify/Ligands/cyclam.mol +81 -0
- molSimplify/Ligands/cyclen.mol +69 -0
- molSimplify/Ligands/cyclopentadienyl.mol +26 -0
- molSimplify/Ligands/cysteine.mol +32 -0
- molSimplify/Ligands/diaminomethyl.mol +19 -0
- molSimplify/Ligands/diazine.mol +25 -0
- molSimplify/Ligands/diazole.mol +23 -0
- molSimplify/Ligands/dicyanamide.mol +15 -0
- molSimplify/Ligands/dihydrofuran.mol +27 -0
- molSimplify/Ligands/dmap.xyz +35 -0
- molSimplify/Ligands/dmf.mol +28 -0
- molSimplify/Ligands/dmi.mol +41 -0
- molSimplify/Ligands/dmpe.mol +52 -0
- molSimplify/Ligands/dpmu.mol +47 -0
- molSimplify/Ligands/dppe.mol +112 -0
- molSimplify/Ligands/edta.mol +69 -0
- molSimplify/Ligands/en.mol +28 -0
- molSimplify/Ligands/ethanethiol.mol +21 -0
- molSimplify/Ligands/ethanolamine.mol +26 -0
- molSimplify/Ligands/ethbipy.mol +70 -0
- molSimplify/Ligands/ethyl.mol +19 -0
- molSimplify/Ligands/ethylamine.mol +24 -0
- molSimplify/Ligands/ethylene.mol +16 -0
- molSimplify/Ligands/ethylesteracac.mol +57 -0
- molSimplify/Ligands/fluoride.mol +7 -0
- molSimplify/Ligands/fluoride.smi +1 -0
- molSimplify/Ligands/formaldehyde.mol +12 -0
- molSimplify/Ligands/formamidate.xyz +8 -0
- molSimplify/Ligands/formate.xyz +6 -0
- molSimplify/Ligands/furan.mol +23 -0
- molSimplify/Ligands/glutamic_acid.mol +42 -0
- molSimplify/Ligands/glutamine.mol +44 -0
- molSimplify/Ligands/glycinate.mol +23 -0
- molSimplify/Ligands/glycine.mol +24 -0
- molSimplify/Ligands/h2s.mol +10 -0
- molSimplify/Ligands/helium.mol +6 -0
- molSimplify/Ligands/histidine.mol +45 -0
- molSimplify/Ligands/hmpa.mol +62 -0
- molSimplify/Ligands/hs-.mol +9 -0
- molSimplify/Ligands/hydride.mol +7 -0
- molSimplify/Ligands/hydrocarboxyacetylide.xyz +8 -0
- molSimplify/Ligands/hydrocyanide.mol +10 -0
- molSimplify/Ligands/hydrodiazine.mol +33 -0
- molSimplify/Ligands/hydrodiazole.mol +27 -0
- molSimplify/Ligands/hydrogensulfide.mol +10 -0
- molSimplify/Ligands/hydroisocyanide.mol +11 -0
- molSimplify/Ligands/hydrooxazine.mol +31 -0
- molSimplify/Ligands/hydrooxazole.mol +25 -0
- molSimplify/Ligands/hydrothiazine.mol +31 -0
- molSimplify/Ligands/hydrothiazole.mol +25 -0
- molSimplify/Ligands/hydroxyl.mol +9 -0
- molSimplify/Ligands/imidazole.mol +23 -0
- molSimplify/Ligands/imidazolidinone.mol +29 -0
- molSimplify/Ligands/imine.mol +13 -0
- molSimplify/Ligands/iminodiacetic.mol +33 -0
- molSimplify/Ligands/iodide.mol +7 -0
- molSimplify/Ligands/iodobenzene.xyz +14 -0
- molSimplify/Ligands/isoleucine.mol +48 -0
- molSimplify/Ligands/isothiocyanate.mol +11 -0
- molSimplify/Ligands/leucine.mol +48 -0
- molSimplify/Ligands/ligands.dict +257 -0
- molSimplify/Ligands/lysine.mol +54 -0
- molSimplify/Ligands/mebenzenedithiol.mol +36 -0
- molSimplify/Ligands/mebim_py.xyz +29 -0
- molSimplify/Ligands/mebim_pz.xyz +28 -0
- molSimplify/Ligands/mebipy.mol +58 -0
- molSimplify/Ligands/mecat.mol +36 -0
- molSimplify/Ligands/methanal.mol +11 -0
- molSimplify/Ligands/methanethiol.mol +15 -0
- molSimplify/Ligands/methanol.mol +16 -0
- molSimplify/Ligands/methionine.mol +44 -0
- molSimplify/Ligands/methyl.mol +13 -0
- molSimplify/Ligands/methylacetylide.xyz +8 -0
- molSimplify/Ligands/methylamine.mol +19 -0
- molSimplify/Ligands/methylazide.xyz +9 -0
- molSimplify/Ligands/methylisocy.mol +17 -0
- molSimplify/Ligands/methylpyridine.mol +33 -0
- molSimplify/Ligands/n2.mol +8 -0
- molSimplify/Ligands/n4py.xyz +51 -0
- molSimplify/Ligands/nch.mol +10 -0
- molSimplify/Ligands/nco-.mol +11 -0
- molSimplify/Ligands/nethanolamine.mol +26 -0
- molSimplify/Ligands/nitrate.mol +14 -0
- molSimplify/Ligands/nitrite.mol +11 -0
- molSimplify/Ligands/nitro.mol +11 -0
- molSimplify/Ligands/nitrobipy.mol +54 -0
- molSimplify/Ligands/nitroso.mol +8 -0
- molSimplify/Ligands/nme3.mol +30 -0
- molSimplify/Ligands/no-.mol +10 -0
- molSimplify/Ligands/no2-.mol +11 -0
- molSimplify/Ligands/noxygen.mol +8 -0
- molSimplify/Ligands/ns-.mol +10 -0
- molSimplify/Ligands/o-pyridylbenzene.xyz +23 -0
- molSimplify/Ligands/o-pyridylphenylanion.xyz +22 -0
- molSimplify/Ligands/o2-.mol +9 -0
- molSimplify/Ligands/o2.xyz +4 -0
- molSimplify/Ligands/och2.mol +12 -0
- molSimplify/Ligands/oethanolamine.mol +26 -0
- molSimplify/Ligands/ome2.mol +22 -0
- molSimplify/Ligands/ooh.xyz +5 -0
- molSimplify/Ligands/oxalate.mol +17 -0
- molSimplify/Ligands/oxalate.smi +1 -0
- molSimplify/Ligands/oxygen.mol +7 -0
- molSimplify/Ligands/pentacyanocyclopentadienide.mol +36 -0
- molSimplify/Ligands/ph2-.mol +11 -0
- molSimplify/Ligands/ph3.mol +12 -0
- molSimplify/Ligands/phen.mol +51 -0
- molSimplify/Ligands/phenacac.mol +63 -0
- molSimplify/Ligands/phenalalanine.mol +51 -0
- molSimplify/Ligands/phendione.mol +51 -0
- molSimplify/Ligands/phenphen.mol +75 -0
- molSimplify/Ligands/phenylbenzoxazole.mol +54 -0
- molSimplify/Ligands/phenylcyc.mol +99 -0
- molSimplify/Ligands/phenylenediamine.mol +37 -0
- molSimplify/Ligands/phenylisocy.mol +32 -0
- molSimplify/Ligands/phosacidbipy.mol +66 -0
- molSimplify/Ligands/phosphine.mol +13 -0
- molSimplify/Ligands/phosphorine.mol +27 -0
- molSimplify/Ligands/phosphorustrifluoride.mol +12 -0
- molSimplify/Ligands/phthalocyanine.mol +126 -0
- molSimplify/Ligands/pme3o.mol +32 -0
- molSimplify/Ligands/porphyrin.mol +82 -0
- molSimplify/Ligands/pph3o.mol +77 -0
- molSimplify/Ligands/proline.mol +39 -0
- molSimplify/Ligands/propdiol.mol +21 -0
- molSimplify/Ligands/propylene.mol +23 -0
- molSimplify/Ligands/pyridine.mol +27 -0
- molSimplify/Ligands/pyrimidone.mol +27 -0
- molSimplify/Ligands/pyrrole.mol +24 -0
- molSimplify/Ligands/quinoxalinedithiol.mol +39 -0
- molSimplify/Ligands/s2-.mol +9 -0
- molSimplify/Ligands/salen.mol +75 -0
- molSimplify/Ligands/salphen.mol +84 -0
- molSimplify/Ligands/serine.mol +32 -0
- molSimplify/Ligands/simple_ligands.dict +14 -0
- molSimplify/Ligands/sulfacidbipy.mol +63 -0
- molSimplify/Ligands/tbucat.mol +54 -0
- molSimplify/Ligands/tbuphisocy.mol +56 -0
- molSimplify/Ligands/tbutylcyclen.mol +166 -0
- molSimplify/Ligands/tbutylisocy.mol +35 -0
- molSimplify/Ligands/tbutylthiol.mol +33 -0
- molSimplify/Ligands/tcnoet.mol +43 -0
- molSimplify/Ligands/tcnoetOH.mol +45 -0
- molSimplify/Ligands/terpy.mol +65 -0
- molSimplify/Ligands/tetrahydrofuran.mol +31 -0
- molSimplify/Ligands/thiane.mol +37 -0
- molSimplify/Ligands/thiazole.mol +21 -0
- molSimplify/Ligands/thiocyanate.mol +11 -0
- molSimplify/Ligands/thiol.mol +9 -0
- molSimplify/Ligands/thiophene.mol +23 -0
- molSimplify/Ligands/thiopyridine.mol +29 -0
- molSimplify/Ligands/threonine.mol +38 -0
- molSimplify/Ligands/tpp.mol +165 -0
- molSimplify/Ligands/tricyanomethyl.mol +19 -0
- molSimplify/Ligands/trifluoromethyl.mol +13 -0
- molSimplify/Ligands/tryptophan.mol +60 -0
- molSimplify/Ligands/tyrosine.mol +53 -0
- molSimplify/Ligands/uthiol.mol +11 -0
- molSimplify/Ligands/uthiolme2.mol +23 -0
- molSimplify/Ligands/valine.mol +42 -0
- molSimplify/Ligands/water.mol +10 -0
- molSimplify/Ligands/x.mol +6 -0
- molSimplify/Scripts/__init__.py +0 -0
- molSimplify/Scripts/addtodb.py +308 -0
- molSimplify/Scripts/cellbuilder.py +1592 -0
- molSimplify/Scripts/cellbuilder_tools.py +701 -0
- molSimplify/Scripts/chains.py +342 -0
- molSimplify/Scripts/convert_2to3.py +23 -0
- molSimplify/Scripts/dbinteract.py +631 -0
- molSimplify/Scripts/distgeom.py +617 -0
- molSimplify/Scripts/findcorrelations.py +287 -0
- molSimplify/Scripts/generator.py +267 -0
- molSimplify/Scripts/geometry.py +1224 -0
- molSimplify/Scripts/grabguivars.py +845 -0
- molSimplify/Scripts/in_b3lyp_usetc.py +141 -0
- molSimplify/Scripts/inparse.py +1673 -0
- molSimplify/Scripts/io.py +1149 -0
- molSimplify/Scripts/isomers.py +415 -0
- molSimplify/Scripts/jobgen.py +247 -0
- molSimplify/Scripts/krr_prep.py +1262 -0
- molSimplify/Scripts/molSimplify_io.py +18 -0
- molSimplify/Scripts/molden2psi4wfn.py +166 -0
- molSimplify/Scripts/namegen.py +32 -0
- molSimplify/Scripts/nn_prep.py +561 -0
- molSimplify/Scripts/oct_check_mols.py +782 -0
- molSimplify/Scripts/periodic_QE.py +97 -0
- molSimplify/Scripts/postmold.py +304 -0
- molSimplify/Scripts/postmwfn.py +709 -0
- molSimplify/Scripts/postparse.py +488 -0
- molSimplify/Scripts/postproc.py +139 -0
- molSimplify/Scripts/qcgen.py +1450 -0
- molSimplify/Scripts/rmsd.py +489 -0
- molSimplify/Scripts/rungen.py +670 -0
- molSimplify/Scripts/structgen.py +3040 -0
- molSimplify/Scripts/tf_nn_prep.py +894 -0
- molSimplify/Scripts/tsgen.py +295 -0
- molSimplify/Scripts/uq_calibration.py +69 -0
- molSimplify/__init__.py +0 -0
- molSimplify/__main__.py +197 -0
- molSimplify/icons/chemdb.png +0 -0
- molSimplify/icons/hjklogo.png +0 -0
- molSimplify/icons/icon.png +0 -0
- molSimplify/icons/logo.png +0 -0
- molSimplify/icons/logo_old.png +0 -0
- molSimplify/icons/petachem.png +0 -0
- molSimplify/icons/petachem2.png +0 -0
- molSimplify/icons/petachem_full.png +0 -0
- molSimplify/icons/pythonlogo.png +0 -0
- molSimplify/icons/sge copy.png +0 -0
- molSimplify/icons/sge.png +0 -0
- molSimplify/icons/slurm.png +0 -0
- molSimplify/icons/wft1.png +0 -0
- molSimplify/icons/wft2.png +0 -0
- molSimplify/icons/wft3.png +0 -0
- molSimplify/ml/__init__.py +0 -0
- molSimplify/ml/kernels.py +36 -0
- molSimplify/ml/layers.py +29 -0
- molSimplify/molscontrol/__init__.py +14 -0
- molSimplify/molscontrol/_version.py +521 -0
- molSimplify/molscontrol/clf_tools.py +144 -0
- molSimplify/molscontrol/data/README.md +21 -0
- molSimplify/molscontrol/data/look_and_say.dat +15 -0
- molSimplify/molscontrol/dynamic_classifier.py +514 -0
- molSimplify/molscontrol/io_tools.py +363 -0
- molSimplify/molscontrol/molscontrol.py +49 -0
- molSimplify/molscontrol/terachem/jobscript_control.sh +31 -0
- molSimplify/molscontrol/terachem/terachem_input +22 -0
- molSimplify/python_krr/X_train_TS.csv +535 -0
- molSimplify/python_krr/__init__.py +0 -0
- molSimplify/python_krr/hat2_X_mean_std.csv +3 -0
- molSimplify/python_krr/hat2_feature_names.csv +1 -0
- molSimplify/python_krr/hat2_y_mean_std.csv +2 -0
- molSimplify/python_krr/hat_X_mean_std.csv +6 -0
- molSimplify/python_krr/hat_feature_names.csv +1 -0
- molSimplify/python_krr/hat_krr_X_train.csv +5205 -0
- molSimplify/python_krr/hat_krr_dual_coef.csv +1 -0
- molSimplify/python_krr/hat_y_mean_std.csv +2 -0
- molSimplify/python_krr/sklearn_models.py +34 -0
- molSimplify/python_krr/y_train_TS.csv +535 -0
- molSimplify/python_nn/ANN.py +198 -0
- molSimplify/python_nn/__init__.py +0 -0
- molSimplify/python_nn/clf_analysis_tool.py +125 -0
- molSimplify/python_nn/dictionary_toolbox.py +49 -0
- molSimplify/python_nn/ensemble_test.py +309 -0
- molSimplify/python_nn/hs_center.csv +26 -0
- molSimplify/python_nn/hs_scale.csv +26 -0
- molSimplify/python_nn/ls_center.csv +26 -0
- molSimplify/python_nn/ls_scale.csv +26 -0
- molSimplify/python_nn/ms_hs_b1.csv +50 -0
- molSimplify/python_nn/ms_hs_b2.csv +50 -0
- molSimplify/python_nn/ms_hs_b3.csv +1 -0
- molSimplify/python_nn/ms_hs_w1.csv +50 -0
- molSimplify/python_nn/ms_hs_w2.csv +50 -0
- molSimplify/python_nn/ms_hs_w3.csv +1 -0
- molSimplify/python_nn/ms_ls_b1.csv +50 -0
- molSimplify/python_nn/ms_ls_b2.csv +50 -0
- molSimplify/python_nn/ms_ls_b3.csv +1 -0
- molSimplify/python_nn/ms_ls_w1.csv +50 -0
- molSimplify/python_nn/ms_ls_w2.csv +50 -0
- molSimplify/python_nn/ms_ls_w3.csv +1 -0
- molSimplify/python_nn/ms_slope_b1.csv +50 -0
- molSimplify/python_nn/ms_slope_b2.csv +50 -0
- molSimplify/python_nn/ms_slope_b3.csv +1 -0
- molSimplify/python_nn/ms_slope_w1.csv +50 -0
- molSimplify/python_nn/ms_slope_w2.csv +50 -0
- molSimplify/python_nn/ms_slope_w3.csv +1 -0
- molSimplify/python_nn/ms_split_b1.csv +50 -0
- molSimplify/python_nn/ms_split_b2.csv +50 -0
- molSimplify/python_nn/ms_split_b3.csv +1 -0
- molSimplify/python_nn/ms_split_w1.csv +50 -0
- molSimplify/python_nn/ms_split_w2.csv +50 -0
- molSimplify/python_nn/ms_split_w3.csv +1 -0
- molSimplify/python_nn/slope_center.csv +25 -0
- molSimplify/python_nn/slope_scale.csv +25 -0
- molSimplify/python_nn/split_center.csv +26 -0
- molSimplify/python_nn/split_scale.csv +26 -0
- molSimplify/python_nn/tf_ANN.py +762 -0
- molSimplify/python_nn/train_data.csv +1211 -0
- molSimplify/tf_nn/__init__.py +0 -0
- molSimplify/tf_nn/geo_static_clf/geo_static_clf_model.h5 +0 -0
- molSimplify/tf_nn/geo_static_clf/geo_static_clf_train_name.csv +1591 -0
- molSimplify/tf_nn/geo_static_clf/geo_static_clf_train_x.csv +2790 -0
- molSimplify/tf_nn/geo_static_clf/geo_static_clf_train_y.csv +2790 -0
- molSimplify/tf_nn/geo_static_clf/geo_static_clf_vars.csv +154 -0
- molSimplify/tf_nn/geos/hs_ii_bl_x.csv +1577 -0
- molSimplify/tf_nn/geos/hs_ii_bl_y.csv +1577 -0
- molSimplify/tf_nn/geos/hs_ii_model.h5 +0 -0
- molSimplify/tf_nn/geos/hs_ii_model.json +1 -0
- molSimplify/tf_nn/geos/hs_ii_vars.csv +154 -0
- molSimplify/tf_nn/geos/hs_iii_bl_x.csv +1659 -0
- molSimplify/tf_nn/geos/hs_iii_bl_y.csv +1659 -0
- molSimplify/tf_nn/geos/hs_iii_model.h5 +0 -0
- molSimplify/tf_nn/geos/hs_iii_model.json +1 -0
- molSimplify/tf_nn/geos/hs_iii_vars.csv +154 -0
- molSimplify/tf_nn/geos/ls_ii_bl_x.csv +1374 -0
- molSimplify/tf_nn/geos/ls_ii_bl_y.csv +1374 -0
- molSimplify/tf_nn/geos/ls_ii_model.h5 +0 -0
- molSimplify/tf_nn/geos/ls_ii_model.json +1 -0
- molSimplify/tf_nn/geos/ls_ii_vars.csv +154 -0
- molSimplify/tf_nn/geos/ls_iii_bl_x.csv +1364 -0
- molSimplify/tf_nn/geos/ls_iii_bl_y.csv +1364 -0
- molSimplify/tf_nn/geos/ls_iii_model.h5 +0 -0
- molSimplify/tf_nn/geos/ls_iii_model.json +1 -0
- molSimplify/tf_nn/geos/ls_iii_vars.csv +154 -0
- molSimplify/tf_nn/homolumo/gap_model.h5 +0 -0
- molSimplify/tf_nn/homolumo/gap_model.json +1 -0
- molSimplify/tf_nn/homolumo/gap_test_names.csv +175 -0
- molSimplify/tf_nn/homolumo/gap_test_x.csv +176 -0
- molSimplify/tf_nn/homolumo/gap_test_y.csv +176 -0
- molSimplify/tf_nn/homolumo/gap_train_names.csv +699 -0
- molSimplify/tf_nn/homolumo/gap_train_x.csv +700 -0
- molSimplify/tf_nn/homolumo/gap_train_y.csv +700 -0
- molSimplify/tf_nn/homolumo/gap_vars.csv +153 -0
- molSimplify/tf_nn/homolumo/homo_model.h5 +0 -0
- molSimplify/tf_nn/homolumo/homo_model.json +126 -0
- molSimplify/tf_nn/homolumo/homo_test_names.csv +175 -0
- molSimplify/tf_nn/homolumo/homo_test_x.csv +176 -0
- molSimplify/tf_nn/homolumo/homo_test_y.csv +176 -0
- molSimplify/tf_nn/homolumo/homo_train_names.csv +699 -0
- molSimplify/tf_nn/homolumo/homo_train_x.csv +700 -0
- molSimplify/tf_nn/homolumo/homo_train_y.csv +700 -0
- molSimplify/tf_nn/homolumo/homo_vars.csv +153 -0
- molSimplify/tf_nn/oxoandhomo/homo_empty_info.json +7 -0
- molSimplify/tf_nn/oxoandhomo/homo_empty_model.h5 +0 -0
- molSimplify/tf_nn/oxoandhomo/homo_empty_model.json +1 -0
- molSimplify/tf_nn/oxoandhomo/homo_empty_test_names.csv +143 -0
- molSimplify/tf_nn/oxoandhomo/homo_empty_test_x.csv +144 -0
- molSimplify/tf_nn/oxoandhomo/homo_empty_test_y.csv +144 -0
- molSimplify/tf_nn/oxoandhomo/homo_empty_train_names.csv +513 -0
- molSimplify/tf_nn/oxoandhomo/homo_empty_train_x.csv +514 -0
- molSimplify/tf_nn/oxoandhomo/homo_empty_train_y.csv +514 -0
- molSimplify/tf_nn/oxoandhomo/homo_empty_val_names.csv +143 -0
- molSimplify/tf_nn/oxoandhomo/homo_empty_val_x.csv +58 -0
- molSimplify/tf_nn/oxoandhomo/homo_empty_val_y.csv +58 -0
- molSimplify/tf_nn/oxoandhomo/homo_empty_vars.csv +155 -0
- molSimplify/tf_nn/oxoandhomo/oxo20_info.json +7 -0
- molSimplify/tf_nn/oxoandhomo/oxo20_model.h5 +0 -0
- molSimplify/tf_nn/oxoandhomo/oxo20_model.json +1 -0
- molSimplify/tf_nn/oxoandhomo/oxo20_test_names.csv +143 -0
- molSimplify/tf_nn/oxoandhomo/oxo20_test_x.csv +144 -0
- molSimplify/tf_nn/oxoandhomo/oxo20_test_y.csv +144 -0
- molSimplify/tf_nn/oxoandhomo/oxo20_train_names.csv +513 -0
- molSimplify/tf_nn/oxoandhomo/oxo20_train_x.csv +514 -0
- molSimplify/tf_nn/oxoandhomo/oxo20_train_y.csv +514 -0
- molSimplify/tf_nn/oxoandhomo/oxo20_val_names.csv +143 -0
- molSimplify/tf_nn/oxoandhomo/oxo20_val_x.csv +58 -0
- molSimplify/tf_nn/oxoandhomo/oxo20_val_y.csv +58 -0
- molSimplify/tf_nn/oxoandhomo/oxo20_vars.csv +154 -0
- molSimplify/tf_nn/oxocatalysis/hat_model.h5 +0 -0
- molSimplify/tf_nn/oxocatalysis/hat_model.json +1 -0
- molSimplify/tf_nn/oxocatalysis/hat_test_names.csv +419 -0
- molSimplify/tf_nn/oxocatalysis/hat_test_x.csv +420 -0
- molSimplify/tf_nn/oxocatalysis/hat_test_y.csv +420 -0
- molSimplify/tf_nn/oxocatalysis/hat_train_names.csv +1507 -0
- molSimplify/tf_nn/oxocatalysis/hat_train_x.csv +1508 -0
- molSimplify/tf_nn/oxocatalysis/hat_train_y.csv +1508 -0
- molSimplify/tf_nn/oxocatalysis/hat_val_x.csv +169 -0
- molSimplify/tf_nn/oxocatalysis/hat_val_y.csv +169 -0
- molSimplify/tf_nn/oxocatalysis/hat_vars.csv +162 -0
- molSimplify/tf_nn/oxocatalysis/oxo_model.h5 +0 -0
- molSimplify/tf_nn/oxocatalysis/oxo_model.json +1 -0
- molSimplify/tf_nn/oxocatalysis/oxo_test_names.csv +527 -0
- molSimplify/tf_nn/oxocatalysis/oxo_test_x.csv +528 -0
- molSimplify/tf_nn/oxocatalysis/oxo_test_y.csv +528 -0
- molSimplify/tf_nn/oxocatalysis/oxo_train_names.csv +1897 -0
- molSimplify/tf_nn/oxocatalysis/oxo_train_x.csv +1898 -0
- molSimplify/tf_nn/oxocatalysis/oxo_train_y.csv +1898 -0
- molSimplify/tf_nn/oxocatalysis/oxo_val_x.csv +212 -0
- molSimplify/tf_nn/oxocatalysis/oxo_val_y.csv +212 -0
- molSimplify/tf_nn/oxocatalysis/oxo_vars.csv +162 -0
- molSimplify/tf_nn/rescaling_data/gap_mean_x.csv +153 -0
- molSimplify/tf_nn/rescaling_data/gap_mean_y.csv +1 -0
- molSimplify/tf_nn/rescaling_data/gap_var_x.csv +153 -0
- molSimplify/tf_nn/rescaling_data/gap_var_y.csv +1 -0
- molSimplify/tf_nn/rescaling_data/geo_static_clf_mean_x.csv +154 -0
- molSimplify/tf_nn/rescaling_data/geo_static_clf_mean_y.csv +1 -0
- molSimplify/tf_nn/rescaling_data/geo_static_clf_var_x.csv +154 -0
- molSimplify/tf_nn/rescaling_data/geo_static_clf_var_y.csv +1 -0
- molSimplify/tf_nn/rescaling_data/hat_mean_x.csv +162 -0
- molSimplify/tf_nn/rescaling_data/hat_mean_y.csv +1 -0
- molSimplify/tf_nn/rescaling_data/hat_var_x.csv +162 -0
- molSimplify/tf_nn/rescaling_data/hat_var_y.csv +1 -0
- molSimplify/tf_nn/rescaling_data/homo_empty_mean_x.csv +155 -0
- molSimplify/tf_nn/rescaling_data/homo_empty_mean_y.csv +1 -0
- molSimplify/tf_nn/rescaling_data/homo_empty_var_x.csv +155 -0
- molSimplify/tf_nn/rescaling_data/homo_empty_var_y.csv +1 -0
- molSimplify/tf_nn/rescaling_data/homo_mean_x.csv +153 -0
- molSimplify/tf_nn/rescaling_data/homo_mean_y.csv +1 -0
- molSimplify/tf_nn/rescaling_data/homo_var_x.csv +153 -0
- molSimplify/tf_nn/rescaling_data/homo_var_y.csv +1 -0
- molSimplify/tf_nn/rescaling_data/hs_ii_mean_x.csv +154 -0
- molSimplify/tf_nn/rescaling_data/hs_ii_mean_y.csv +3 -0
- molSimplify/tf_nn/rescaling_data/hs_ii_var_x.csv +154 -0
- molSimplify/tf_nn/rescaling_data/hs_ii_var_y.csv +3 -0
- molSimplify/tf_nn/rescaling_data/hs_iii_mean_x.csv +154 -0
- molSimplify/tf_nn/rescaling_data/hs_iii_mean_y.csv +3 -0
- molSimplify/tf_nn/rescaling_data/hs_iii_var_x.csv +154 -0
- molSimplify/tf_nn/rescaling_data/hs_iii_var_y.csv +3 -0
- molSimplify/tf_nn/rescaling_data/ls_ii_mean_x.csv +154 -0
- molSimplify/tf_nn/rescaling_data/ls_ii_mean_y.csv +3 -0
- molSimplify/tf_nn/rescaling_data/ls_ii_var_x.csv +154 -0
- molSimplify/tf_nn/rescaling_data/ls_ii_var_y.csv +3 -0
- molSimplify/tf_nn/rescaling_data/ls_iii_mean_x.csv +154 -0
- molSimplify/tf_nn/rescaling_data/ls_iii_mean_y.csv +3 -0
- molSimplify/tf_nn/rescaling_data/ls_iii_var_x.csv +154 -0
- molSimplify/tf_nn/rescaling_data/ls_iii_var_y.csv +3 -0
- molSimplify/tf_nn/rescaling_data/oxo20_mean_x.csv +154 -0
- molSimplify/tf_nn/rescaling_data/oxo20_mean_y.csv +1 -0
- molSimplify/tf_nn/rescaling_data/oxo20_var_x.csv +154 -0
- molSimplify/tf_nn/rescaling_data/oxo20_var_y.csv +1 -0
- molSimplify/tf_nn/rescaling_data/oxo_mean_x.csv +162 -0
- molSimplify/tf_nn/rescaling_data/oxo_mean_y.csv +1 -0
- molSimplify/tf_nn/rescaling_data/oxo_var_x.csv +162 -0
- molSimplify/tf_nn/rescaling_data/oxo_var_y.csv +1 -0
- molSimplify/tf_nn/rescaling_data/sc_static_clf_mean_x.csv +154 -0
- molSimplify/tf_nn/rescaling_data/sc_static_clf_mean_y.csv +1 -0
- molSimplify/tf_nn/rescaling_data/sc_static_clf_var_x.csv +154 -0
- molSimplify/tf_nn/rescaling_data/sc_static_clf_var_y.csv +1 -0
- molSimplify/tf_nn/rescaling_data/split_mean_x.csv +155 -0
- molSimplify/tf_nn/rescaling_data/split_mean_y.csv +1 -0
- molSimplify/tf_nn/rescaling_data/split_var_x.csv +155 -0
- molSimplify/tf_nn/rescaling_data/split_var_y.csv +1 -0
- molSimplify/tf_nn/sc_static_clf/sc_static_clf_model.h5 +0 -0
- molSimplify/tf_nn/sc_static_clf/sc_static_clf_train_name.csv +1591 -0
- molSimplify/tf_nn/sc_static_clf/sc_static_clf_train_x.csv +1592 -0
- molSimplify/tf_nn/sc_static_clf/sc_static_clf_train_y.csv +1592 -0
- molSimplify/tf_nn/sc_static_clf/sc_static_clf_vars.csv +154 -0
- molSimplify/tf_nn/split/split_model.h5 +0 -0
- molSimplify/tf_nn/split/split_model.json +1 -0
- molSimplify/tf_nn/split/split_vars.csv +155 -0
- molSimplify/tf_nn/split/split_x.csv +1902 -0
- molSimplify/tf_nn/split/split_y.csv +1902 -0
- molSimplify/tf_nn/split/train_names.csv +1901 -0
- molSimplify/utils/__init__.py +0 -0
- molSimplify/utils/decorators.py +16 -0
- molSimplify/utils/metaclasses.py +12 -0
- molSimplify/utils/tensorflow.py +23 -0
- molSimplify/utils/timer.py +16 -0
- molSimplify-1.7.4.dist-info/LICENSE +674 -0
- molSimplify-1.7.4.dist-info/METADATA +821 -0
- molSimplify-1.7.4.dist-info/RECORD +651 -0
- molSimplify-1.7.4.dist-info/WHEEL +5 -0
- molSimplify-1.7.4.dist-info/entry_points.txt +3 -0
- molSimplify-1.7.4.dist-info/top_level.txt +4 -0
- tests/generateTests.py +122 -0
- tests/helperFuncs.py +658 -0
- tests/informatics/test_MOF_descriptors.py +128 -0
- tests/informatics/test_active_learning.py +113 -0
- tests/informatics/test_coulomb_analyze.py +24 -0
- tests/informatics/test_graph_racs.py +193 -0
- tests/ml/test_kernels.py +20 -0
- tests/ml/test_layers.py +47 -0
- tests/runtest.py +10 -0
- tests/test_Mol2D.py +128 -0
- tests/test_basic_imports.py +62 -0
- tests/test_bidentate.py +25 -0
- tests/test_cli.py +20 -0
- tests/test_distgeom.py +106 -0
- tests/test_example_1.py +29 -0
- tests/test_example_3.py +31 -0
- tests/test_example_5.py +43 -0
- tests/test_example_7.py +28 -0
- tests/test_example_8.py +15 -0
- tests/test_example_tbp.py +15 -0
- tests/test_ff_xtb.py +111 -0
- tests/test_geocheck_oct.py +26 -0
- tests/test_geocheck_one_empty.py +15 -0
- tests/test_geometry.py +44 -0
- tests/test_inparse.py +76 -0
- tests/test_io.py +84 -0
- tests/test_jobgen.py +84 -0
- tests/test_joption_pythonic.py +27 -0
- tests/test_ligand_assign.py +58 -0
- tests/test_ligand_assign_consistent.py +60 -0
- tests/test_ligand_class.py +26 -0
- tests/test_ligand_from_mol_file.py +35 -0
- tests/test_ligands.py +86 -0
- tests/test_mol3D.py +337 -0
- tests/test_molcas_caspt2.py +15 -0
- tests/test_molcas_casscf.py +15 -0
- tests/test_old_ANNs.py +68 -0
- tests/test_orca_ccsdt.py +15 -0
- tests/test_orca_dft.py +15 -0
- tests/test_qcgen.py +50 -0
- tests/test_racs.py +124 -0
- tests/test_rmsd.py +68 -0
- tests/test_structgen_functions.py +198 -0
- tests/test_tetrahedral.py +29 -0
- tests/test_tutorial_10_part_one.py +16 -0
- tests/test_tutorial_10_part_two.py +15 -0
- tests/test_tutorial_2.py +11 -0
- tests/test_tutorial_3.py +15 -0
- tests/test_tutorial_4.py +57 -0
- tests/test_tutorial_6.py +10 -0
- tests/test_tutorial_8.py +29 -0
- tests/test_tutorial_9_part_one.py +15 -0
- tests/test_tutorial_9_part_two.py +15 -0
- tests/test_tutorial_qm9_part_one.py +6 -0
- tests/testresources/refs/racs/generate_references.py +85 -0
- workflows/NandyJACSAu2022/bridge_functionalizer.py +253 -0
- workflows/NandyJACSAu2022/frag_functionalizer.py +242 -0
- workflows/NandyJACSAu2022/fragment_classes.py +586 -0
- workflows/NandyJACSAu2022/macrocycle_synthesis.py +179 -0
|
@@ -0,0 +1,236 @@
|
|
|
1
|
+
from molSimplify.Classes.ligand import ligand_breakdown, ligand
|
|
2
|
+
from molSimplify.Classes.globalvars import globalvars
|
|
3
|
+
from molSimplify.Informatics.lacRACAssemble import (generate_all_ligand_autocorrelations,
|
|
4
|
+
generate_all_ligand_misc,
|
|
5
|
+
append_descriptors,
|
|
6
|
+
generate_metal_deltametrics,
|
|
7
|
+
generate_full_complex_autocorrelations,
|
|
8
|
+
generate_metal_autocorrelations,
|
|
9
|
+
generate_metal_ox_autocorrelations,
|
|
10
|
+
generate_metal_ox_deltametrics,
|
|
11
|
+
generate_all_ligand_deltametrics
|
|
12
|
+
)
|
|
13
|
+
|
|
14
|
+
globs = globalvars()
|
|
15
|
+
|
|
16
|
+
|
|
17
|
+
def lig_assign_bisdithiolene(inmol, liglist, ligdents, ligcons):
|
|
18
|
+
"""[summary]
|
|
19
|
+
|
|
20
|
+
Parameters
|
|
21
|
+
----------
|
|
22
|
+
inmol : mol3D object
|
|
23
|
+
5-coordinate mol3D object
|
|
24
|
+
liglist : list
|
|
25
|
+
see ligand class
|
|
26
|
+
ligdents : list
|
|
27
|
+
see ligand class
|
|
28
|
+
ligcons : list
|
|
29
|
+
[see ligand class
|
|
30
|
+
|
|
31
|
+
Returns
|
|
32
|
+
-------
|
|
33
|
+
ax_ligand_list, eq_ligand_list, ax_con_int_list, eq_con_int_list
|
|
34
|
+
see ligands class
|
|
35
|
+
|
|
36
|
+
Raises
|
|
37
|
+
------
|
|
38
|
+
ValueError
|
|
39
|
+
If unrecognized ligdent.
|
|
40
|
+
"""
|
|
41
|
+
ax_ligand_list = list()
|
|
42
|
+
eq_ligand_list = list()
|
|
43
|
+
ax_con_int_list = list()
|
|
44
|
+
eq_con_int_list = list()
|
|
45
|
+
for i, ligand_indices in enumerate(liglist):
|
|
46
|
+
this_ligand = ligand(inmol, ligand_indices, ligdents[i])
|
|
47
|
+
this_ligand.obtain_mol3d()
|
|
48
|
+
if ligdents[i] == 1:
|
|
49
|
+
ax_con = ligcons[i]
|
|
50
|
+
ax_ligand_list.append(this_ligand)
|
|
51
|
+
current_ligand_index_list = this_ligand.index_list
|
|
52
|
+
ax_con_int_list.append([current_ligand_index_list.index(x) for x in ax_con])
|
|
53
|
+
elif ligdents[i] == 2:
|
|
54
|
+
eq_con = ligcons[i]
|
|
55
|
+
eq_ligand_list.append(this_ligand)
|
|
56
|
+
current_ligand_index_list = this_ligand.index_list
|
|
57
|
+
eq_con_int_list.append([current_ligand_index_list.index(x) for x in eq_con])
|
|
58
|
+
else:
|
|
59
|
+
raise ValueError('Ligdent unknown: ' + str(ligdents[i]))
|
|
60
|
+
return ax_ligand_list, eq_ligand_list, ax_con_int_list, eq_con_int_list
|
|
61
|
+
|
|
62
|
+
|
|
63
|
+
def get_descriptor_vector(this_complex, custom_ligand_dict=False,
|
|
64
|
+
ox_modifier=False, NumB=False, Gval=False,
|
|
65
|
+
lacRACs=True, loud=False, metal_ind=None,
|
|
66
|
+
smiles_charge=False, eq_sym=False,
|
|
67
|
+
use_dist=False, size_normalize=False):
|
|
68
|
+
""" Calculate and return all geo-based RACs for a given octahedral complex (featurize).
|
|
69
|
+
|
|
70
|
+
Parameters
|
|
71
|
+
----------
|
|
72
|
+
this_complex : mol3D
|
|
73
|
+
Transition metal complex to be featurized.
|
|
74
|
+
custom_ligand_dict : bool, optional
|
|
75
|
+
Custom ligand dictionary to evaluate for complex if passed, by default False
|
|
76
|
+
Skip the ligand breakdown steps -
|
|
77
|
+
in cases where 3D geo is not correct/formed
|
|
78
|
+
custom_ligand_dict.keys() must be eq_ligands_list, ax_ligand_list
|
|
79
|
+
ax_con_int_list ,eq_con_int_list
|
|
80
|
+
with types: eq/ax_ligand_list list of mol3D
|
|
81
|
+
eq/ax_con_int_list list of list/tuple of int e.g, [[1,2] [1,2]]
|
|
82
|
+
ox_modifier : bool, optional
|
|
83
|
+
dict, used to modify prop vector (e.g. for adding
|
|
84
|
+
ONLY used with ox_nuclear_charge ox or charge)
|
|
85
|
+
{"Fe":2, "Co": 3} etc, by default False
|
|
86
|
+
NumB : bool, optional
|
|
87
|
+
Use Number of Bonds as additional RAC, by default False
|
|
88
|
+
Gval : bool, optional
|
|
89
|
+
Use group number as RAC, by default False
|
|
90
|
+
lacRACs : bool, optional
|
|
91
|
+
Use ligand_assign_consistent (lac) to represent mol3D given
|
|
92
|
+
if False, use ligand_assign (older), default True
|
|
93
|
+
loud : bool, optional
|
|
94
|
+
Print degubbging information, by default False
|
|
95
|
+
metal_ind : bool, optional
|
|
96
|
+
index of the metal atom to generate property, by default False
|
|
97
|
+
smiles_charge : bool, optional
|
|
98
|
+
use obmol conversion through smiles to assign ligand_misc_charges, by default False
|
|
99
|
+
|
|
100
|
+
Returns
|
|
101
|
+
-------
|
|
102
|
+
descriptor_names : list
|
|
103
|
+
Compiled list of descriptor names
|
|
104
|
+
descriptors : list
|
|
105
|
+
Compiled list of descriptor values
|
|
106
|
+
|
|
107
|
+
"""
|
|
108
|
+
# modifier -
|
|
109
|
+
descriptor_names = []
|
|
110
|
+
descriptors = []
|
|
111
|
+
# Generate custom_ligand_dict if one not passed!
|
|
112
|
+
if not custom_ligand_dict:
|
|
113
|
+
if lacRACs:
|
|
114
|
+
from molSimplify.Classes.ligand import ligand_assign_consistent as ligand_assign
|
|
115
|
+
else:
|
|
116
|
+
from molSimplify.Classes.ligand import ligand_assign as ligand_assign
|
|
117
|
+
liglist, ligdents, ligcons = ligand_breakdown(this_complex, BondedOct=True) # Complex is assumed to be octahedral
|
|
118
|
+
if sum(ligdents) == 6:
|
|
119
|
+
(ax_ligand_list, eq_ligand_list, ax_natoms_list, eq_natoms_list,
|
|
120
|
+
ax_con_int_list, eq_con_int_list, ax_con_list, eq_con_list,
|
|
121
|
+
built_ligand_list) = ligand_assign(this_complex, liglist,
|
|
122
|
+
ligdents, ligcons, loud,
|
|
123
|
+
eq_sym_match=eq_sym)
|
|
124
|
+
custom_ligand_dict = {'ax_ligand_list': ax_ligand_list,
|
|
125
|
+
'eq_ligand_list': eq_ligand_list,
|
|
126
|
+
'ax_con_int_list': ax_con_int_list,
|
|
127
|
+
'eq_con_int_list': eq_con_int_list}
|
|
128
|
+
elif sum(ligdents) == 5:
|
|
129
|
+
(ax_ligand_list, eq_ligand_list,
|
|
130
|
+
ax_con_int_list, eq_con_int_list) = lig_assign_bisdithiolene(
|
|
131
|
+
this_complex, liglist, ligdents, ligcons)
|
|
132
|
+
custom_ligand_dict = {'ax_ligand_list': ax_ligand_list,
|
|
133
|
+
'eq_ligand_list': eq_ligand_list,
|
|
134
|
+
'ax_con_int_list': ax_con_int_list,
|
|
135
|
+
'eq_con_int_list': eq_con_int_list}
|
|
136
|
+
|
|
137
|
+
# misc descriptors
|
|
138
|
+
results_dictionary = generate_all_ligand_misc(this_complex, loud=False,
|
|
139
|
+
custom_ligand_dict=custom_ligand_dict,
|
|
140
|
+
smiles_charge=smiles_charge)
|
|
141
|
+
descriptor_names, descriptors = append_descriptors(descriptor_names, descriptors,
|
|
142
|
+
results_dictionary['colnames'],
|
|
143
|
+
results_dictionary['result_ax'],
|
|
144
|
+
'misc', 'ax')
|
|
145
|
+
descriptor_names, descriptors = append_descriptors(descriptor_names, descriptors,
|
|
146
|
+
results_dictionary['colnames'],
|
|
147
|
+
results_dictionary['result_eq'],
|
|
148
|
+
'misc', 'eq')
|
|
149
|
+
|
|
150
|
+
# full ACs
|
|
151
|
+
results_dictionary = generate_full_complex_autocorrelations(this_complex, depth=3, loud=False,
|
|
152
|
+
flag_name=False, modifier=ox_modifier,
|
|
153
|
+
NumB=NumB, Gval=Gval, use_dist=use_dist,
|
|
154
|
+
size_normalize=size_normalize)
|
|
155
|
+
descriptor_names, descriptors = append_descriptors(descriptor_names, descriptors,
|
|
156
|
+
results_dictionary['colnames'],
|
|
157
|
+
results_dictionary['results'],
|
|
158
|
+
'f', 'all')
|
|
159
|
+
|
|
160
|
+
# ligand ACs
|
|
161
|
+
results_dictionary = generate_all_ligand_autocorrelations(this_complex, depth=3, loud=False,
|
|
162
|
+
flag_name=False,
|
|
163
|
+
custom_ligand_dict=custom_ligand_dict,
|
|
164
|
+
NumB=NumB, Gval=Gval, use_dist=use_dist,
|
|
165
|
+
size_normalize=size_normalize)
|
|
166
|
+
descriptor_names, descriptors = append_descriptors(descriptor_names, descriptors,
|
|
167
|
+
results_dictionary['colnames'],
|
|
168
|
+
results_dictionary['result_ax_full'],
|
|
169
|
+
'f', 'ax')
|
|
170
|
+
descriptor_names, descriptors = append_descriptors(descriptor_names, descriptors,
|
|
171
|
+
results_dictionary['colnames'],
|
|
172
|
+
results_dictionary['result_eq_full'],
|
|
173
|
+
'f', 'eq')
|
|
174
|
+
descriptor_names, descriptors = append_descriptors(descriptor_names, descriptors,
|
|
175
|
+
results_dictionary['colnames'],
|
|
176
|
+
results_dictionary['result_ax_con'],
|
|
177
|
+
'lc', 'ax')
|
|
178
|
+
descriptor_names, descriptors = append_descriptors(descriptor_names, descriptors,
|
|
179
|
+
results_dictionary['colnames'],
|
|
180
|
+
results_dictionary['result_eq_con'],
|
|
181
|
+
'lc', 'eq')
|
|
182
|
+
|
|
183
|
+
results_dictionary = generate_all_ligand_deltametrics(this_complex, depth=3, loud=False,
|
|
184
|
+
custom_ligand_dict=custom_ligand_dict,
|
|
185
|
+
NumB=NumB, Gval=Gval,
|
|
186
|
+
use_dist=use_dist,
|
|
187
|
+
size_normalize=size_normalize)
|
|
188
|
+
descriptor_names, descriptors = append_descriptors(descriptor_names, descriptors,
|
|
189
|
+
results_dictionary['colnames'],
|
|
190
|
+
results_dictionary['result_ax_con'],
|
|
191
|
+
'D_lc', 'ax')
|
|
192
|
+
descriptor_names, descriptors = append_descriptors(descriptor_names, descriptors,
|
|
193
|
+
results_dictionary['colnames'],
|
|
194
|
+
results_dictionary['result_eq_con'],
|
|
195
|
+
'D_lc', 'eq')
|
|
196
|
+
|
|
197
|
+
# metal ACs
|
|
198
|
+
results_dictionary = generate_metal_autocorrelations(this_complex, depth=3, loud=False,
|
|
199
|
+
modifier=ox_modifier, NumB=NumB,
|
|
200
|
+
Gval=Gval, metal_ind=metal_ind,
|
|
201
|
+
use_dist=use_dist,
|
|
202
|
+
size_normalize=size_normalize)
|
|
203
|
+
descriptor_names, descriptors = append_descriptors(descriptor_names, descriptors,
|
|
204
|
+
results_dictionary['colnames'],
|
|
205
|
+
results_dictionary['results'],
|
|
206
|
+
'mc', 'all')
|
|
207
|
+
|
|
208
|
+
results_dictionary = generate_metal_deltametrics(this_complex, depth=3, loud=False,
|
|
209
|
+
modifier=ox_modifier, NumB=NumB,
|
|
210
|
+
Gval=Gval, metal_ind=metal_ind,
|
|
211
|
+
use_dist=use_dist,
|
|
212
|
+
size_normalize=size_normalize)
|
|
213
|
+
descriptor_names, descriptors = append_descriptors(descriptor_names, descriptors,
|
|
214
|
+
results_dictionary['colnames'],
|
|
215
|
+
results_dictionary['results'],
|
|
216
|
+
'D_mc', 'all')
|
|
217
|
+
|
|
218
|
+
# ## ox-metal ACs, if ox available
|
|
219
|
+
if ox_modifier:
|
|
220
|
+
results_dictionary = generate_metal_ox_autocorrelations(ox_modifier, this_complex, depth=3,
|
|
221
|
+
loud=False, metal_ind=metal_ind,
|
|
222
|
+
use_dist=use_dist,
|
|
223
|
+
size_normalize=size_normalize)
|
|
224
|
+
descriptor_names, descriptors = append_descriptors(descriptor_names, descriptors,
|
|
225
|
+
results_dictionary['colnames'],
|
|
226
|
+
results_dictionary['results'],
|
|
227
|
+
'mc', 'all')
|
|
228
|
+
results_dictionary = generate_metal_ox_deltametrics(ox_modifier, this_complex, depth=3,
|
|
229
|
+
loud=False, metal_ind=metal_ind,
|
|
230
|
+
use_dist=use_dist,
|
|
231
|
+
size_normalize=size_normalize)
|
|
232
|
+
descriptor_names, descriptors = append_descriptors(descriptor_names, descriptors,
|
|
233
|
+
results_dictionary['colnames'],
|
|
234
|
+
results_dictionary['results'],
|
|
235
|
+
'D_mc', 'all')
|
|
236
|
+
return descriptor_names, descriptors
|
|
@@ -0,0 +1,198 @@
|
|
|
1
|
+
from molSimplify.Classes.ligand import ligand_breakdown, ligand_assign
|
|
2
|
+
from molSimplify.Informatics.graph_analyze import (get_lig_EN,
|
|
3
|
+
get_truncated_kier,
|
|
4
|
+
kier)
|
|
5
|
+
import numpy as np
|
|
6
|
+
|
|
7
|
+
|
|
8
|
+
def generate_all_ligand_misc(mol, loud, custom_ligand_dict=False, force_legacy=False):
|
|
9
|
+
# custom_ligand_dict.keys() must be eq_ligands_list, ax_ligand_list
|
|
10
|
+
## ax_con_int_list ,eq_con_int_list
|
|
11
|
+
# with types: eq/ax_ligand_list list of mol3D
|
|
12
|
+
# eq/ax_con_int_list list of list/tuple of int e.g, [[1,2] [1,2]]
|
|
13
|
+
# use force_legacy to get kier indices/MCDL
|
|
14
|
+
result_ax = list()
|
|
15
|
+
result_eq = list()
|
|
16
|
+
if force_legacy:
|
|
17
|
+
colnames = ['dent', 'maxDEN', 'ki', 'tki', 'charge']
|
|
18
|
+
else:
|
|
19
|
+
colnames = ['dent', 'charge']
|
|
20
|
+
if not custom_ligand_dict:
|
|
21
|
+
liglist, ligdents, ligcons = ligand_breakdown(mol, BondedOct=True) # Complex is assumed to be octahedral
|
|
22
|
+
ax_ligand_list, eq_ligand_list, ax_natoms_list, eq_natoms_list, ax_con_int_list, eq_con_int_list, ax_con_list, eq_con_list, built_ligand_list = ligand_assign(
|
|
23
|
+
mol, liglist, ligdents, ligcons, loud, name=False)
|
|
24
|
+
else:
|
|
25
|
+
ax_ligand_list = custom_ligand_dict["ax_ligand_list"]
|
|
26
|
+
eq_ligand_list = custom_ligand_dict["eq_ligand_list"]
|
|
27
|
+
ax_con_int_list = custom_ligand_dict["ax_con_int_list"]
|
|
28
|
+
eq_con_int_list = custom_ligand_dict["eq_con_int_list"]
|
|
29
|
+
# count ligands
|
|
30
|
+
n_ax = len(ax_ligand_list)
|
|
31
|
+
n_eq = len(eq_ligand_list)
|
|
32
|
+
# allocate
|
|
33
|
+
result_ax_dent = False
|
|
34
|
+
result_eq_dent = False
|
|
35
|
+
result_ax_maxdelen = False
|
|
36
|
+
result_eq_maxdelen = False
|
|
37
|
+
result_ax_ki = False
|
|
38
|
+
result_eq_ki = False
|
|
39
|
+
result_ax_tki = False
|
|
40
|
+
result_eq_tki = False
|
|
41
|
+
result_ax_charge = False
|
|
42
|
+
result_eq_charge = False
|
|
43
|
+
# loop over axial ligands
|
|
44
|
+
if n_ax > 0:
|
|
45
|
+
for i in range(0, n_ax):
|
|
46
|
+
ax_ligand_list[i].mol.convert2OBMol()
|
|
47
|
+
if not (i == 0):
|
|
48
|
+
result_ax_dent += ax_ligand_list[i].dent
|
|
49
|
+
if force_legacy:
|
|
50
|
+
result_ax_maxdelen += get_lig_EN(
|
|
51
|
+
ax_ligand_list[i].mol, ax_con_int_list[i])
|
|
52
|
+
result_ax_ki += kier(ax_ligand_list[i].mol)
|
|
53
|
+
result_ax_tki += get_truncated_kier(
|
|
54
|
+
ax_ligand_list[i].mol, ax_con_int_list[i])
|
|
55
|
+
result_ax_charge += ax_ligand_list[i].mol.OBMol.GetTotalCharge()
|
|
56
|
+
else:
|
|
57
|
+
result_ax_dent = ax_ligand_list[i].dent
|
|
58
|
+
if force_legacy:
|
|
59
|
+
result_ax_maxdelen = get_lig_EN(
|
|
60
|
+
ax_ligand_list[i].mol, ax_con_int_list[i])
|
|
61
|
+
result_ax_ki = kier(ax_ligand_list[i].mol)
|
|
62
|
+
result_ax_tki = get_truncated_kier(
|
|
63
|
+
ax_ligand_list[i].mol, ax_con_int_list[i])
|
|
64
|
+
result_ax_charge = ax_ligand_list[i].mol.OBMol.GetTotalCharge()
|
|
65
|
+
# average axial results
|
|
66
|
+
result_ax_dent = np.divide(result_ax_dent, n_ax)
|
|
67
|
+
if force_legacy:
|
|
68
|
+
result_ax_maxdelen = np.divide(result_ax_maxdelen, n_ax)
|
|
69
|
+
result_ax_ki = np.divide(result_ax_ki, n_ax)
|
|
70
|
+
result_ax_tki = np.divide(result_ax_tki, n_ax)
|
|
71
|
+
result_ax_charge = np.divide(result_ax_charge, n_ax)
|
|
72
|
+
|
|
73
|
+
# loop over eq ligands
|
|
74
|
+
if n_eq > 0:
|
|
75
|
+
for i in range(0, n_eq):
|
|
76
|
+
eq_ligand_list[i].mol.convert2OBMol()
|
|
77
|
+
if not (i == 0):
|
|
78
|
+
result_eq_dent += eq_ligand_list[i].dent
|
|
79
|
+
if force_legacy:
|
|
80
|
+
result_eq_maxdelen += get_lig_EN(
|
|
81
|
+
eq_ligand_list[i].mol, eq_con_int_list[i])
|
|
82
|
+
result_eq_ki += kier(eq_ligand_list[i].mol)
|
|
83
|
+
result_eq_tki += get_truncated_kier(
|
|
84
|
+
eq_ligand_list[i].mol, eq_con_int_list[i])
|
|
85
|
+
result_eq_charge += eq_ligand_list[i].mol.OBMol.GetTotalCharge()
|
|
86
|
+
else:
|
|
87
|
+
result_eq_dent = eq_ligand_list[i].dent
|
|
88
|
+
if force_legacy:
|
|
89
|
+
result_eq_maxdelen = get_lig_EN(
|
|
90
|
+
eq_ligand_list[i].mol, eq_con_int_list[i])
|
|
91
|
+
result_eq_ki = kier(eq_ligand_list[i].mol)
|
|
92
|
+
result_eq_tki = get_truncated_kier(
|
|
93
|
+
eq_ligand_list[i].mol, eq_con_int_list[i])
|
|
94
|
+
result_eq_charge = eq_ligand_list[i].mol.OBMol.GetTotalCharge()
|
|
95
|
+
# average eq results
|
|
96
|
+
result_eq_dent = np.divide(result_eq_dent, n_eq)
|
|
97
|
+
if force_legacy:
|
|
98
|
+
result_eq_maxdelen = np.divide(result_eq_maxdelen, n_eq)
|
|
99
|
+
result_eq_ki = np.divide(result_eq_ki, n_eq)
|
|
100
|
+
result_eq_tki = np.divide(result_eq_tki, n_eq)
|
|
101
|
+
result_eq_charge = np.divide(result_eq_charge, n_eq)
|
|
102
|
+
# save the results
|
|
103
|
+
result_ax.append(result_ax_dent)
|
|
104
|
+
if force_legacy:
|
|
105
|
+
result_ax.append(result_ax_maxdelen)
|
|
106
|
+
result_ax.append(result_ax_ki)
|
|
107
|
+
result_ax.append(result_ax_tki)
|
|
108
|
+
result_ax.append(result_ax_charge)
|
|
109
|
+
|
|
110
|
+
result_eq.append(result_eq_dent)
|
|
111
|
+
if force_legacy:
|
|
112
|
+
result_eq.append(result_eq_maxdelen)
|
|
113
|
+
result_eq.append(result_eq_ki)
|
|
114
|
+
result_eq.append(result_eq_tki)
|
|
115
|
+
result_eq.append(result_eq_charge)
|
|
116
|
+
|
|
117
|
+
results_dictionary = {'colnames': colnames,
|
|
118
|
+
'result_ax': result_ax, 'result_eq': result_eq}
|
|
119
|
+
return results_dictionary
|
|
120
|
+
|
|
121
|
+
|
|
122
|
+
def generate_all_ligand_misc_dimers(mol, loud, custom_ligand_dict=False):
|
|
123
|
+
# custom_ligand_dict.keys() must be ax1_ligands_list, ax2_ligand_list, ax3_ligand_list
|
|
124
|
+
## ax1_con_int_list , ax2_con_int_list, ax3_con_int_list
|
|
125
|
+
# with types: ax_{i}_ligand_list list of mol3D
|
|
126
|
+
# ax_{i}_con_int_list list of list/tuple of int e.g, [[1,2] [1,2]]
|
|
127
|
+
result_ax1 = list()
|
|
128
|
+
result_ax2 = list()
|
|
129
|
+
result_ax3 = list()
|
|
130
|
+
result_axs = [result_ax1, result_ax2, result_ax3]
|
|
131
|
+
colnames = ['dent', 'maxDEN', 'ki', 'tki', 'charge']
|
|
132
|
+
if not custom_ligand_dict:
|
|
133
|
+
raise ValueError('No custom_ligand_dict provided!')
|
|
134
|
+
#liglist, ligdents, ligcons = ligand_breakdown(mol, BondedOct=True)
|
|
135
|
+
# ax_ligand_list, eq_ligand_list, ax_natoms_list, eq_natoms_list, ax_con_int_list, eq_con_int_list, ax_con_list, eq_con_list, built_ligand_list = ligand_assign(
|
|
136
|
+
# mol, liglist, ligdents, ligcons, loud, name=False)
|
|
137
|
+
else:
|
|
138
|
+
ax1_ligand_list = custom_ligand_dict["ax1_ligand_list"]
|
|
139
|
+
ax2_ligand_list = custom_ligand_dict["ax2_ligand_list"]
|
|
140
|
+
ax3_ligand_list = custom_ligand_dict["ax3_ligand_list"]
|
|
141
|
+
ax1_con_int_list = custom_ligand_dict["ax1_con_int_list"]
|
|
142
|
+
ax2_con_int_list = custom_ligand_dict["ax2_con_int_list"]
|
|
143
|
+
ax3_con_int_list = custom_ligand_dict["ax3_con_int_list"]
|
|
144
|
+
axligs = [ax1_ligand_list, ax2_ligand_list, ax3_ligand_list]
|
|
145
|
+
axcons = [ax1_con_int_list, ax2_con_int_list, ax3_con_int_list]
|
|
146
|
+
n_axs = [len(i) for i in axligs]
|
|
147
|
+
# allocate
|
|
148
|
+
'''
|
|
149
|
+
result_ax_dent = False
|
|
150
|
+
result_eq_dent = False
|
|
151
|
+
result_ax_maxdelen = False
|
|
152
|
+
result_eq_maxdelen = False
|
|
153
|
+
result_ax_ki = False
|
|
154
|
+
result_eq_ki = False
|
|
155
|
+
result_ax_tki = False
|
|
156
|
+
result_eq_tki = False
|
|
157
|
+
result_ax_charge = False
|
|
158
|
+
result_eq_charge = False
|
|
159
|
+
'''
|
|
160
|
+
# loop over axial ligands
|
|
161
|
+
assert all([i > 0 for i in n_axs]
|
|
162
|
+
), 'At least one axis has no ligands. # Ligands: %s' % n_axs
|
|
163
|
+
for ax_ligand_list, ax_con_int_list, n_ax, result_ax in zip(axligs, axcons, n_axs, result_axs):
|
|
164
|
+
for i in range(0, n_ax):
|
|
165
|
+
ax_ligand_list[i].mol.convert2OBMol()
|
|
166
|
+
if i == 0:
|
|
167
|
+
result_ax_dent = ax_ligand_list[i].dent
|
|
168
|
+
result_ax_maxdelen = get_lig_EN(
|
|
169
|
+
ax_ligand_list[i].mol, ax_con_int_list[i])
|
|
170
|
+
result_ax_ki = kier(ax_ligand_list[i].mol)
|
|
171
|
+
result_ax_tki = get_truncated_kier(
|
|
172
|
+
ax_ligand_list[i].mol, ax_con_int_list[i])
|
|
173
|
+
result_ax_charge = ax_ligand_list[i].mol.OBMol.GetTotalCharge()
|
|
174
|
+
else:
|
|
175
|
+
result_ax_dent += ax_ligand_list[i].dent
|
|
176
|
+
result_ax_maxdelen += get_lig_EN(
|
|
177
|
+
ax_ligand_list[i].mol, ax_con_int_list[i])
|
|
178
|
+
result_ax_ki += kier(ax_ligand_list[i].mol)
|
|
179
|
+
result_ax_tki += get_truncated_kier(
|
|
180
|
+
ax_ligand_list[i].mol, ax_con_int_list[i])
|
|
181
|
+
result_ax_charge += ax_ligand_list[i].mol.OBMol.GetTotalCharge()
|
|
182
|
+
# average axial results
|
|
183
|
+
result_ax_dent = np.divide(result_ax_dent, n_ax)
|
|
184
|
+
result_ax_maxdelen = np.divide(result_ax_maxdelen, n_ax)
|
|
185
|
+
result_ax_ki = np.divide(result_ax_ki, n_ax)
|
|
186
|
+
result_ax_tki = np.divide(result_ax_tki, n_ax)
|
|
187
|
+
result_ax_charge = np.divide(result_ax_charge, n_ax)
|
|
188
|
+
|
|
189
|
+
result_ax.append(result_ax_dent)
|
|
190
|
+
result_ax.append(result_ax_maxdelen)
|
|
191
|
+
result_ax.append(result_ax_ki)
|
|
192
|
+
result_ax.append(result_ax_tki)
|
|
193
|
+
result_ax.append(result_ax_charge)
|
|
194
|
+
assert all([len(i) > 0 for i in [result_ax1, result_ax2,
|
|
195
|
+
result_ax3]]), 'Some results are empty.'
|
|
196
|
+
results_dictionary = {'colnames': colnames, 'result_ax1': result_ax1,
|
|
197
|
+
'result_ax2': result_ax2, 'result_ax3': result_ax3}
|
|
198
|
+
return results_dictionary
|
|
@@ -0,0 +1,61 @@
|
|
|
1
|
+
from rdkit import Chem
|
|
2
|
+
from rdkit.Chem import AllChem
|
|
3
|
+
from molSimplify.Classes.mol3D import mol3D
|
|
4
|
+
|
|
5
|
+
|
|
6
|
+
# Nice explanation of fingerprints here:
|
|
7
|
+
# https://www.rdkit.org/UGM/2012/Landrum_RDKit_UGM.Fingerprints.Final.pptx.pdf
|
|
8
|
+
# Nice tutorial here:
|
|
9
|
+
# https://www.rdkit.org/docs/GettingStartedInPython.html
|
|
10
|
+
# Morgan paper: JCIM 50:742-54 (2010).
|
|
11
|
+
|
|
12
|
+
# This script takes in a mol3D object and gets an ECFP.
|
|
13
|
+
# This assumes that you can get the smiles from the mol3D,
|
|
14
|
+
# which can be obtained by the bound method "get_smiles"
|
|
15
|
+
# of the mol3D class. RDKit has functionality for
|
|
16
|
+
# drawing the necessary bits --> DrawMorganBit
|
|
17
|
+
# @param --> mol3D class of molecule, returns fingerprint
|
|
18
|
+
def get_morgan(mol, morgan_radius=4):
|
|
19
|
+
if isinstance(mol, mol3D):
|
|
20
|
+
smiles = mol.get_smiles(use_mol2=True)
|
|
21
|
+
elif isinstance(mol, str):
|
|
22
|
+
smiles = mol
|
|
23
|
+
else:
|
|
24
|
+
raise ValueError("First argument not a smiles string or mol3D")
|
|
25
|
+
m = Chem.MolFromSmiles(smiles)
|
|
26
|
+
# empty bit dictionary that gets populated
|
|
27
|
+
# Morgan FPs should be compared with tanimoto similarity
|
|
28
|
+
# By default, Morgan FPs have 2048 bits.
|
|
29
|
+
bit_vector = {}
|
|
30
|
+
morgan_fingerprint_vector = AllChem.GetMorganFingerprintAsBitVect(m, radius=morgan_radius, bitInfo=bit_vector)
|
|
31
|
+
return bit_vector
|
|
32
|
+
|
|
33
|
+
|
|
34
|
+
def get_substructure_smiles(mol, atomID, radius):
|
|
35
|
+
if isinstance(mol, mol3D):
|
|
36
|
+
smiles = mol.get_smiles(use_mol2=True)
|
|
37
|
+
elif isinstance(mol, str):
|
|
38
|
+
smiles = mol
|
|
39
|
+
else:
|
|
40
|
+
raise ValueError("First argument not a smiles string or mol3D")
|
|
41
|
+
m = Chem.MolFromSmiles(smiles)
|
|
42
|
+
if radius > 0:
|
|
43
|
+
environment_morgan = Chem.FindAtomEnvironmentOfRadiusN(m, radius, atomID)
|
|
44
|
+
atoms_to_use = []
|
|
45
|
+
for b in environment_morgan:
|
|
46
|
+
atoms_to_use.append(m.GetBondWithIdx(b).GetBeginAtomIdx())
|
|
47
|
+
atoms_to_use.append(m.GetBondWithIdx(b).GetEndAtomIdx())
|
|
48
|
+
atoms_to_use = list(set(atoms_to_use))
|
|
49
|
+
else:
|
|
50
|
+
atoms_to_use = [atomID]
|
|
51
|
+
environment_morgan = None
|
|
52
|
+
smiles_1 = Chem.MolFragmentToSmiles(m, atoms_to_use, bondsToUse=environment_morgan,
|
|
53
|
+
allHsExplicit=True, allBondsExplicit=True, rootedAtAtom=atomID)
|
|
54
|
+
return smiles_1
|
|
55
|
+
|
|
56
|
+
# bit_vector_benzene = get_morgan(mol='c1ccccc1')
|
|
57
|
+
# smi = get_substructure_smiles('c1ccccc1',list(bit_vector_benzene.values())[0][0][0],list(bit_vector_benzene.values())[0][0][1])
|
|
58
|
+
# print(smi) # this tells you the substructures in the bit
|
|
59
|
+
# bit_vector_pyridine = get_morgan(mol='c1ncccc1')
|
|
60
|
+
# below you can see what pyridine and benzene have in common
|
|
61
|
+
# print(set(bit_vector.keys()).intersection(bit_vector_py.keys()))
|