rdworks 0.54.2__py3-none-any.whl → 0.56.1__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- rdworks/__init__.py +4 -5
- rdworks/{workflow.py → complete.py} +41 -8
- rdworks/conf.py +2 -2
- rdworks/microstates.py +7 -0
- {rdworks-0.54.2.dist-info → rdworks-0.56.1.dist-info}/METADATA +1 -1
- {rdworks-0.54.2.dist-info → rdworks-0.56.1.dist-info}/RECORD +9 -10
- rdworks/pka.py +0 -38
- {rdworks-0.54.2.dist-info → rdworks-0.56.1.dist-info}/WHEEL +0 -0
- {rdworks-0.54.2.dist-info → rdworks-0.56.1.dist-info}/licenses/LICENSE +0 -0
- {rdworks-0.54.2.dist-info → rdworks-0.56.1.dist-info}/top_level.txt +0 -0
rdworks/__init__.py
CHANGED
@@ -1,16 +1,15 @@
|
|
1
|
-
__version__ = '0.
|
1
|
+
__version__ = '0.56.1'
|
2
2
|
|
3
3
|
from rdworks.conf import Conf
|
4
4
|
from rdworks.mol import Mol
|
5
5
|
from rdworks.mollibr import MolLibr
|
6
6
|
|
7
|
-
from rdworks.workflow import complete_stereoisomers, complete_tautomers
|
8
|
-
|
9
|
-
from rdworks.ionized import IonizedStates
|
10
|
-
|
11
7
|
from rdworks.readin import read_csv, merge_csv, read_dataframe, read_smi, read_sdf, read_mae
|
12
8
|
from rdworks.std import desalt_smiles, standardize_smiles, standardize
|
13
9
|
|
10
|
+
from rdworks.complete import complete_stereoisomers, complete_tautomers
|
11
|
+
from rdworks.ionized import IonizedStates
|
12
|
+
|
14
13
|
from rdworks.rgroup import expand_rgroup, most_common, most_common_in_NP
|
15
14
|
from rdworks.scaffold import scaffold_network, scaffold_tree, BRICS_fragmented, BRICS_fragment_indices
|
16
15
|
from rdworks.matchedseries import MatchedSeries
|
@@ -1,10 +1,8 @@
|
|
1
|
-
|
1
|
+
from rdworks import Mol, MolLibr
|
2
2
|
from rdworks.stereoisomers import enumerate_stereoisomers, enumerate_ring_bond_stereoisomers
|
3
|
-
from rdworks.mol import Mol
|
4
|
-
from rdworks.mollibr import MolLibr
|
5
|
-
|
6
3
|
from rdkit import Chem
|
7
4
|
from rdkit.Chem.MolStandardize import rdMolStandardize
|
5
|
+
from rdkit.Chem.EnumerateStereoisomers import EnumerateStereoisomers, StereoEnumerationOptions
|
8
6
|
|
9
7
|
|
10
8
|
def complete_stereoisomers(molecular_input: str | Chem.Mol | Mol,
|
@@ -26,6 +24,8 @@ def complete_stereoisomers(molecular_input: str | Chem.Mol | Mol,
|
|
26
24
|
Returns:
|
27
25
|
MolLibr: a library of complete stereoisomers.
|
28
26
|
"""
|
27
|
+
from rdworks import Mol, MolLibr
|
28
|
+
|
29
29
|
if isinstance(molecular_input, Mol):
|
30
30
|
if name:
|
31
31
|
mol = molecular_input.rename(name)
|
@@ -66,6 +66,18 @@ def complete_stereoisomers(molecular_input: str | Chem.Mol | Mol,
|
|
66
66
|
return libr
|
67
67
|
|
68
68
|
|
69
|
+
def can_have_stereo(bond):
|
70
|
+
"""Check if a double bond can have E/Z stereochemistry"""
|
71
|
+
atom1, atom2 = bond.GetBeginAtom(), bond.GetEndAtom()
|
72
|
+
|
73
|
+
# Check if both atoms have at least 2 non-hydrogen neighbors
|
74
|
+
for atom in [atom1, atom2]:
|
75
|
+
non_h_neighbors = [n for n in atom.GetNeighbors() if n.GetAtomicNum() != 1]
|
76
|
+
if len(non_h_neighbors) < 2:
|
77
|
+
return False
|
78
|
+
|
79
|
+
return True
|
80
|
+
|
69
81
|
|
70
82
|
def complete_tautomers(mol: Mol, **kwargs) -> MolLibr:
|
71
83
|
"""Returns a library of enumerated tautomers.
|
@@ -77,9 +89,30 @@ def complete_tautomers(mol: Mol, **kwargs) -> MolLibr:
|
|
77
89
|
MolLibr: a library of enumerated tautomers.
|
78
90
|
"""
|
79
91
|
enumerator = rdMolStandardize.TautomerEnumerator()
|
80
|
-
|
92
|
+
enumerator.SetRemoveSp3Stereo(False)
|
93
|
+
enumerator.SetRemoveBondStereo(False) # Don't remove existing stereo
|
94
|
+
tautomers = list(enumerator.Enumerate(mol.rdmol))
|
95
|
+
|
96
|
+
all_stereoisomers = []
|
97
|
+
|
98
|
+
for tautomer in tautomers:
|
99
|
+
# Find unspecified double bonds that could have E/Z stereo
|
100
|
+
unspecified_bonds = []
|
101
|
+
for bond in tautomer.GetBonds():
|
102
|
+
if (bond.GetBondType() == Chem.BondType.DOUBLE and
|
103
|
+
bond.GetStereo() == Chem.BondStereo.STEREONONE and
|
104
|
+
can_have_stereo(bond)):
|
105
|
+
unspecified_bonds.append(bond.GetIdx())
|
106
|
+
|
107
|
+
if unspecified_bonds:
|
108
|
+
# Enumerate all possible stereoisomers
|
109
|
+
opts = StereoEnumerationOptions(onlyUnassigned=True, maxIsomers=50)
|
110
|
+
stereoisomers = list(EnumerateStereoisomers(tautomer, options=opts))
|
111
|
+
all_stereoisomers.extend(stereoisomers)
|
112
|
+
else:
|
113
|
+
all_stereoisomers.append(tautomer)
|
81
114
|
|
82
|
-
if len(
|
83
|
-
return MolLibr(
|
115
|
+
if len(all_stereoisomers) > 1:
|
116
|
+
return MolLibr(all_stereoisomers).unique().rename(mol.name, sep='.').compute(**kwargs)
|
84
117
|
|
85
|
-
return MolLibr(
|
118
|
+
return MolLibr(all_stereoisomers).compute(**kwargs)
|
rdworks/conf.py
CHANGED
@@ -546,9 +546,9 @@ class Conf:
|
|
546
546
|
conf = frag_conf.copy()
|
547
547
|
conf.set_torsion(*frag_ijkl, angle) # atoms bonded to `l` move.
|
548
548
|
conf = conf.optimize(calculator, fmax, **kwargs)
|
549
|
+
data['angle'].append(angle)
|
549
550
|
# conf.optimize() updates coordinates and conf.props:
|
550
551
|
# `E_tot_init(kcal/mol)`, `E_tot(kcal/mol)`, `Converged`.
|
551
|
-
data['angle'].append(angle)
|
552
552
|
data['init'].append(conf.props['E_tot_init(kcal/mol)'])
|
553
553
|
data['last'].append(conf.props['E_tot(kcal/mol)'])
|
554
554
|
data['Converged'].append(conf.props['Converged'])
|
@@ -562,9 +562,9 @@ class Conf:
|
|
562
562
|
conf = ref_conf.copy()
|
563
563
|
conf.set_torsion(*indices, angle) # atoms bonded to `l` move.
|
564
564
|
conf = conf.optimize(calculator, fmax, **kwargs)
|
565
|
+
data['angle'].append(angle)
|
565
566
|
# conf.optimize() updates coordinates and conf.props:
|
566
567
|
# `E_tot_init(kcal/mol)`, `E_tot(kcal/mol)`, `Converged`.
|
567
|
-
data['angle'].append(conf.props['angle'])
|
568
568
|
data['init'].append(conf.props['E_tot_init(kcal/mol)'])
|
569
569
|
data['last'].append(conf.props['E_tot(kcal/mol)'])
|
570
570
|
data['Converged'].append(conf.props['Converged'])
|
rdworks/microstates.py
CHANGED
@@ -4,9 +4,16 @@ import itertools
|
|
4
4
|
import logging
|
5
5
|
|
6
6
|
from types import SimpleNamespace
|
7
|
+
from pathlib import Path
|
7
8
|
from rdworks import Conf, Mol
|
8
9
|
from rdworks.xtb.wrapper import GFN2xTB
|
9
10
|
|
11
|
+
from rdkit import Chem
|
12
|
+
from rdkit.Chem import (
|
13
|
+
AllChem, RemoveHs, CanonSmiles, MolFromSmarts,
|
14
|
+
GetFormalCharge, RWMol, AddHs, SanitizeMol,
|
15
|
+
MolToSmiles, MolFromSmiles,
|
16
|
+
)
|
10
17
|
|
11
18
|
logger = logging.getLogger(__name__)
|
12
19
|
|
@@ -1,13 +1,13 @@
|
|
1
|
-
rdworks/__init__.py,sha256=
|
2
|
-
rdworks/
|
1
|
+
rdworks/__init__.py,sha256=d-zUnWFkFgiYgKXi2hBDA6KX99RDMX4c8RJqrCpQozw,1356
|
2
|
+
rdworks/complete.py,sha256=MGNw3O66tPN4I2PIrrjz2ufMako0D1KezvHSNjfpRf8,4642
|
3
|
+
rdworks/conf.py,sha256=_4SxHJiaOdK_4KY9adxvQTfzJFudvAQoHRgvejmfyGc,36365
|
3
4
|
rdworks/descriptor.py,sha256=34T_dQ6g8v3u-ym8TLKbQtxIIV5TEo-d3pdedq3o-cg,2106
|
4
5
|
rdworks/display.py,sha256=JR0gR26UpH-JCxVOaqXZCUj2MiGZSrx9Me87FncspVI,13469
|
5
6
|
rdworks/ionized.py,sha256=_t-Ajssv1rytV4Y_KsSbxfnsBKqy-EusbhNUtaWcV6o,7681
|
6
7
|
rdworks/matchedseries.py,sha256=A3ON4CUpQV159mu9VqgNiJ8uoQ9ePOry9d3ra4NCAgc,10377
|
7
|
-
rdworks/microstates.py,sha256=
|
8
|
+
rdworks/microstates.py,sha256=hf_5UDDgZxJGnrqRiv2fbS1j3zq7LMccHSOJbpEgjX8,5503
|
8
9
|
rdworks/mol.py,sha256=4gNjs_ryNNWThMekV794uwjjBE-JLGGWcdyMaS9-xP8,71369
|
9
10
|
rdworks/mollibr.py,sha256=X4UBO6Ga-QmNS7RwUiaDYAx0Q5hnWs71yTkEpH02Qb4,37696
|
10
|
-
rdworks/pka.py,sha256=NVJVfpcNEMlX5QRyLBgUM7GIT7VMjO-llAR4LWc8J2c,1656
|
11
11
|
rdworks/readin.py,sha256=b1BHchQMC5EgQd3C05n72t_aa_9u0iKQWyyIqjyfkPc,11809
|
12
12
|
rdworks/rgroup.py,sha256=ivF2gzmRtt339rxEnkv2KfnCs0CUdBbnSje7Y54rtFI,57996
|
13
13
|
rdworks/scaffold.py,sha256=60T5YacyxZsEpDo_J5Qxulm2YNQO4EQR8PcNUwjn1QU,22026
|
@@ -17,7 +17,6 @@ rdworks/testdata.py,sha256=TmbNPA-ju6nTBt_Yts4EJUFmL9Cd6DCVXrDF42QLlHw,1732
|
|
17
17
|
rdworks/torsion.py,sha256=UUaYOvNS89SlLFauYiAboUqysy32EN0_Gktc4xxuDQI,18788
|
18
18
|
rdworks/units.py,sha256=nljKPHcr6IWoAp0CkL7y1gSNDd6a07NeVfxXwSMuHQM,365
|
19
19
|
rdworks/utils.py,sha256=d2Sio8WTlGPsmBOHIYDCMWg_7X4rTWjJQAqzd7ywo2A,14191
|
20
|
-
rdworks/workflow.py,sha256=MtP9QUGgCKMyI3G4vp8sokos_UyaQvTHFOEPUJresZU,3139
|
21
20
|
rdworks/xml.py,sha256=aaMhwVRGvt1VzasaKDnkYnZ4kp2cIgvGb1CsmMgwQ_c,10704
|
22
21
|
rdworks/autograph/__init__.py,sha256=0Qfjwo0h4Q0n08zsqHRbuNOZms6MuNXnWErnQpQ6Px0,140
|
23
22
|
rdworks/autograph/autograph.py,sha256=frjsUaCTOD-Z1lYPzOxRoTtqMMiYroWAy6tSwKn3CUA,8769
|
@@ -67,8 +66,8 @@ rdworks/predefined/misc/reactive-part-3.xml,sha256=LgWHSEbRTVmgBoIO45xbTo1xQJs0X
|
|
67
66
|
rdworks/predefined/misc/reactive.xml,sha256=syedoQ6VYUfRLnxy99ObuDniJ_a_WhrWAJbTKFfJ6VY,11248
|
68
67
|
rdworks/xtb/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
69
68
|
rdworks/xtb/wrapper.py,sha256=YpZY8SJ9Lrp3I3_GAVawSb_4_Zc8hcJtF5l7-I-Wbys,22048
|
70
|
-
rdworks-0.
|
71
|
-
rdworks-0.
|
72
|
-
rdworks-0.
|
73
|
-
rdworks-0.
|
74
|
-
rdworks-0.
|
69
|
+
rdworks-0.56.1.dist-info/licenses/LICENSE,sha256=UOkJSBqYyQUvtCp7a-vdCANeEcLE2dnTie_eB1By5SY,1074
|
70
|
+
rdworks-0.56.1.dist-info/METADATA,sha256=4jemVgYRM_UDuGjLUOK8vbboQZiqctnx-rrZgnvAg5k,1967
|
71
|
+
rdworks-0.56.1.dist-info/WHEEL,sha256=_zCd3N1l69ArxyTb8rzEoP9TpbYXkqRFSNOD5OuxnTs,91
|
72
|
+
rdworks-0.56.1.dist-info/top_level.txt,sha256=05C98HbvBK2axUBogC_hAT_CdpOeQYGnQ6vRAgawr8s,8
|
73
|
+
rdworks-0.56.1.dist-info/RECORD,,
|
rdworks/pka.py
DELETED
@@ -1,38 +0,0 @@
|
|
1
|
-
"""This module is an implementation in progress of the decision tree method for pKa prediction.
|
2
|
-
|
3
|
-
Crippen, J. Chem. Inf. Model., Vol. 48, No. 10, 2008, 2042-2053.
|
4
|
-
|
5
|
-
The SMARTS patterns and pKa values were taken from the supporting information of the paper.
|
6
|
-
These "MOE SMARTS" were converted to generic SMARTS which relied on use of some recursive SMARTS patterns.
|
7
|
-
The first data row then describes nodes 1, and then the tree expands out based on decisions of SMARTS-matching:
|
8
|
-
if node 2 is yes to pattern [#8,#16,#34,#52,#84;H]C(=O) - giving pKa 3.68 and range 5.96
|
9
|
-
node 3 is no to the same pattern - giving pKa 7.21 and range 17.32
|
10
|
-
Then nodes 4,5 are under 2 and 6,7 are under 3, etc, etc until the leaf nodes are reached
|
11
|
-
"""
|
12
|
-
|
13
|
-
|
14
|
-
import importlib.resources
|
15
|
-
from collections import namedtuple
|
16
|
-
from typing import Union
|
17
|
-
|
18
|
-
from rdkit import Chem
|
19
|
-
from rdkit.Chem import AllChem
|
20
|
-
|
21
|
-
datadir = importlib.resources.files('rdworks.predefined')
|
22
|
-
DecisionTreeNode = namedtuple('DecisionTree', ('node', 'parent', 'child', 'FP', 'SMARTS', 'YN', 'pKa', 'pKa_range'))
|
23
|
-
decision_tree = []
|
24
|
-
with open(datadir / "pKa_decision_tree.ext", "r") as f:
|
25
|
-
for line in f:
|
26
|
-
if (not line) or line.startswith('#'):
|
27
|
-
continue
|
28
|
-
decision_tree.append(DecisionTreeNode(line.strip().split()))
|
29
|
-
|
30
|
-
|
31
|
-
def decision_tree_pKa(rdmol:Chem.Mol) -> Union[float, None]:
|
32
|
-
pKa = None
|
33
|
-
for _ in decision_tree:
|
34
|
-
patt = Chem.MolFromSmarts(_.SMARTS) # make an RDKit query molecule
|
35
|
-
match = rdmol.HasSubstructMatch(patt) # check if we have a match for our test molecule
|
36
|
-
# pKa = float(values[6])
|
37
|
-
# pKa_range = float(values[7])
|
38
|
-
return pKa
|
File without changes
|
File without changes
|
File without changes
|