stjames 0.0.122__py3-none-any.whl → 0.0.123__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Potentially problematic release.
This version of stjames might be problematic. Click here for more details.
- stjames/workflows/conformer_search.py +25 -2
- stjames/workflows/dna.py +13 -0
- stjames/workflows/protein.py +15 -0
- stjames/workflows/protein_cofolding.py +5 -1
- stjames/workflows/rna.py +13 -0
- stjames/workflows/workflow.py +22 -18
- {stjames-0.0.122.dist-info → stjames-0.0.123.dist-info}/METADATA +1 -1
- {stjames-0.0.122.dist-info → stjames-0.0.123.dist-info}/RECORD +11 -8
- {stjames-0.0.122.dist-info → stjames-0.0.123.dist-info}/WHEEL +0 -0
- {stjames-0.0.122.dist-info → stjames-0.0.123.dist-info}/licenses/LICENSE +0 -0
- {stjames-0.0.122.dist-info → stjames-0.0.123.dist-info}/top_level.txt +0 -0
|
@@ -41,11 +41,24 @@ class ScreeningSettings(BaseModel):
|
|
|
41
41
|
max_confs: int | None = None
|
|
42
42
|
|
|
43
43
|
|
|
44
|
+
class ConformerClusteringDescriptor(LowercaseStrEnum):
|
|
45
|
+
"""
|
|
46
|
+
Potential descriptors to employ in conformer clustering.
|
|
47
|
+
"""
|
|
48
|
+
|
|
49
|
+
SOLVENT_ACCESSIBLE_SURFACE_AREA = "solvent_accessible_surface_area"
|
|
50
|
+
POLAR_SOLVENT_ACCESSIBLE_SURACE_AREA = "polar_solvent_accessible_surface_area"
|
|
51
|
+
RADIUS_OF_GYRATION = "radius_of_gyration"
|
|
52
|
+
PLANE_OF_BEST_FIT = "plane_of_best_fit"
|
|
53
|
+
NORMALIZED_PRINCIPAL_MOMENT_RATIO_1 = "normalized_principal_moment_ratio_1"
|
|
54
|
+
NORMALIZED_PRINCIPAL_MOMENT_RATIO_2 = "normalized_principal_moment_ratio_2"
|
|
55
|
+
|
|
56
|
+
|
|
44
57
|
class ConformerClusteringSettings(Base):
|
|
45
58
|
"""
|
|
46
|
-
Settings for
|
|
59
|
+
Settings for clustering conformers based on their three-dimensional properties.
|
|
47
60
|
|
|
48
|
-
The properties used for clustering are:
|
|
61
|
+
The properties used for clustering by default are:
|
|
49
62
|
- Solvent-accessible surface area
|
|
50
63
|
- Polar solvent-accessible surface area
|
|
51
64
|
- Radius of gyration
|
|
@@ -59,6 +72,15 @@ class ConformerClusteringSettings(Base):
|
|
|
59
72
|
:param conformers_per_cluster: the number of compounds to pick from each cluster
|
|
60
73
|
"""
|
|
61
74
|
|
|
75
|
+
descriptors: list[ConformerClusteringDescriptor] = [
|
|
76
|
+
ConformerClusteringDescriptor.SOLVENT_ACCESSIBLE_SURFACE_AREA,
|
|
77
|
+
ConformerClusteringDescriptor.POLAR_SOLVENT_ACCESSIBLE_SURACE_AREA,
|
|
78
|
+
ConformerClusteringDescriptor.RADIUS_OF_GYRATION,
|
|
79
|
+
ConformerClusteringDescriptor.PLANE_OF_BEST_FIT,
|
|
80
|
+
ConformerClusteringDescriptor.NORMALIZED_PRINCIPAL_MOMENT_RATIO_1,
|
|
81
|
+
ConformerClusteringDescriptor.NORMALIZED_PRINCIPAL_MOMENT_RATIO_2,
|
|
82
|
+
]
|
|
83
|
+
|
|
62
84
|
num_clusters: PositiveInt = 5
|
|
63
85
|
conformers_per_cluster: PositiveInt = 3
|
|
64
86
|
|
|
@@ -324,6 +346,7 @@ class ConformerGenMixin(BaseModel):
|
|
|
324
346
|
:param constraints: constraints to add
|
|
325
347
|
:param nci: add a constraining potential for non-covalent interactions
|
|
326
348
|
:param max_confs: maximum number of conformers to keep
|
|
349
|
+
:param clustering_settings: how to cluster the conformers (if at all)
|
|
327
350
|
"""
|
|
328
351
|
|
|
329
352
|
conf_gen_mode: Mode = Mode.RAPID
|
stjames/workflows/dna.py
ADDED
|
@@ -0,0 +1,15 @@
|
|
|
1
|
+
"""Protein-related workflow data models."""
|
|
2
|
+
|
|
3
|
+
from ..base import Base
|
|
4
|
+
|
|
5
|
+
|
|
6
|
+
class ProteinSequence(Base):
|
|
7
|
+
"""
|
|
8
|
+
Protein sequence metadata including cyclic flag.
|
|
9
|
+
|
|
10
|
+
:param sequence: amino-acid sequence string
|
|
11
|
+
:param cyclic: whether this sequence forms a cyclic peptide (defaults to False)
|
|
12
|
+
"""
|
|
13
|
+
|
|
14
|
+
sequence: str
|
|
15
|
+
cyclic: bool = False
|
|
@@ -68,10 +68,14 @@ class AffinityScore(BaseModel):
|
|
|
68
68
|
|
|
69
69
|
class ProteinCofoldingWorkflow(FASTAWorkflow):
|
|
70
70
|
"""
|
|
71
|
-
|
|
71
|
+
Workflow for predicting structures.
|
|
72
|
+
|
|
73
|
+
Especially protein structures. At least one biological sequence is required.
|
|
72
74
|
|
|
73
75
|
Inherited:
|
|
74
76
|
:param initial_protein_sequences: protein sequences of interest
|
|
77
|
+
:param initial_dna_sequences: DNA sequences of interest
|
|
78
|
+
:param initial_rna_sequences: RNA sequences of interest
|
|
75
79
|
:param initial_smiles_list: SMILES strings of interest
|
|
76
80
|
|
|
77
81
|
New:
|
stjames/workflows/rna.py
ADDED
stjames/workflows/workflow.py
CHANGED
|
@@ -1,5 +1,7 @@
|
|
|
1
1
|
"""Base classes for workflows."""
|
|
2
2
|
|
|
3
|
+
from typing import Any
|
|
4
|
+
|
|
3
5
|
from pydantic import field_validator
|
|
4
6
|
|
|
5
7
|
from ..base import Base
|
|
@@ -7,6 +9,9 @@ from ..message import Message
|
|
|
7
9
|
from ..mode import Mode
|
|
8
10
|
from ..molecule import Molecule
|
|
9
11
|
from ..types import UUID
|
|
12
|
+
from .dna import DNASequence
|
|
13
|
+
from .protein import ProteinSequence
|
|
14
|
+
from .rna import RNASequence
|
|
10
15
|
|
|
11
16
|
|
|
12
17
|
class Workflow(Base):
|
|
@@ -22,31 +27,30 @@ class Workflow(Base):
|
|
|
22
27
|
return repr(self)
|
|
23
28
|
|
|
24
29
|
|
|
25
|
-
class ProteinSequence(Base):
|
|
26
|
-
"""
|
|
27
|
-
Protein sequence metadata including cyclic flag.
|
|
28
|
-
|
|
29
|
-
:param sequence: amino-acid sequence string
|
|
30
|
-
:param cyclic: whether this sequence forms a cyclic peptide (defaults to False)
|
|
31
|
-
"""
|
|
32
|
-
|
|
33
|
-
sequence: str
|
|
34
|
-
cyclic: bool = False
|
|
35
|
-
|
|
36
|
-
|
|
37
30
|
class FASTAWorkflow(Workflow):
|
|
38
31
|
"""
|
|
39
|
-
Base class for Workflows that operate on
|
|
32
|
+
Base class for Workflows that operate on biological sequences and SMILES.
|
|
40
33
|
|
|
41
|
-
:param initial_protein_sequences:
|
|
34
|
+
:param initial_protein_sequences: protein sequences to evaluate, either plain sequence strings or ProteinSequence objects with metadata
|
|
35
|
+
:param initial_dna_sequences: DNA sequences to evaluate, either plain sequence strings or DNASequence objects with metadata
|
|
36
|
+
:param initial_rna_sequences: RNA sequences to evaluate, either plain sequence strings or RNASequence objects with metadata
|
|
42
37
|
:param initial_smiles_list: SMILES strings of interest
|
|
43
38
|
:param ligand_binding_affinity_index: optional index selecting which ligand affinity to evaluate
|
|
39
|
+
:raises ValueError: if none of the sequence lists are provided
|
|
44
40
|
"""
|
|
45
41
|
|
|
46
|
-
initial_protein_sequences: list[ProteinSequence] | list[str]
|
|
47
|
-
|
|
42
|
+
initial_protein_sequences: list[ProteinSequence] | list[str] = []
|
|
43
|
+
initial_dna_sequences: list[DNASequence] = []
|
|
44
|
+
initial_rna_sequences: list[RNASequence] = []
|
|
45
|
+
initial_smiles_list: list[str] = []
|
|
48
46
|
ligand_binding_affinity_index: int | None = None
|
|
49
47
|
|
|
48
|
+
def model_post_init(self, __context: Any) -> None:
|
|
49
|
+
if not (self.initial_protein_sequences or self.initial_dna_sequences or self.initial_rna_sequences):
|
|
50
|
+
raise ValueError(
|
|
51
|
+
"Provide at least one of `initial_protein_sequences`, `initial_dna_sequences`, or `initial_rna_sequences`.",
|
|
52
|
+
)
|
|
53
|
+
|
|
50
54
|
|
|
51
55
|
class SMILESWorkflow(Workflow):
|
|
52
56
|
"""
|
|
@@ -99,10 +103,10 @@ class ProteinSequenceWorkflow(Workflow):
|
|
|
99
103
|
"""
|
|
100
104
|
Base class for Workflows that operate on protein sequences.
|
|
101
105
|
|
|
102
|
-
:param initial_protein_sequences: protein sequences
|
|
106
|
+
:param initial_protein_sequences: protein sequences to evaluate, either plain sequence strings or ProteinSequence objects with metadata
|
|
103
107
|
"""
|
|
104
108
|
|
|
105
|
-
|
|
109
|
+
initial_protein_sequences: list[ProteinSequence] | list[str] = []
|
|
106
110
|
|
|
107
111
|
|
|
108
112
|
class DBCalculation(Base):
|
|
@@ -43,8 +43,9 @@ stjames/workflows/basic_calculation.py,sha256=wIiq2lFRN4nxN0__X_JbPSeaUeJ4tKUyg6
|
|
|
43
43
|
stjames/workflows/batch_docking.py,sha256=o-t5FkfLlbe60jX1_ZeqWSJJ5vsjEIbTa5GLN3ny_tk,1590
|
|
44
44
|
stjames/workflows/bde.py,sha256=g_In-caftXiimrhfdptHjpfrYQUs3vF58qYmRnaTN8g,10825
|
|
45
45
|
stjames/workflows/conformer.py,sha256=18aO6ngMBeGAmQkBdLGCCHr398RIYr1v2hD2IT1u4cc,3005
|
|
46
|
-
stjames/workflows/conformer_search.py,sha256=
|
|
46
|
+
stjames/workflows/conformer_search.py,sha256=TaDI3unNjaxBKj4YHASwSaNQHlVSwuZDZdTIxk7MC4Y,17638
|
|
47
47
|
stjames/workflows/descriptors.py,sha256=T4tc7xdtBdxESGO86KR323jPQ2pgwxBqgV0khA6MEgQ,584
|
|
48
|
+
stjames/workflows/dna.py,sha256=_M79WikFujCsUWr4YaEdOoeDDKPV_DhKptWt0ptktko,194
|
|
48
49
|
stjames/workflows/docking.py,sha256=t30kqeFXQ0yrlqvN6Jdwt0SdfnJLDsfK-7yFi0gwNbY,4753
|
|
49
50
|
stjames/workflows/double_ended_ts_search.py,sha256=ovJgEVFc6c3mijCE3TKAY70YvqNmAZ5Y4XgV4-tIxBI,3127
|
|
50
51
|
stjames/workflows/electronic_properties.py,sha256=GT3-NC7w-dbcOJ-3AzJ7LgzH6frTbiH2Iyb9BCa-SvY,4112
|
|
@@ -59,17 +60,19 @@ stjames/workflows/multistage_opt.py,sha256=UN-4WLsT2WEjO5KqDPrcCkb708Co-ZScHx3g2
|
|
|
59
60
|
stjames/workflows/nmr.py,sha256=1QEF4SB6dWIr-jzLEZ7V972UnRUOTufOJSHwIGyV3dM,2681
|
|
60
61
|
stjames/workflows/pka.py,sha256=i-jzl2lN0yRWc0tgrWSBCplITEByfRyEQrlUhjnzcBc,4580
|
|
61
62
|
stjames/workflows/pose_analysis_md.py,sha256=dpWVKC-8fPdw6ExIXk9xbeVBDUMUYQECpixb-oFa23I,4803
|
|
63
|
+
stjames/workflows/protein.py,sha256=MfwJ3qn24cCoUEczMH7A2NyBlI9t_VcwOowohTPDtYM,346
|
|
62
64
|
stjames/workflows/protein_binder_design.py,sha256=KnPKQJTMrSO5xfw64Bh7T0wHck1NtysVwkVgHs1cGws,12013
|
|
63
|
-
stjames/workflows/protein_cofolding.py,sha256=
|
|
65
|
+
stjames/workflows/protein_cofolding.py,sha256=5rs6wgksW5zKpcEkv0_B4Clt9dSQ-42oKF8fJtSRoaY,4495
|
|
64
66
|
stjames/workflows/redox_potential.py,sha256=7S18t9Y3eynSnA3lZbRlvLfdbgeBopdiigLzt1zxg5c,3871
|
|
67
|
+
stjames/workflows/rna.py,sha256=FZO3UkRhgG3EnGXsQ70eAZTbeEY2P9u60oLD6JuPPMc,194
|
|
65
68
|
stjames/workflows/scan.py,sha256=lgpvrrFG03GWQj2tWeBqPQVYSCGLgYdnQsU9bAUZQok,3317
|
|
66
69
|
stjames/workflows/solubility.py,sha256=lfCVvJjqEaddLUpK6WBxjB7u12Sci-K95A5_qIMkIRM,3028
|
|
67
70
|
stjames/workflows/spin_states.py,sha256=0degmE-frovgoXweshZyjfjqL7nkbaFoO9YoJhvQnaI,4748
|
|
68
71
|
stjames/workflows/strain.py,sha256=paYxDDQTB1eYP_c2kLVz1-QX7Vpw0LLb3ujnFin_SOM,1834
|
|
69
72
|
stjames/workflows/tautomer.py,sha256=7eYKziGPg8Km6lfowTzSkgJfJ4SHUPrAmnTf8Bi-SB0,1164
|
|
70
|
-
stjames/workflows/workflow.py,sha256=
|
|
71
|
-
stjames-0.0.
|
|
72
|
-
stjames-0.0.
|
|
73
|
-
stjames-0.0.
|
|
74
|
-
stjames-0.0.
|
|
75
|
-
stjames-0.0.
|
|
73
|
+
stjames/workflows/workflow.py,sha256=dJYK9hY8FqNsD-foQsTI7Mpk2aTY87ASjMFgerx6gtQ,3432
|
|
74
|
+
stjames-0.0.123.dist-info/licenses/LICENSE,sha256=i05z7xEhyrg6f8j0lR3XYjShnF-MJGFQ-DnpsZ8yiVI,1084
|
|
75
|
+
stjames-0.0.123.dist-info/METADATA,sha256=r1v4SR_lfdasc-yuQRdmxI7nJXSnVKvbjQiMz4mwW54,1725
|
|
76
|
+
stjames-0.0.123.dist-info/WHEEL,sha256=_zCd3N1l69ArxyTb8rzEoP9TpbYXkqRFSNOD5OuxnTs,91
|
|
77
|
+
stjames-0.0.123.dist-info/top_level.txt,sha256=FYCwxl6quhYOAgG-mnPQcCK8vsVM7B8rIUrO-WrQ_PI,8
|
|
78
|
+
stjames-0.0.123.dist-info/RECORD,,
|
|
File without changes
|
|
File without changes
|
|
File without changes
|