stjames 0.0.122__py3-none-any.whl → 0.0.123__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.


This version of stjames might be problematic. Click here for more details.

@@ -41,11 +41,24 @@ class ScreeningSettings(BaseModel):
41
41
  max_confs: int | None = None
42
42
 
43
43
 
44
+ class ConformerClusteringDescriptor(LowercaseStrEnum):
45
+ """
46
+ Potential descriptors to employ in conformer clustering.
47
+ """
48
+
49
+ SOLVENT_ACCESSIBLE_SURFACE_AREA = "solvent_accessible_surface_area"
50
+ POLAR_SOLVENT_ACCESSIBLE_SURACE_AREA = "polar_solvent_accessible_surface_area"
51
+ RADIUS_OF_GYRATION = "radius_of_gyration"
52
+ PLANE_OF_BEST_FIT = "plane_of_best_fit"
53
+ NORMALIZED_PRINCIPAL_MOMENT_RATIO_1 = "normalized_principal_moment_ratio_1"
54
+ NORMALIZED_PRINCIPAL_MOMENT_RATIO_2 = "normalized_principal_moment_ratio_2"
55
+
56
+
44
57
  class ConformerClusteringSettings(Base):
45
58
  """
46
- Settings for (optionally) clustering conformers based on three-dimensional properties.
59
+ Settings for clustering conformers based on their three-dimensional properties.
47
60
 
48
- The properties used for clustering are:
61
+ The properties used for clustering by default are:
49
62
  - Solvent-accessible surface area
50
63
  - Polar solvent-accessible surface area
51
64
  - Radius of gyration
@@ -59,6 +72,15 @@ class ConformerClusteringSettings(Base):
59
72
  :param conformers_per_cluster: the number of compounds to pick from each cluster
60
73
  """
61
74
 
75
+ descriptors: list[ConformerClusteringDescriptor] = [
76
+ ConformerClusteringDescriptor.SOLVENT_ACCESSIBLE_SURFACE_AREA,
77
+ ConformerClusteringDescriptor.POLAR_SOLVENT_ACCESSIBLE_SURACE_AREA,
78
+ ConformerClusteringDescriptor.RADIUS_OF_GYRATION,
79
+ ConformerClusteringDescriptor.PLANE_OF_BEST_FIT,
80
+ ConformerClusteringDescriptor.NORMALIZED_PRINCIPAL_MOMENT_RATIO_1,
81
+ ConformerClusteringDescriptor.NORMALIZED_PRINCIPAL_MOMENT_RATIO_2,
82
+ ]
83
+
62
84
  num_clusters: PositiveInt = 5
63
85
  conformers_per_cluster: PositiveInt = 3
64
86
 
@@ -324,6 +346,7 @@ class ConformerGenMixin(BaseModel):
324
346
  :param constraints: constraints to add
325
347
  :param nci: add a constraining potential for non-covalent interactions
326
348
  :param max_confs: maximum number of conformers to keep
349
+ :param clustering_settings: how to cluster the conformers (if at all)
327
350
  """
328
351
 
329
352
  conf_gen_mode: Mode = Mode.RAPID
@@ -0,0 +1,13 @@
1
+ """DNA-related workflow data models."""
2
+
3
+ from ..base import Base
4
+
5
+
6
+ class DNASequence(Base):
7
+ """
8
+ DNA sequence metadata.
9
+
10
+ :param sequence: nucleotide string
11
+ """
12
+
13
+ sequence: str
@@ -0,0 +1,15 @@
1
+ """Protein-related workflow data models."""
2
+
3
+ from ..base import Base
4
+
5
+
6
+ class ProteinSequence(Base):
7
+ """
8
+ Protein sequence metadata including cyclic flag.
9
+
10
+ :param sequence: amino-acid sequence string
11
+ :param cyclic: whether this sequence forms a cyclic peptide (defaults to False)
12
+ """
13
+
14
+ sequence: str
15
+ cyclic: bool = False
@@ -68,10 +68,14 @@ class AffinityScore(BaseModel):
68
68
 
69
69
  class ProteinCofoldingWorkflow(FASTAWorkflow):
70
70
  """
71
- A workflow for predicting structures. Especially protein structures.
71
+ Workflow for predicting structures.
72
+
73
+ Especially protein structures. At least one biological sequence is required.
72
74
 
73
75
  Inherited:
74
76
  :param initial_protein_sequences: protein sequences of interest
77
+ :param initial_dna_sequences: DNA sequences of interest
78
+ :param initial_rna_sequences: RNA sequences of interest
75
79
  :param initial_smiles_list: SMILES strings of interest
76
80
 
77
81
  New:
@@ -0,0 +1,13 @@
1
+ """RNA-related workflow data models."""
2
+
3
+ from ..base import Base
4
+
5
+
6
+ class RNASequence(Base):
7
+ """
8
+ RNA sequence metadata.
9
+
10
+ :param sequence: nucleotide string
11
+ """
12
+
13
+ sequence: str
@@ -1,5 +1,7 @@
1
1
  """Base classes for workflows."""
2
2
 
3
+ from typing import Any
4
+
3
5
  from pydantic import field_validator
4
6
 
5
7
  from ..base import Base
@@ -7,6 +9,9 @@ from ..message import Message
7
9
  from ..mode import Mode
8
10
  from ..molecule import Molecule
9
11
  from ..types import UUID
12
+ from .dna import DNASequence
13
+ from .protein import ProteinSequence
14
+ from .rna import RNASequence
10
15
 
11
16
 
12
17
  class Workflow(Base):
@@ -22,31 +27,30 @@ class Workflow(Base):
22
27
  return repr(self)
23
28
 
24
29
 
25
- class ProteinSequence(Base):
26
- """
27
- Protein sequence metadata including cyclic flag.
28
-
29
- :param sequence: amino-acid sequence string
30
- :param cyclic: whether this sequence forms a cyclic peptide (defaults to False)
31
- """
32
-
33
- sequence: str
34
- cyclic: bool = False
35
-
36
-
37
30
  class FASTAWorkflow(Workflow):
38
31
  """
39
- Base class for Workflows that operate on protein sequences and SMILES.
32
+ Base class for Workflows that operate on biological sequences and SMILES.
40
33
 
41
- :param initial_protein_sequences: proteins to evaluate, either plain sequence strings or ProteinSequence objects with cyclic flags
34
+ :param initial_protein_sequences: protein sequences to evaluate, either plain sequence strings or ProteinSequence objects with metadata
35
+ :param initial_dna_sequences: DNA sequences to evaluate, either plain sequence strings or DNASequence objects with metadata
36
+ :param initial_rna_sequences: RNA sequences to evaluate, either plain sequence strings or RNASequence objects with metadata
42
37
  :param initial_smiles_list: SMILES strings of interest
43
38
  :param ligand_binding_affinity_index: optional index selecting which ligand affinity to evaluate
39
+ :raises ValueError: if none of the sequence lists are provided
44
40
  """
45
41
 
46
- initial_protein_sequences: list[ProteinSequence] | list[str]
47
- initial_smiles_list: list[str] | None = None
42
+ initial_protein_sequences: list[ProteinSequence] | list[str] = []
43
+ initial_dna_sequences: list[DNASequence] = []
44
+ initial_rna_sequences: list[RNASequence] = []
45
+ initial_smiles_list: list[str] = []
48
46
  ligand_binding_affinity_index: int | None = None
49
47
 
48
+ def model_post_init(self, __context: Any) -> None:
49
+ if not (self.initial_protein_sequences or self.initial_dna_sequences or self.initial_rna_sequences):
50
+ raise ValueError(
51
+ "Provide at least one of `initial_protein_sequences`, `initial_dna_sequences`, or `initial_rna_sequences`.",
52
+ )
53
+
50
54
 
51
55
  class SMILESWorkflow(Workflow):
52
56
  """
@@ -99,10 +103,10 @@ class ProteinSequenceWorkflow(Workflow):
99
103
  """
100
104
  Base class for Workflows that operate on protein sequences.
101
105
 
102
- :param initial_protein_sequences: protein sequences of interest
106
+ :param initial_protein_sequences: protein sequences to evaluate, either plain sequence strings or ProteinSequence objects with metadata
103
107
  """
104
108
 
105
- protein_sequences: list[str]
109
+ initial_protein_sequences: list[ProteinSequence] | list[str] = []
106
110
 
107
111
 
108
112
  class DBCalculation(Base):
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.4
2
2
  Name: stjames
3
- Version: 0.0.122
3
+ Version: 0.0.123
4
4
  Summary: standardized JSON atom/molecule encoding scheme
5
5
  Author-email: Corin Wagen <corin@rowansci.com>
6
6
  Project-URL: Homepage, https://github.com/rowansci/stjames
@@ -43,8 +43,9 @@ stjames/workflows/basic_calculation.py,sha256=wIiq2lFRN4nxN0__X_JbPSeaUeJ4tKUyg6
43
43
  stjames/workflows/batch_docking.py,sha256=o-t5FkfLlbe60jX1_ZeqWSJJ5vsjEIbTa5GLN3ny_tk,1590
44
44
  stjames/workflows/bde.py,sha256=g_In-caftXiimrhfdptHjpfrYQUs3vF58qYmRnaTN8g,10825
45
45
  stjames/workflows/conformer.py,sha256=18aO6ngMBeGAmQkBdLGCCHr398RIYr1v2hD2IT1u4cc,3005
46
- stjames/workflows/conformer_search.py,sha256=b3xbyFdulc8VLtk12a_v_zWaS_bkyi6cVVqNyTucD38,16544
46
+ stjames/workflows/conformer_search.py,sha256=TaDI3unNjaxBKj4YHASwSaNQHlVSwuZDZdTIxk7MC4Y,17638
47
47
  stjames/workflows/descriptors.py,sha256=T4tc7xdtBdxESGO86KR323jPQ2pgwxBqgV0khA6MEgQ,584
48
+ stjames/workflows/dna.py,sha256=_M79WikFujCsUWr4YaEdOoeDDKPV_DhKptWt0ptktko,194
48
49
  stjames/workflows/docking.py,sha256=t30kqeFXQ0yrlqvN6Jdwt0SdfnJLDsfK-7yFi0gwNbY,4753
49
50
  stjames/workflows/double_ended_ts_search.py,sha256=ovJgEVFc6c3mijCE3TKAY70YvqNmAZ5Y4XgV4-tIxBI,3127
50
51
  stjames/workflows/electronic_properties.py,sha256=GT3-NC7w-dbcOJ-3AzJ7LgzH6frTbiH2Iyb9BCa-SvY,4112
@@ -59,17 +60,19 @@ stjames/workflows/multistage_opt.py,sha256=UN-4WLsT2WEjO5KqDPrcCkb708Co-ZScHx3g2
59
60
  stjames/workflows/nmr.py,sha256=1QEF4SB6dWIr-jzLEZ7V972UnRUOTufOJSHwIGyV3dM,2681
60
61
  stjames/workflows/pka.py,sha256=i-jzl2lN0yRWc0tgrWSBCplITEByfRyEQrlUhjnzcBc,4580
61
62
  stjames/workflows/pose_analysis_md.py,sha256=dpWVKC-8fPdw6ExIXk9xbeVBDUMUYQECpixb-oFa23I,4803
63
+ stjames/workflows/protein.py,sha256=MfwJ3qn24cCoUEczMH7A2NyBlI9t_VcwOowohTPDtYM,346
62
64
  stjames/workflows/protein_binder_design.py,sha256=KnPKQJTMrSO5xfw64Bh7T0wHck1NtysVwkVgHs1cGws,12013
63
- stjames/workflows/protein_cofolding.py,sha256=w7Sg_ttU4bcJb7wlVcI_AAsLM9WVAJcU5ucbNb5Iyzw,4326
65
+ stjames/workflows/protein_cofolding.py,sha256=5rs6wgksW5zKpcEkv0_B4Clt9dSQ-42oKF8fJtSRoaY,4495
64
66
  stjames/workflows/redox_potential.py,sha256=7S18t9Y3eynSnA3lZbRlvLfdbgeBopdiigLzt1zxg5c,3871
67
+ stjames/workflows/rna.py,sha256=FZO3UkRhgG3EnGXsQ70eAZTbeEY2P9u60oLD6JuPPMc,194
65
68
  stjames/workflows/scan.py,sha256=lgpvrrFG03GWQj2tWeBqPQVYSCGLgYdnQsU9bAUZQok,3317
66
69
  stjames/workflows/solubility.py,sha256=lfCVvJjqEaddLUpK6WBxjB7u12Sci-K95A5_qIMkIRM,3028
67
70
  stjames/workflows/spin_states.py,sha256=0degmE-frovgoXweshZyjfjqL7nkbaFoO9YoJhvQnaI,4748
68
71
  stjames/workflows/strain.py,sha256=paYxDDQTB1eYP_c2kLVz1-QX7Vpw0LLb3ujnFin_SOM,1834
69
72
  stjames/workflows/tautomer.py,sha256=7eYKziGPg8Km6lfowTzSkgJfJ4SHUPrAmnTf8Bi-SB0,1164
70
- stjames/workflows/workflow.py,sha256=nwSX-KO2J9Lgd_uNuoYxS1Lv8rZB-jmTfphb8KJODC8,2720
71
- stjames-0.0.122.dist-info/licenses/LICENSE,sha256=i05z7xEhyrg6f8j0lR3XYjShnF-MJGFQ-DnpsZ8yiVI,1084
72
- stjames-0.0.122.dist-info/METADATA,sha256=9McsAFJMWpw8ymFCC3VTRWKU6cXslDyZKGvTHt1u7Og,1725
73
- stjames-0.0.122.dist-info/WHEEL,sha256=_zCd3N1l69ArxyTb8rzEoP9TpbYXkqRFSNOD5OuxnTs,91
74
- stjames-0.0.122.dist-info/top_level.txt,sha256=FYCwxl6quhYOAgG-mnPQcCK8vsVM7B8rIUrO-WrQ_PI,8
75
- stjames-0.0.122.dist-info/RECORD,,
73
+ stjames/workflows/workflow.py,sha256=dJYK9hY8FqNsD-foQsTI7Mpk2aTY87ASjMFgerx6gtQ,3432
74
+ stjames-0.0.123.dist-info/licenses/LICENSE,sha256=i05z7xEhyrg6f8j0lR3XYjShnF-MJGFQ-DnpsZ8yiVI,1084
75
+ stjames-0.0.123.dist-info/METADATA,sha256=r1v4SR_lfdasc-yuQRdmxI7nJXSnVKvbjQiMz4mwW54,1725
76
+ stjames-0.0.123.dist-info/WHEEL,sha256=_zCd3N1l69ArxyTb8rzEoP9TpbYXkqRFSNOD5OuxnTs,91
77
+ stjames-0.0.123.dist-info/top_level.txt,sha256=FYCwxl6quhYOAgG-mnPQcCK8vsVM7B8rIUrO-WrQ_PI,8
78
+ stjames-0.0.123.dist-info/RECORD,,