PyPI - molcraft - Versions diffs - 0.1.0a15__py3-none-any.whl → 0.1.0a17__py3-none-any.whl - Mend

molcraft 0.1.0a15__py3-none-any.whl → 0.1.0a17__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of molcraft might be problematic. Click here for more details.

Files changed (21) hide show

molcraft/__init__.py +1 -2
molcraft/applications/chromatography.py +0 -0
molcraft/applications/proteomics.py +194 -0
molcraft/chem.py +17 -22
molcraft/datasets.py +6 -6
molcraft/descriptors.py +14 -0
molcraft/features.py +50 -58
molcraft/featurizers.py +257 -487
molcraft/layers.py +50 -0
molcraft/models.py +2 -0
molcraft/records.py +24 -15
{molcraft-0.1.0a15.dist-info → molcraft-0.1.0a17.dist-info}/METADATA +14 -12
molcraft-0.1.0a17.dist-info/RECORD +21 -0
molcraft/apps/peptides.py +0 -429
molcraft/apps/qsrr.py +0 -47
molcraft/conformers.py +0 -151
molcraft-0.1.0a15.dist-info/RECORD +0 -22
/molcraft/{apps → applications}/__init__.py +0 -0
{molcraft-0.1.0a15.dist-info → molcraft-0.1.0a17.dist-info}/WHEEL +0 -0
{molcraft-0.1.0a15.dist-info → molcraft-0.1.0a17.dist-info}/licenses/LICENSE +0 -0
{molcraft-0.1.0a15.dist-info → molcraft-0.1.0a17.dist-info}/top_level.txt +0 -0

molcraft/layers.py CHANGED Viewed

@@ -1430,6 +1430,56 @@ class EdgeEmbedding(GraphLayer):
         return config
+@keras.saving.register_keras_serializable(package='molcraft')
+class AddContext(GraphLayer):
+    """Context adding layer.
+    Adds context to super nodes.
+    """
+    def __init__(
+        self,
+        field: str = 'feature',
+        drop: bool = False,
+        normalize: bool = False,
+        **kwargs
+    ) -> None:
+        super().__init__(**kwargs)
+        self.field = field
+        self.drop = drop
+        self._normalize = normalize
+    def build(self, spec: tensors.GraphTensor.Spec) -> None:
+        feature_dim = spec.node['feature'].shape[-1]
+        self._context_dense = self.get_dense(feature_dim)
+        if not self._normalize:
+            self._norm = keras.layers.Identity()
+        elif str(self._normalize).lower().startswith('layer'):
+            self._norm = keras.layers.LayerNormalization()
+        else:
+            self._norm = keras.layers.BatchNormalization()
+    def propagate(self, tensor: tensors.GraphTensor) -> tensors.GraphTensor:
+        context = tensor.context[self.field]
+        context = self._context_dense(context)
+        context = self._norm(context)
+        node_feature = ops.scatter_add(
+            tensor.node['feature'], tensor.node['super'], context
+        )
+        data = {'node': {'feature': node_feature}}
+        if self.drop:
+            data['context'] = {self.field: None}
+        return tensor.update(data)
+    def get_config(self) -> dict:
+        config = super().get_config()
+        config['field'] = self.field
+        config['drop'] = self.drop
+        config['normalize'] = self._normalize
+        return config
 @keras.saving.register_keras_serializable(package='molcraft')
 class GraphNetwork(GraphLayer):

molcraft/models.py CHANGED Viewed

@@ -154,6 +154,7 @@ class GraphModel(layers.GraphLayer, keras.models.Model):
         return graph
     def get_config(self):
+        """Obtain model config."""
         config = super().get_config()
         if hasattr(self, '_model_layers') and self._model_layers is not None:
             config['model_layers'] = [
@@ -164,6 +165,7 @@ class GraphModel(layers.GraphLayer, keras.models.Model):
     @classmethod
     def from_config(cls, config: dict):
+        """Obtain model from model config."""
         if 'model_layers' in config:
             config['model_layers'] = [
                 keras.saving.deserialize_keras_object(l)

molcraft/records.py CHANGED Viewed

@@ -14,7 +14,7 @@ from molcraft import featurizers
 def write(
     inputs: list[str | tuple],
-    featurizer: featurizers.Featurizer,
+    featurizer: featurizers.GraphFeaturizer,
     path: str,
     overwrite: bool = True,
     num_files: typing.Optional[int] = None,
@@ -23,10 +23,13 @@ def write(
     device: str = '/cpu:0'
 ) -> None:
-    if os.path.isdir(path) and not overwrite:
-        return
-    os.makedirs(path, exist_ok=True)
+    if os.path.isdir(path):
+        if not overwrite:
+            return
+        else:
+            _remove_files(path)
+    else:
+        os.makedirs(path)
     with tf.device(device):
@@ -133,7 +136,7 @@ def load_spec(path: str) -> tensors.GraphTensor.Spec:
 def _write_tfrecord(
     inputs,
     path: str,
-    featurizer: featurizers.Featurizer,
+    featurizer: featurizers.GraphFeaturizer,
 ) -> None:
     def _write_example(tensor):
@@ -149,11 +152,7 @@ def _write_tfrecord(
                 x = tuple(x)
             tensor = featurizer(x)
             if tensor is not None:
-                if isinstance(tensor, tensors.GraphTensor):
-                    _write_example(tensor)
-                else:
-                    for t in tensor:
-                        _write_example(t)
+                _write_example(tensor)
 def _serialize_example(
     feature: dict[str, tf.train.Feature]
@@ -168,8 +167,18 @@ def _parse_example(
 ) -> tf.Tensor:
     out = tf.io.parse_single_example(
         x, features={'feature': tf.io.RaggedFeature(tf.string)})['feature']
-    out = [tf.ensure_shape(tf.io.parse_tensor(x[0], s.dtype), s.shape) for (x, s) in zip(
-        tf.split(out, len(tf.nest.flatten(spec, expand_composites=True))),
-        tf.nest.flatten(spec, expand_composites=True))]
+    out = [
+        tf.ensure_shape(tf.io.parse_tensor(x[0], s.dtype), s.shape)
+        for (x, s) in zip(
+            tf.split(out, len(tf.nest.flatten(spec, expand_composites=True))),
+            tf.nest.flatten(spec, expand_composites=True)
+        )
+    ]
     out = tf.nest.pack_sequence_as(spec, tf.nest.flatten(out), expand_composites=True)
-    return out
+    return out
+def _remove_files(path):
+    for filename in os.listdir(path):
+        if filename.endswith('tfrecord') or filename == 'spec.pb':
+            filepath = os.path.join(path, filename)
+            os.remove(filepath)

{molcraft-0.1.0a15.dist-info → molcraft-0.1.0a17.dist-info}/METADATA RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.4
 Name: molcraft
-Version: 0.1.0a15
+Version: 0.1.0a17
 Summary: Graph Neural Networks for Molecular Machine Learning
 Author-email: Alexander Kensert <alexander.kensert@gmail.com>
 License: MIT License
@@ -35,6 +35,7 @@ Requires-Python: >=3.10
 Description-Content-Type: text/markdown
 License-File: LICENSE
 Requires-Dist: tensorflow>=2.16
+Requires-Dist: tensorflow-text>=2.16
 Requires-Dist: rdkit>=2023.9.5
 Requires-Dist: pandas>=1.0.3
 Requires-Dist: ipython>=8.12.0
@@ -42,9 +43,9 @@ Provides-Extra: gpu
 Requires-Dist: tensorflow[and-cuda]>=2.16; extra == "gpu"
 Dynamic: license-file
-<img src="https://github.com/akensert/molcraft/blob/main/docs/_static/molcraft-logo.png" alt="molcraft-logo">
+<img src="https://github.com/akensert/molcraft/blob/main/docs/_static/molcraft-logo.png" alt="molcraft-logo", width="90%">
-**Deep Learning on Molecules**: A Minimalistic GNN package for Molecular ML.
+**Deep Learning on Molecules**: A Minimalistic GNN package for Molecular ML.
 > [!NOTE]
 > In progress.
@@ -82,11 +83,12 @@ featurizer = featurizers.MolGraphFeaturizer(
         features.BondType(),
         features.IsRotatable(),
     ],
-    super_atom=True,
+    super_node=True,
     self_loops=True,
+    include_hydrogens=False,
 )
-graph = featurizer([('N[C@@H](C)C(=O)O', 2.0), ('N[C@@H](CS)C(=O)O', 1.0)])
+graph = featurizer([('N[C@@H](C)C(=O)O', 2.5), ('N[C@@H](CS)C(=O)O', 1.5)])
 print(graph)
 model = models.GraphModel.from_layers(
@@ -94,13 +96,13 @@ model = models.GraphModel.from_layers(
         layers.Input(graph.spec),
         layers.NodeEmbedding(dim=128),
         layers.EdgeEmbedding(dim=128),
-        layers.GraphTransformer(units=128),
-        layers.GraphTransformer(units=128),
-        layers.GraphTransformer(units=128),
-        layers.GraphTransformer(units=128),
-        layers.Readout(mode='mean'),
-        keras.layers.Dense(units=1024, activation='relu'),
-        keras.layers.Dense(units=1024, activation='relu'),
+        layers.GraphConv(units=128),
+        layers.GraphConv(units=128),
+        layers.GraphConv(units=128),
+        layers.GraphConv(units=128),
+        layers.Readout(),
+        keras.layers.Dense(units=1024, activation='elu'),
+        keras.layers.Dense(units=1024, activation='elu'),
         keras.layers.Dense(1)
     ]
 )

molcraft-0.1.0a17.dist-info/RECORD ADDED Viewed

@@ -0,0 +1,21 @@
+molcraft/__init__.py,sha256=vc-z1sgtzPY7Spwzkemu7I_b9ekEN9egnHrLEKbB9bk,431
+molcraft/callbacks.py,sha256=x5HnkZhqcFRrW6xdApt_jZ4X08A-0fxcnFKfdmRKa0c,3571
+molcraft/chem.py,sha256=e56qBDuqh8rq_4-UMyp6LCQNxxSx8hZ7gzuz-87DHgw,21652
+molcraft/datasets.py,sha256=Nd2lw5USUZE52vvAiNr-q-n03Y3--NlZlK0NzqHgp-E,4145
+molcraft/descriptors.py,sha256=Cl3KnBPsTST7XLgRLktkX5LwY9MV0P_lUlrt8iPV5no,3508
+molcraft/features.py,sha256=s0WeV8eZcDEypPgC1m37f4s9QkvWIlVgn-L43Cdsa14,13525
+molcraft/featurizers.py,sha256=bD3RFY9eg89-O-Nxgy6gote1zS4cyjOgzdSiSJZJdJE,17664
+molcraft/layers.py,sha256=Y-TMb4oHh3R7tHgr7f3Y8sEPDnoSTbtwB6NkZIVnmcA,61734
+molcraft/losses.py,sha256=qnS2yC5g-O3n_zVea9MR6TNiFraW2yqRgePOisoUP4A,1065
+molcraft/models.py,sha256=2Pc1htT9fCukGd8ZxrvE0rzEHsPBm0pluHw4FZXaUE4,21963
+molcraft/ops.py,sha256=bQbdFDt9waxVCzF5-dkTB6vlpj9eoSt8I4Qg7ZGXbsU,6178
+molcraft/records.py,sha256=0j4EWP55sfnkoQIH5trdaAIevPfVbAtPLrygTRmLyFw,5686
+molcraft/tensors.py,sha256=EOUKx496KUZsjA1zA2ABc7tU_TW3Jv7AXDsug_QsLbA,22407
+molcraft/applications/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
+molcraft/applications/chromatography.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
+molcraft/applications/proteomics.py,sha256=Jb7OwHJHc_I7Wk3qnqr40j9P7um2EKtUnB4r-XhrnAc,7180
+molcraft-0.1.0a17.dist-info/licenses/LICENSE,sha256=sbVeqlrtZ0V63uYhZGL5dCxUm8rBAOqe2avyA1zIQNk,1074
+molcraft-0.1.0a17.dist-info/METADATA,sha256=XqNJDwFfY6pWNqQKYLyUOxwyvmfYUkOWTKou-ZQYXL4,3930
+molcraft-0.1.0a17.dist-info/WHEEL,sha256=_zCd3N1l69ArxyTb8rzEoP9TpbYXkqRFSNOD5OuxnTs,91
+molcraft-0.1.0a17.dist-info/top_level.txt,sha256=dENV6MfOceshM6MQCgJlcN1ojZkiCL9B4F7XyUge3QM,9
+molcraft-0.1.0a17.dist-info/RECORD,,

molcraft/apps/peptides.py DELETED Viewed

@@ -1,429 +0,0 @@
-import re
-import keras
-import numpy as np
-import tensorflow as tf
-import tensorflow_text as tf_text
-from rdkit import Chem
-from molcraft import ops
-from molcraft import chem
-from molcraft import features
-from molcraft import featurizers
-from molcraft import tensors
-from molcraft import descriptors
-from molcraft import layers
-from molcraft import models
-@keras.saving.register_keras_serializable(package='molcraft')
-class SequenceSplitter(keras.layers.Layer):
-    _pattern = "|".join([
-        r'(\[[A-Za-z0-9]+\]-[A-Z]\[[A-Za-z0-9]+\])', # N-term mod + mod
-        r'([A-Z]\[[A-Za-z0-9]+\]-\[[A-Za-z0-9]+\])', # C-term mod + mod
-        r'([A-Z]-\[[A-Za-z0-9]+\])', # C-term mod
-        r'(\[[A-Za-z0-9]+\]-[A-Z])', # N-term mod
-        r'([A-Z]\[[A-Za-z0-9]+\])', # Mod
-        r'([A-Z])', # No mod
-    ])
-    def call(self, inputs):
-        inputs = tf_text.regex_split(inputs, self._pattern, self._pattern)
-        inputs = keras.ops.concatenate([
-            tf.strings.join([inputs[:, :-1], '-[X]']),
-            inputs[:, -1:]
-        ], axis=1)
-        return inputs.to_tensor()
-@keras.saving.register_keras_serializable(package='molcraft')
-class Gather(keras.layers.Layer):
-    def __init__(
-        self,
-        padding: list[tuple[int]] | tuple[int] | int = 1,
-        mask_value: int = 0,
-        **kwargs
-    ) -> None:
-        super().__init__(**kwargs)
-        self._splitter = SequenceSplitter()
-        self.padding = padding
-        self.mask_value = mask_value
-        self.supports_masking = True
-        self._tags = list(sorted(residues.keys()))
-        self._mapping = tf.lookup.StaticHashTable(
-            tf.lookup.KeyValueTensorInitializer(
-                keys=self._tags,
-                values=range(len(self._tags)),
-            ),
-            default_value=-1,
-        )
-    def get_config(self):
-        config = super().get_config()
-        config['mask_value'] = self.mask_value
-        config['padding'] = self.padding
-        return config
-    def call(self, inputs) -> tf.Tensor:
-        embedding, sequence = inputs
-        sequence = self._splitter(sequence)
-        sequence = self._mapping.lookup(sequence)
-        readout = ops.gather(embedding, keras.ops.where(sequence == -1, 0, sequence))
-        readout = keras.ops.where(sequence[..., None] == -1, 0.0, readout)
-        return readout
-    def compute_mask(
-        self,
-        inputs: tensors.GraphTensor,
-        mask: bool | None = None
-    ) -> tf.Tensor | None:
-        # if self.mask_value is None:
-        #     return None
-        _, sequence = inputs
-        sequence = self._splitter(sequence)
-        return keras.ops.not_equal(sequence, '')
-@keras.saving.register_keras_serializable(package='molcraft')
-class Embedding(keras.layers.Layer):
-    def __init__(self, **kwargs):
-        super().__init__(**kwargs)
-        tags = list(sorted(residues.keys()))
-        self.mapping = tf.lookup.StaticHashTable(
-            tf.lookup.KeyValueTensorInitializer(
-                keys=tags,
-                values=range(len(tags)),
-            ),
-            default_value=-1,
-        )
-        self.splitting = SequenceSplitter()
-        featurizer = featurizers.MolGraphFeaturizer(super_atom=True)
-        tensor_list = [featurizer(residues[tag]) for tag in tags]
-        graph = tf.stack(tensor_list, axis=0)
-        self._build_on_init(graph)
-        self.embedder = models.GraphModel.from_layers(
-            [
-                layers.Input(graph.spec),
-                layers.NodeEmbedding(128),
-                layers.EdgeEmbedding(128),
-                layers.GraphTransformer(128),
-                layers.Readout()
-            ]
-        )
-        self.embedding = tf.Variable(
-            initial_value=tf.zeros((114, 128)), trainable=True
-        )
-        self.new_state = tf.Variable(True, dtype=tf.bool, trainable=False)
-        self.gather = Gather()
-        self.update_state()
-        # Keep AA as is (most simple?), add positional embedding to distingusih N-, C- and non-terminal
-    def update_state(self, inputs=None):
-        graph = self._graph_tensor
-        graph = tensors.to_dict(graph)
-        embedding = self.embedder(graph)
-        self.embedding.assign(embedding)
-        tf.print("STATE UPDATED")
-        return embedding
-    def call(self, inputs=None, training=None) -> tensors.GraphTensor:
-        if training:
-            embedding = self.update_state()
-            self.new_state.assign(True)
-            return self.gather([embedding, inputs])
-        else:
-            embedding = tf.cond(
-                pred=self.new_state,
-                true_fn=lambda: self.update_state(),
-                false_fn=lambda: self.embedding
-            )
-            self.new_state.assign(False)
-            return self.gather([embedding, inputs])
-    def build(self, input_shape):
-        super().build(input_shape)
-    def _build_on_init(self, x):
-        if isinstance(x, tensors.GraphTensor):
-            tensor = tensors.to_dict(x)
-            self._spec = tf.nest.map_structure(
-                tf.type_spec_from_value, tensor
-            )
-        else:
-            self._spec = x
-        self._graph = tf.nest.map_structure(
-            lambda s: self.add_weight(
-                shape=s.shape,
-                dtype=s.dtype,
-                trainable=False,
-                initializer='zeros'
-            ),
-            self._spec
-        )
-        if isinstance(x, tensors.GraphTensor):
-            tf.nest.map_structure(
-                lambda v, x: v.assign(x),
-                self._graph, tensor
-            )
-        graph = tf.nest.map_structure(
-            keras.ops.convert_to_tensor, self._graph
-        )
-        self._graph_tensor = tensors.from_dict(graph)
-    # def get_config(self) -> dict:
-    #     config = super().get_config()
-    #     spec = keras.saving.serialize_keras_object(self._spec)
-    #     config['spec'] = spec
-    #     #config['layers'] = keras.saving.serialize_keras_object(self.embedding.layers)
-    #     return config
-    # @classmethod
-    # def from_config(cls, config: dict) -> 'SequenceToGraph':
-    #     spec = config.pop('spec')
-    #     spec = keras.saving.deserialize_keras_object(spec)
-    #    # config['layers'] = keras.saving.deserialize_keras_object(config['layers'])
-    #     layer = cls(**config)
-    #     layer._build_on_init(spec)
-    #     return layer
-@keras.saving.register_keras_serializable(package='molcraft')
-class SequenceToGraph(keras.layers.Layer):
-    def __init__(
-        self,
-        atom_features: list[features.Feature] | str | None = 'auto',
-        bond_features: list[features.Feature] | str | None = 'auto',
-        molecule_features: list[descriptors.Descriptor] | str | None = 'auto',
-        super_atom: bool = True,
-        radius: int | float | None = None,
-        self_loops: bool = False,
-        include_hs: bool = False,
-        **kwargs,
-    ):
-        super().__init__(**kwargs)
-        self._splitter = SequenceSplitter()
-        featurizer = featurizers.MolGraphFeaturizer(
-            atom_features=atom_features,
-            bond_features=bond_features,
-            molecule_features=molecule_features,
-            super_atom=super_atom,
-            radius=radius,
-            self_loops=self_loops,
-            include_hs=include_hs,
-            **kwargs,
-        )
-        tensor_list: list[tensors.GraphTensor] = [
-            featurizer(residues[tag]).update({'context': {'tag': tag}}) for tag in residues
-        ]
-        graph = tf.stack(tensor_list, axis=0)
-        self._build_on_init(graph)
-    def call(self, sequence: tf.Tensor) -> tensors.GraphTensor:
-        sequence = self._splitter(sequence)
-        indices = self._tag_to_index.lookup(sequence)
-        indices = tf.sort(tf.unique(tf.reshape(indices, [-1]))[0])[1:]
-        graph = self._graph_tensor[indices]
-        return tensors.to_dict(graph)
-    def _build_on_init(self, x):
-        if isinstance(x, tensors.GraphTensor):
-            tensor = tensors.to_dict(x)
-            self._spec = tf.nest.map_structure(
-                tf.type_spec_from_value, tensor
-            )
-        else:
-            self._spec = x
-        self._graph = tf.nest.map_structure(
-            lambda s: self.add_weight(
-                shape=s.shape,
-                dtype=s.dtype,
-                trainable=False,
-                initializer='zeros'
-            ),
-            self._spec
-        )
-        if isinstance(x, tensors.GraphTensor):
-            tf.nest.map_structure(
-                lambda v, x: v.assign(x),
-                self._graph, tensor
-            )
-        graph = tf.nest.map_structure(
-            keras.ops.convert_to_tensor, self._graph
-        )
-        self._graph_tensor = tensors.from_dict(graph)
-        tags = self._graph_tensor.context['tag']
-        self._tag_to_index = tf.lookup.StaticHashTable(
-            tf.lookup.KeyValueTensorInitializer(
-                keys=tags,
-                values=range(len(tags)),
-            ),
-            default_value=-1,
-        )
-    def get_config(self) -> dict:
-        config = super().get_config()
-        spec = keras.saving.serialize_keras_object(self._spec)
-        config['spec'] = spec
-        return config
-    @classmethod
-    def from_config(cls, config: dict) -> 'SequenceToGraph':
-        spec = config.pop('spec')
-        spec = keras.saving.deserialize_keras_object(spec)
-        layer = cls(**config)
-        layer._build_on_init(spec)
-        return layer
-    # @property
-    # def graph(self) -> tensors.GraphTensor:
-    #     return self._graph_tensor
-@keras.saving.register_keras_serializable(package='molcraft')
-class GraphToSequence(keras.layers.Layer):
-    def __init__(
-        self,
-        padding: list[tuple[int]] | tuple[int] | int = 1,
-        mask_value: int = 0,
-        **kwargs
-    ) -> None:
-        super().__init__(**kwargs)
-        self._splitter = SequenceSplitter()
-        self.padding = padding
-        self.mask_value = mask_value
-        self._readout_layer = layers.Readout(mode='mean')
-        self.supports_masking = True
-    def get_config(self):
-        config = super().get_config()
-        config['mask_value'] = self.mask_value
-        config['padding'] = self.padding
-        return config
-    def call(self, inputs) -> tf.Tensor:
-        graph, sequence = inputs
-        sequence = self._splitter(sequence)
-        tag = graph['context']['tag']
-        data = self._readout_layer(graph)
-        table = tf.lookup.experimental.MutableHashTable(
-            key_dtype=tf.string,
-            value_dtype=tf.int32,
-            default_value=-1
-        )
-        table.insert(tag, tf.range(tf.shape(tag)[0]))
-        sequence = table.lookup(sequence)
-        readout = ops.gather(data, keras.ops.where(sequence == -1, 0, sequence))
-        readout = keras.ops.where(sequence[..., None] == -1, 0.0, readout)
-        return readout
-    def compute_mask(
-        self,
-        inputs: tensors.GraphTensor,
-        mask: bool | None = None
-    ) -> tf.Tensor | None:
-        # if self.mask_value is None:
-        #     return None
-        _, sequence = inputs
-        sequence = self._splitter(sequence)
-        return keras.ops.not_equal(sequence, '')
-residues = {
-    "A": "N[C@@H](C)C(=O)O",
-    "C": "N[C@@H](CS)C(=O)O",
-    "C[Carbamidomethyl]": "N[C@@H](CSCC(=O)N)C(=O)O",
-    "D": "N[C@@H](CC(=O)O)C(=O)O",
-    "E": "N[C@@H](CCC(=O)O)C(=O)O",
-    "F": "N[C@@H](Cc1ccccc1)C(=O)O",
-    "G": "NCC(=O)O",
-    "H": "N[C@@H](CC1=CN=C-N1)C(=O)O",
-    "I": "N[C@@H](C(CC)C)C(=O)O",
-    "K": "N[C@@H](CCCCN)C(=O)O",
-    "K[Acetyl]": "N[C@@H](CCCCNC(=O)C)C(=O)O",
-    "K[Crotonyl]": "N[C@@H](CCCCNC(C=CC)=O)C(=O)O",
-    "K[Dimethyl]": "N[C@@H](CCCCN(C)C)C(=O)O",
-    "K[Formyl]": "N[C@@H](CCCCNC=O)C(=O)O",
-    "K[Malonyl]": "N[C@@H](CCCCNC(=O)CC(O)=O)C(=O)O",
-    "K[Methyl]": "N[C@@H](CCCCNC)C(=O)O",
-    "K[Propionyl]": "N[C@@H](CCCCNC(=O)CC)C(=O)O",
-    "K[Succinyl]": "N[C@@H](CCCCNC(CCC(O)=O)=O)C(=O)O",
-    "K[Trimethyl]": "N[C@@H](CCCC[N+](C)(C)C)C(=O)O",
-    "L": "N[C@@H](CC(C)C)C(=O)O",
-    "M": "N[C@@H](CCSC)C(=O)O",
-    "M[Oxidation]": "N[C@@H](CCS(=O)C)C(=O)O",
-    "N": "N[C@@H](CC(=O)N)C(=O)O",
-    "P": "N1[C@@H](CCC1)C(=O)O",
-    "P[Oxidation]": "N1CC(O)C[C@H]1C(=O)O",
-    "Q": "N[C@@H](CCC(=O)N)C(=O)O",
-    "R": "N[C@@H](CCCNC(=N)N)C(=O)O",
-    "R[Deamidated]": "N[C@@H](CCCNC(N)=O)C(=O)O",
-    "R[Dimethyl]": "N[C@@H](CCCNC(N(C)C)=N)C(=O)O",
-    "R[Methyl]": "N[C@@H](CCCNC(=N)NC)C(=O)O",
-    "S": "N[C@@H](CO)C(=O)O",
-    "T": "N[C@@H](C(O)C)C(=O)O",
-    "V": "N[C@@H](C(C)C)C(=O)O",
-    "W": "N[C@@H](CC(=CN2)C1=C2C=CC=C1)C(=O)O",
-    "Y": "N[C@@H](Cc1ccc(O)cc1)C(=O)O",
-    "Y[Nitro]": "N[C@@H](Cc1ccc(O)c(N(=O)=O)c1)C(=O)O",
-    "Y[Phospho]": "N[C@@H](Cc1ccc(OP(O)(=O)O)cc1)C(=O)O",
-    "[Acetyl]-A": "N(C(C)=O)[C@@H](C)C(=O)O",
-    "[Acetyl]-C": "N(C(C)=O)[C@@H](CS)C(=O)O",
-    "[Acetyl]-D": "N(C(=O)C)[C@H](C(=O)O)CC(=O)O",
-    "[Acetyl]-E": "N(C(=O)C)[C@@H](CCC(O)=O)C(=O)O",
-    "[Acetyl]-F": "N(C(C)=O)[C@@H](Cc1ccccc1)C(=O)O",
-    "[Acetyl]-G": "N(C(=O)C)CC(=O)O",
-    "[Acetyl]-H": "N(C(=O)C)[C@@H](Cc1[nH]cnc1)C(=O)O",
-    "[Acetyl]-I": "N(C(=O)C)[C@@H]([C@H](CC)C)C(=O)O",
-    "[Acetyl]-K": "N(C(C)=O)[C@@H](CCCCN)C(=O)O",
-    "[Acetyl]-L": "N(C(=O)C)[C@@H](CC(C)C)C(=O)O",
-    "[Acetyl]-M": "N(C(=O)C)[C@@H](CCSC)C(=O)O",
-    "[Acetyl]-N": "N(C(C)=O)[C@@H](CC(=O)N)C(=O)O",
-    "[Acetyl]-P": "N1(C(=O)C)CCC[C@H]1C(=O)O",
-    "[Acetyl]-Q": "N(C(=O)C)[C@@H](CCC(=O)N)C(=O)O",
-    "[Acetyl]-R": "N(C(C)=O)[C@@H](CCCN=C(N)N)C(=O)O",
-    "[Acetyl]-S": "N(C(C)=O)[C@@H](CO)C(=O)O",
-    "[Acetyl]-T": "N(C(=O)C)[C@@H]([C@H](O)C)C(=O)O",
-    "[Acetyl]-V": "N(C(=O)C)[C@@H](C(C)C)C(=O)O",
-    "[Acetyl]-W": "N(C(C)=O)[C@@H](Cc1c2ccccc2[nH]c1)C(=O)O",
-    "[Acetyl]-Y": "N(C(C)=O)[C@@H](Cc1ccc(O)cc1)C(=O)O"
-}
-residues_reverse = {}
-def register_peptide_residues(residues_: dict[str, str], canonicalize=True):
-    for residue, smiles in residues_.items():
-        if canonicalize:
-            smiles = Chem.MolToSmiles(Chem.MolFromSmiles(smiles))
-        residues[residue] = smiles
-        residues_reverse[residues[residue]] = residue
-register_peptide_residues(residues, canonicalize=False)
-def _extract_residue_type(residue_tag: str) -> str:
-    pattern = r"(?<!\[)[A-Z](?![^\[]*\])"
-    return [match.group(0) for match in re.finditer(pattern, residue_tag)][0]
-special_residues = {}
-for key, value in residues.items():
-    special_residues[key + '-[X]'] = value.rstrip('O')
-register_peptide_residues(special_residues, canonicalize=False)

molcraft 0.1.0a15__py3-none-any.whl → 0.1.0a17__py3-none-any.whl

Potentially problematic release.

molcraft 0.1.0a15__py3-none-any.whl → 0.1.0a17__py3-none-any.whl