molcraft 0.1.0a5__py3-none-any.whl → 0.1.0a7__py3-none-any.whl

This diff compares the contents of two publicly released versions of this package, as they appear in their public registry, and is provided for informational purposes only.

Potentially problematic release: this version of molcraft might be problematic.

molcraft/layers.py CHANGED
@@ -125,23 +125,45 @@ class GraphLayer(keras.layers.Layer):
125
125
  return tensors.to_dict(outputs)
126
126
  return outputs
127
127
 
128
- def __call__(self, inputs, **kwargs):
128
+ def __call__(
129
+ self,
130
+ graph: dict[str, dict[str, tf.Tensor]] | tensors.GraphTensor,
131
+ **kwargs
132
+ ) -> tf.Tensor | dict[str, dict[str, tf.Tensor]] | tensors.GraphTensor:
129
133
  if not self.built:
130
- spec = _spec_from_inputs(inputs)
134
+ spec = _spec_from_inputs(graph)
131
135
  self.build(spec)
132
- convert = isinstance(inputs, tensors.GraphTensor)
133
- if convert:
134
- inputs = tensors.to_dict(inputs)
136
+
137
+ is_graph_tensor = isinstance(graph, tensors.GraphTensor)
138
+ if is_graph_tensor:
139
+ graph = tensors.to_dict(graph)
140
+ else:
141
+ graph = {field: dict(data) for (field, data) in graph.items()}
142
+
135
143
  if isinstance(self, functional.Functional):
136
- inputs, left_out_inputs = _match_functional_input(self.input, inputs)
137
- outputs = super().__call__(inputs, **kwargs)
144
+ # As a functional model is strict about what input can
145
+ # be passed to it, we need to temporarily pop some of the
146
+ # inputs and add them back afterwards.
147
+ label = graph['context'].pop('label', None)
148
+ weight = graph['context'].pop('weight', None)
149
+ tf.nest.assert_same_structure(self.input, graph)
150
+
151
+ outputs = super().__call__(graph, **kwargs)
152
+
138
153
  if not tensors.is_graph(outputs):
139
154
  return outputs
155
+
156
+ graph = outputs
140
157
  if isinstance(self, functional.Functional):
141
- outputs = _add_left_out_inputs(outputs, left_out_inputs)
142
- if convert:
143
- outputs = tensors.from_dict(outputs)
144
- return outputs
158
+ if label is not None:
159
+ graph['context']['label'] = label
160
+ if weight is not None:
161
+ graph['context']['weight'] = weight
162
+
163
+ if is_graph_tensor:
164
+ return tensors.from_dict(graph)
165
+
166
+ return graph
145
167
 
146
168
  def get_build_config(self) -> dict:
147
169
  if self._custom_build_config:
@@ -256,10 +278,10 @@ class GraphConv(GraphLayer):
256
278
  Default to `None`.
257
279
  use_bias (bool):
258
280
  Whether bias should be used in dense layers. Default to `True`.
259
- normalization (bool, str):
281
+ normalize (bool, str):
260
282
  Whether `LayerNormalization` should be applied to the final node feature output.
261
283
  To use `BatchNormalization`, specify `batch_norm`. Default to `False`.
262
- skip_connection (bool, str):
284
+ skip_connect (bool, str):
263
285
  Whether node feature input should be added to the node feature output.
264
286
  If node feature input dim is not equal to `units` (node feature output dim),
265
287
  a projection layer will automatically project the residual before adding it
@@ -294,14 +316,14 @@ class GraphConv(GraphLayer):
294
316
  units: int = None,
295
317
  activation: str | keras.layers.Activation | None = None,
296
318
  use_bias: bool = True,
297
- normalization: bool | str = False,
298
- skip_connection: bool | str = True,
319
+ normalize: bool | str = False,
320
+ skip_connect: bool | str = True,
299
321
  **kwargs
300
322
  ) -> None:
301
323
  super().__init__(use_bias=use_bias, **kwargs)
302
324
  self._units = units
303
- self._normalization = normalization
304
- self._skip_connection = skip_connection
325
+ self._normalize = normalize
326
+ self._skip_connect = skip_connect
305
327
  self._activation = keras.activations.get(activation)
306
328
 
307
329
  def __init_subclass__(cls, **kwargs):
@@ -319,36 +341,6 @@ class GraphConv(GraphLayer):
319
341
  def units(self):
320
342
  return self._units
321
343
 
322
- def propagate(self, tensor: tensors.GraphTensor) -> tensors.GraphTensor:
323
- """Forward pass.
324
-
325
- Invokes `message(graph)`, `aggregate(graph)` and `update(graph)` in sequence.
326
-
327
- Arguments:
328
- tensor:
329
- A `GraphTensor` instance.
330
- """
331
- if self._skip_connection:
332
- input_node_feature = tensor.node['feature']
333
- if self._project_input_node_feature:
334
- input_node_feature = self._residual_projection(input_node_feature)
335
-
336
- tensor = self.message(tensor)
337
- tensor = self.aggregate(tensor)
338
- tensor = self.update(tensor)
339
-
340
- updated_node_feature = tensor.node['feature']
341
-
342
- if self._skip_connection:
343
- if self._use_weighted_skip_connection:
344
- input_node_feature *= self._skip_connection_weight
345
- updated_node_feature += input_node_feature
346
-
347
- if self._normalization:
348
- updated_node_feature = self._output_norm(updated_node_feature)
349
-
350
- return tensor.update({'node': {'feature': updated_node_feature}})
351
-
352
344
  def build(self, spec: tensors.GraphTensor.Spec) -> None:
353
345
  if not self.units:
354
346
  raise ValueError(
@@ -356,11 +348,11 @@ class GraphConv(GraphLayer):
356
348
  )
357
349
  node_feature_dim = spec.node['feature'].shape[-1]
358
350
  self._project_input_node_feature = (
359
- self._skip_connection and (node_feature_dim != self.units)
351
+ self._skip_connect and (node_feature_dim != self.units)
360
352
  )
361
353
  if self._project_input_node_feature:
362
354
  warn(
363
- '`skip_connection` is set to `True`, but found incompatible dim '
355
+ '`skip_connect` is set to `True`, but found incompatible dim '
364
356
  'between input (node feature dim) and output (`self.units`). '
365
357
  'Automatically applying a projection layer to residual to '
366
358
  'match input and output. '
@@ -369,8 +361,8 @@ class GraphConv(GraphLayer):
369
361
  self.units, name='residual_projection'
370
362
  )
371
363
 
372
- skip_connection = str(self._skip_connection).lower()
373
- self._use_weighted_skip_connection = skip_connection.startswith('weight')
364
+ skip_connect = str(self._skip_connect).lower()
365
+ self._use_weighted_skip_connection = skip_connect.startswith('weight')
374
366
  if self._use_weighted_skip_connection:
375
367
  self._skip_connection_weight = self.add_weight(
376
368
  name='skip_connection_weight',
@@ -379,8 +371,8 @@ class GraphConv(GraphLayer):
379
371
  trainable=True,
380
372
  )
381
373
 
382
- if self._normalization:
383
- if str(self._normalization).lower().startswith('batch'):
374
+ if self._normalize:
375
+ if str(self._normalize).lower().startswith('batch'):
384
376
  self._output_norm = keras.layers.BatchNormalization(
385
377
  name='output_batch_norm'
386
378
  )
@@ -389,7 +381,7 @@ class GraphConv(GraphLayer):
389
381
  name='output_layer_norm'
390
382
  )
391
383
 
392
- self._has_edge_feature = 'edge' in spec.edge
384
+ self._has_edge_feature = 'feature' in spec.edge
393
385
 
394
386
  has_overridden_message = self.__class__.message != GraphConv.message
395
387
  if not has_overridden_message:
@@ -400,6 +392,50 @@ class GraphConv(GraphLayer):
400
392
  self._output_dense = self.get_dense(self.units)
401
393
  self._output_activation = self._activation
402
394
 
395
+ def propagate(self, tensor: tensors.GraphTensor) -> tensors.GraphTensor:
396
+ """Forward pass.
397
+
398
+ Invokes `message(graph)`, `aggregate(graph)` and `update(graph)` in sequence.
399
+
400
+ Arguments:
401
+ tensor:
402
+ A `GraphTensor` instance.
403
+ """
404
+ if self._skip_connect:
405
+ input_node_feature = tensor.node['feature']
406
+ if self._project_input_node_feature:
407
+ input_node_feature = self._residual_projection(input_node_feature)
408
+
409
+ message = self.message(tensor)
410
+ if not isinstance(message, tensors.GraphTensor):
411
+ message = tensor.update({'edge': {'message': message}})
412
+ elif not 'message' in message.edge:
413
+ raise ValueError('Could not find `message` in `edge` output.')
414
+
415
+ aggregate = self.aggregate(message)
416
+ if not isinstance(aggregate, tensors.GraphTensor):
417
+ aggregate = tensor.update({'node': {'aggregate': aggregate}})
418
+ elif not 'aggregate' in aggregate.node:
419
+ raise ValueError('Could not find `aggregate` in `node` output.')
420
+
421
+ update = self.update(aggregate)
422
+ if not isinstance(update, tensors.GraphTensor):
423
+ update = tensor.update({'node': {'feature': update}})
424
+ elif not 'feature' in update.node:
425
+ raise ValueError('Could not find `feature` in `node` output.')
426
+
427
+ updated_node_feature = update.node['feature']
428
+
429
+ if self._skip_connect:
430
+ if self._use_weighted_skip_connection:
431
+ input_node_feature *= self._skip_connection_weight
432
+ updated_node_feature += input_node_feature
433
+
434
+ if self._normalize:
435
+ updated_node_feature = self._output_norm(updated_node_feature)
436
+
437
+ return update.update({'node': {'feature': updated_node_feature}})
438
+
403
439
  def message(self, tensor: tensors.GraphTensor) -> tensors.GraphTensor:
404
440
  """Compute messages.
405
441
 
@@ -441,8 +477,7 @@ class GraphConv(GraphLayer):
441
477
  return tensor.update(
442
478
  {
443
479
  'node': {
444
- 'feature': aggregate,
445
- 'previous_feature': tensor.node['feature']
480
+ 'aggregate': aggregate,
446
481
  },
447
482
  'edge': {
448
483
  'message': None
@@ -460,23 +495,20 @@ class GraphConv(GraphLayer):
460
495
  A `GraphTensor` instance containing aggregated messages
461
496
  (updated node features).
462
497
  """
463
- if not 'previous_feature' in tensor.node:
464
- feature = tensor.node['feature']
465
- else:
466
- feature = keras.ops.concatenate(
467
- [
468
- tensor.node['feature'],
469
- tensor.node['previous_feature']
470
- ],
471
- axis=-1
472
- )
498
+ feature = keras.ops.concatenate(
499
+ [
500
+ tensor.node['aggregate'],
501
+ tensor.node['feature']
502
+ ],
503
+ axis=-1
504
+ )
473
505
  update = self._output_dense(feature)
474
506
  update = self._output_activation(update)
475
507
  return tensor.update(
476
508
  {
477
509
  'node': {
478
510
  'feature': update,
479
- 'previous_feature': None,
511
+ 'aggregate': None,
480
512
  }
481
513
  }
482
514
  )
@@ -486,8 +518,8 @@ class GraphConv(GraphLayer):
486
518
  config.update({
487
519
  'units': self.units,
488
520
  'activation': keras.activations.serialize(self._activation),
489
- 'normalization': self._normalization,
490
- 'skip_connection': self._skip_connection,
521
+ 'normalize': self._normalize,
522
+ 'skip_connect': self._skip_connect,
491
523
  })
492
524
  return config
493
525
 
@@ -530,14 +562,14 @@ class GIConv(GraphConv):
530
562
  units: int,
531
563
  activation: keras.layers.Activation | str | None = 'relu',
532
564
  use_bias: bool = True,
533
- normalization: bool = False,
565
+ normalize: bool = False,
534
566
  update_edge_feature: bool = True,
535
567
  **kwargs,
536
568
  ):
537
569
  super().__init__(
538
570
  units=units,
539
571
  activation=activation,
540
- normalization=normalization,
572
+ normalize=normalize,
541
573
  use_bias=use_bias,
542
574
  **kwargs
543
575
  )
@@ -599,7 +631,7 @@ class GIConv(GraphConv):
599
631
  return tensor.update(
600
632
  {
601
633
  'node': {
602
- 'feature': node_feature,
634
+ 'aggregate': node_feature,
603
635
  },
604
636
  'edge': {
605
637
  'message': None,
@@ -608,7 +640,7 @@ class GIConv(GraphConv):
608
640
  )
609
641
 
610
642
  def update(self, tensor: tensors.GraphTensor) -> tensors.GraphTensor:
611
- node_feature = tensor.node['feature']
643
+ node_feature = tensor.node['aggregate']
612
644
  node_feature = self._feedforward_intermediate_dense(node_feature)
613
645
  node_feature = self._feedforward_activation(node_feature)
614
646
  node_feature = self._feedforward_output_dense(node_feature)
@@ -616,6 +648,7 @@ class GIConv(GraphConv):
616
648
  {
617
649
  'node': {
618
650
  'feature': node_feature,
651
+ 'aggregate': None,
619
652
  }
620
653
  }
621
654
  )
@@ -667,17 +700,16 @@ class GAConv(GraphConv):
667
700
  heads: int = 8,
668
701
  activation: keras.layers.Activation | str | None = "relu",
669
702
  use_bias: bool = True,
670
- normalization: bool = False,
703
+ normalize: bool = False,
671
704
  update_edge_feature: bool = True,
672
705
  attention_activation: keras.layers.Activation | str | None = "leaky_relu",
673
706
  **kwargs,
674
707
  ) -> None:
675
- kwargs['skip_connection'] = False
676
708
  super().__init__(
677
709
  units=units,
678
710
  activation=activation,
679
711
  use_bias=use_bias,
680
- normalization=normalization,
712
+ normalize=normalize,
681
713
  **kwargs
682
714
  )
683
715
  self._heads = heads
@@ -753,11 +785,11 @@ class GAConv(GraphConv):
753
785
  )
754
786
  node_feature = self._node_dense(tensor.node['feature'])
755
787
  message = ops.gather(node_feature, tensor.edge['source'])
788
+ message = ops.edge_weight(message, attention_score)
756
789
  return tensor.update(
757
790
  {
758
791
  'edge': {
759
792
  'message': message,
760
- 'weight': attention_score,
761
793
  'feature': edge_feature,
762
794
  }
763
795
  }
@@ -770,24 +802,24 @@ class GAConv(GraphConv):
770
802
  return tensor.update(
771
803
  {
772
804
  'node': {
773
- 'feature': node_feature
805
+ 'aggregate': node_feature
774
806
  },
775
807
  'edge': {
776
808
  'message': None,
777
- 'weight': None,
778
809
  }
779
810
  }
780
811
  )
781
812
 
782
813
  def update(self, tensor: tensors.GraphTensor) -> tensors.GraphTensor:
783
- node_feature = tensor.node['feature']
814
+ node_feature = tensor.node['aggregate']
784
815
  node_feature = self._feedforward_intermediate_dense(node_feature)
785
816
  node_feature = self._feedforward_activation(node_feature)
786
817
  node_feature = self._feedforward_output_dense(node_feature)
787
818
  return tensor.update(
788
819
  {
789
820
  'node': {
790
- 'feature': node_feature
821
+ 'feature': node_feature,
822
+ 'aggregate': None,
791
823
  }
792
824
  }
793
825
  )
@@ -842,7 +874,7 @@ class GTConv(GraphConv):
842
874
  heads: int = 8,
843
875
  activation: keras.layers.Activation | str | None = "relu",
844
876
  use_bias: bool = True,
845
- normalization: bool = False,
877
+ normalize: bool = False,
846
878
  attention_dropout: float = 0.0,
847
879
  **kwargs,
848
880
  ) -> None:
@@ -850,7 +882,7 @@ class GTConv(GraphConv):
850
882
  units=units,
851
883
  activation=activation,
852
884
  use_bias=use_bias,
853
- normalization=normalization,
885
+ normalize=normalize,
854
886
  **kwargs
855
887
  )
856
888
  self._heads = heads
@@ -901,7 +933,6 @@ class GTConv(GraphConv):
901
933
  }
902
934
  }
903
935
  )
904
-
905
936
  node_feature = tensor.node['feature']
906
937
 
907
938
  query = self._query_dense(node_feature)
@@ -918,12 +949,12 @@ class GTConv(GraphConv):
918
949
  attention_score += keras.ops.expand_dims(tensor.edge['bias'], axis=1)
919
950
  attention = ops.edge_softmax(attention_score, tensor.edge['target'])
920
951
  attention = self._softmax_dropout(attention)
952
+ message = ops.edge_weight(value, attention)
921
953
 
922
954
  return tensor.update(
923
955
  {
924
956
  'edge': {
925
- 'message': value,
926
- 'weight': attention,
957
+ 'message': message
927
958
  },
928
959
  }
929
960
  )
@@ -935,18 +966,16 @@ class GTConv(GraphConv):
935
966
  return tensor.update(
936
967
  {
937
968
  'node': {
938
- 'feature': node_feature,
939
- 'residual': tensor.node['feature']
969
+ 'aggregate': node_feature,
940
970
  },
941
971
  'edge': {
942
972
  'message': None,
943
- 'weight': None,
944
973
  }
945
974
  }
946
975
  )
947
976
 
948
977
  def update(self, tensor: tensors.GraphTensor) -> tensors.GraphTensor:
949
- node_feature = tensor.node['feature']
978
+ node_feature = tensor.node['aggregate']
950
979
  node_feature = self._feedforward_intermediate_dense(node_feature)
951
980
  node_feature = self._feedforward_activation(node_feature)
952
981
  node_feature = self._feedforward_output_dense(node_feature)
@@ -954,6 +983,7 @@ class GTConv(GraphConv):
954
983
  {
955
984
  'node': {
956
985
  'feature': node_feature,
986
+ 'aggregate': None,
957
987
  },
958
988
  }
959
989
  )
@@ -978,14 +1008,14 @@ class MPConv(GraphConv):
978
1008
  units: int = 128,
979
1009
  activation: keras.layers.Activation | str | None = None,
980
1010
  use_bias: bool = True,
981
- normalization: bool = False,
1011
+ normalize: bool = False,
982
1012
  **kwargs
983
1013
  ) -> None:
984
1014
  super().__init__(
985
1015
  units=units,
986
1016
  activation=activation,
987
1017
  use_bias=use_bias,
988
- normalization=normalization,
1018
+ normalize=normalize,
989
1019
  **kwargs
990
1020
  )
991
1021
 
@@ -1032,28 +1062,28 @@ class MPConv(GraphConv):
1032
1062
 
1033
1063
  def aggregate(self, tensor: tensors.GraphTensor) -> tensors.GraphTensor:
1034
1064
  aggregate = tensor.aggregate('message', mode='mean')
1035
- previous = tensor.node['feature']
1065
+ feature = tensor.node['feature']
1036
1066
  if self.project_input_node_feature:
1037
- previous = self._previous_node_dense(previous)
1067
+ feature = self._previous_node_dense(feature)
1038
1068
  return tensor.update(
1039
1069
  {
1040
1070
  'node': {
1041
- 'feature': aggregate,
1042
- 'previous_feature': previous,
1071
+ 'aggregate': aggregate,
1072
+ 'feature': feature,
1043
1073
  }
1044
1074
  }
1045
1075
  )
1046
1076
 
1047
1077
  def update(self, tensor: tensors.GraphTensor) -> tensors.GraphTensor:
1048
1078
  updated_node_feature, _ = self.update_fn(
1049
- inputs=tensor.node['feature'],
1050
- states=tensor.node['previous_feature']
1079
+ inputs=tensor.node['aggregate'],
1080
+ states=tensor.node['feature']
1051
1081
  )
1052
1082
  return tensor.update(
1053
1083
  {
1054
1084
  'node': {
1055
1085
  'feature': updated_node_feature,
1056
- 'previous_feature': None,
1086
+ 'aggregate': None,
1057
1087
  }
1058
1088
  }
1059
1089
  )
@@ -1124,12 +1154,13 @@ class GTConv3D(GTConv):
1124
1154
  attention *= keras.ops.expand_dims(distance, axis=-1)
1125
1155
  attention = keras.ops.expand_dims(attention, axis=2)
1126
1156
  value = keras.ops.expand_dims(value, axis=1)
1157
+
1158
+ message = ops.edge_weight(value, attention)
1127
1159
 
1128
1160
  return tensor.update(
1129
1161
  {
1130
1162
  'edge': {
1131
- 'message': value,
1132
- 'weight': attention,
1163
+ 'message': message,
1133
1164
  },
1134
1165
  }
1135
1166
  )
@@ -1144,12 +1175,10 @@ class GTConv3D(GTConv):
1144
1175
  return tensor.update(
1145
1176
  {
1146
1177
  'node': {
1147
- 'feature': node_feature,
1148
- 'residual': tensor.node['feature']
1178
+ 'aggregate': node_feature,
1149
1179
  },
1150
1180
  'edge': {
1151
1181
  'message': None,
1152
- 'weight': None,
1153
1182
  }
1154
1183
  }
1155
1184
  )
@@ -1202,16 +1231,16 @@ class EGConv3D(GraphConv):
1202
1231
  def __init__(
1203
1232
  self,
1204
1233
  units: int = 128,
1205
- activation: keras.layers.Activation | str | None = None,
1234
+ activation: keras.layers.Activation | str | None = 'silu',
1206
1235
  use_bias: bool = True,
1207
- normalization: bool = False,
1236
+ normalize: bool = False,
1208
1237
  **kwargs
1209
1238
  ) -> None:
1210
1239
  super().__init__(
1211
1240
  units=units,
1212
1241
  activation=activation,
1213
1242
  use_bias=use_bias,
1214
- normalization=normalization,
1243
+ normalize=normalize,
1215
1244
  **kwargs
1216
1245
  )
1217
1246
 
@@ -1222,31 +1251,52 @@ class EGConv3D(GraphConv):
1222
1251
  'which is required for Conv3D layers.'
1223
1252
  )
1224
1253
  self._has_edge_feature = 'feature' in spec.edge
1225
- self.message_fn = self.get_dense(self.units, activation=self._activation)
1226
- self.dense_position = self.get_dense(1)
1254
+ self._message_feedforward_intermediate = self.get_dense(
1255
+ self.units, activation=self._activation
1256
+ )
1257
+ self._message_feedforward_final = self.get_dense(
1258
+ self.units, activation=self._activation
1259
+ )
1260
+
1261
+ self._coord_feedforward_intermediate = self.get_dense(
1262
+ self.units, activation=self._activation
1263
+ )
1264
+ self._coord_feedforward_final = self.get_dense(
1265
+ 1, use_bias=False, activation='tanh'
1266
+ )
1227
1267
 
1228
1268
  has_overridden_update = self.__class__.update != EGConv3D.update
1229
1269
  if not has_overridden_update:
1230
- self.update_fn = self.get_dense(self.units, activation=self._activation)
1231
- self.output_dense = self.get_dense(self.units)
1270
+ self._feedforward_intermediate = self.get_dense(
1271
+ self.units, activation=self._activation
1272
+ )
1273
+ self._feedforward_output = self.get_dense(self.units)
1232
1274
 
1233
1275
  def message(self, tensor: tensors.GraphTensor) -> tensors.GraphTensor:
1234
1276
  relative_node_coordinate = keras.ops.subtract(
1235
1277
  tensor.gather('coordinate', 'target'),
1236
1278
  tensor.gather('coordinate', 'source')
1237
1279
  )
1238
- euclidean_distance = keras.ops.sum(
1239
- keras.ops.square(
1240
- relative_node_coordinate
1241
- ),
1280
+ squared_distance = keras.ops.sum(
1281
+ keras.ops.square(relative_node_coordinate),
1242
1282
  axis=-1,
1243
1283
  keepdims=True
1244
1284
  )
1285
+
1286
+ # For numerical stability (i.e., to prevent NaN losses), this implementation of `EGConv3D`
1287
+ # either needs to apply a `tanh` activation to the output of `self._coord_feedforward_final`,
1288
+ # or normalize `relative_node_coordinate` as follows:
1289
+ #
1290
+ # norm = keras.ops.sqrt(squared_distance) + keras.backend.epsilon()
1291
+ # relative_node_coordinate /= norm
1292
+ #
1293
+ # For now, this implementation does the former.
1294
+
1245
1295
  feature = keras.ops.concatenate(
1246
1296
  [
1247
1297
  tensor.gather('feature', 'target'),
1248
1298
  tensor.gather('feature', 'source'),
1249
- euclidean_distance,
1299
+ squared_distance,
1250
1300
  ],
1251
1301
  axis=-1
1252
1302
  )
@@ -1258,10 +1308,15 @@ class EGConv3D(GraphConv):
1258
1308
  ],
1259
1309
  axis=-1
1260
1310
  )
1261
- message = self.message_fn(feature)
1311
+ message = self._message_feedforward_final(
1312
+ self._message_feedforward_intermediate(feature)
1313
+ )
1314
+
1262
1315
  relative_node_coordinate = keras.ops.multiply(
1263
- relative_node_coordinate,
1264
- self.dense_position(message)
1316
+ relative_node_coordinate,
1317
+ self._coord_feedforward_final(
1318
+ self._coord_feedforward_intermediate(message)
1319
+ )
1265
1320
  )
1266
1321
  return tensor.update(
1267
1322
  {
@@ -1273,27 +1328,26 @@ class EGConv3D(GraphConv):
1273
1328
  )
1274
1329
 
1275
1330
  def aggregate(self, tensor: tensors.GraphTensor) -> tensors.GraphTensor:
1276
- coefficient = keras.ops.bincount(
1277
- tensor.edge['source'],
1278
- minlength=tensor.num_nodes
1279
- )
1280
- coefficient = keras.ops.cast(
1281
- coefficient, tensor.node['coordinate'].dtype
1282
- )
1283
- coefficient = keras.ops.expand_dims(
1284
- keras.ops.divide_no_nan(1, coefficient), axis=1
1285
- )
1331
+ coordinate = tensor.node['coordinate']
1332
+ coordinate += tensor.aggregate('relative_node_coordinate', mode='mean')
1333
+
1334
+ # Original implementation seems to apply sum aggregation, which does not
1335
+ # seem to work well for this implementation of `EGConv3D`, as it causes
1336
+ # large output values and large initial losses. The magnitude of the
1337
+ # aggregated values of a sum aggregation depends on the number of
1338
+ # neighbors, which may be many and may differ from node to node (or
1339
+ # graph to graph). Therefore, a mean aggregation is performed
1340
+ # instead:
1341
+ aggregate = tensor.aggregate('message', mode='mean')
1286
1342
 
1287
- updated_coordinate = tensor.aggregate('relative_node_coordinate') * coefficient
1288
- updated_coordinate += tensor.node['coordinate']
1343
+ # Simply added to silence warning ('no gradients for variables ...')
1344
+ aggregate += (0.0 * keras.ops.sum(coordinate))
1289
1345
 
1290
- aggregate = tensor.aggregate('message', mode='mean')
1291
1346
  return tensor.update(
1292
1347
  {
1293
1348
  'node': {
1294
- 'feature': aggregate,
1295
- 'coordinate': updated_coordinate,
1296
- 'previous_feature': tensor.node['feature'],
1349
+ 'aggregate': aggregate,
1350
+ 'coordinate': coordinate,
1297
1351
  },
1298
1352
  'edge': {
1299
1353
  'message': None,
@@ -1303,21 +1357,21 @@ class EGConv3D(GraphConv):
1303
1357
  )
1304
1358
 
1305
1359
  def update(self, tensor: tensors.GraphTensor) -> tensors.GraphTensor:
1306
- updated_node_feature = self.update_fn(
1307
- keras.ops.concatenate(
1308
- [
1309
- tensor.node['feature'],
1310
- tensor.node['previous_feature']
1311
- ],
1312
- axis=-1
1313
- )
1360
+ feature = keras.ops.concatenate(
1361
+ [
1362
+ tensor.node['aggregate'],
1363
+ tensor.node['feature']
1364
+ ],
1365
+ axis=-1
1366
+ )
1367
+ updated_node_feature = self._feedforward_output(
1368
+ self._feedforward_intermediate(feature)
1314
1369
  )
1315
- updated_node_feature = self.output_dense(updated_node_feature)
1316
1370
  return tensor.update(
1317
1371
  {
1318
1372
  'node': {
1319
1373
  'feature': updated_node_feature,
1320
- 'previous_feature': None,
1374
+ 'aggregate': None,
1321
1375
  },
1322
1376
  }
1323
1377
  )
@@ -1478,6 +1532,32 @@ class GraphNetwork(GraphLayer):
1478
1532
  return super().from_config(config)
1479
1533
 
1480
1534
 
1535
+ @keras.saving.register_keras_serializable(package='molcraft')
1536
+ class Extraction(GraphLayer):
1537
+
1538
+ def __init__(
1539
+ self,
1540
+ field: str,
1541
+ inner_field: str | None = None,
1542
+ **kwargs
1543
+ ) -> None:
1544
+ super().__init__(**kwargs)
1545
+ self.field = field
1546
+ self.inner_field = inner_field
1547
+
1548
+ def propagate(self, tensor: tensors.GraphTensor) -> tensors.GraphTensor:
1549
+ data = dict(getattr(tensor, self.field))
1550
+ if not self.inner_field:
1551
+ return data
1552
+ return data[self.inner_field]
1553
+
1554
+ def get_config(self):
1555
+ config = super().get_config()
1556
+ config['field'] = self.field
1557
+ config['inner_field'] = self.inner_field
1558
+ return config
1559
+
1560
+
1481
1561
  @keras.saving.register_keras_serializable(package='molcraft')
1482
1562
  class NodeEmbedding(GraphLayer):
1483
1563
 
@@ -1489,15 +1569,15 @@ class NodeEmbedding(GraphLayer):
1489
1569
  def __init__(
1490
1570
  self,
1491
1571
  dim: int = None,
1492
- normalization: bool = False,
1493
- embed_context: bool = True,
1572
+ normalize: bool = False,
1573
+ embed_context: bool = False,
1494
1574
  allow_reconstruction: bool = False,
1495
- allow_masking: bool = True,
1575
+ allow_masking: bool = False,
1496
1576
  **kwargs
1497
1577
  ) -> None:
1498
1578
  super().__init__(**kwargs)
1499
1579
  self.dim = dim
1500
- self._normalization = normalization
1580
+ self._normalize = normalize
1501
1581
  self._embed_context = embed_context
1502
1582
  self._masking_rate = None
1503
1583
  self._allow_masking = allow_masking
@@ -1517,13 +1597,11 @@ class NodeEmbedding(GraphLayer):
1517
1597
  self._super_feature = self.get_weight(shape=[self.dim], name='super_node_feature')
1518
1598
  if self._allow_masking:
1519
1599
  self._mask_feature = self.get_weight(shape=[self.dim], name='mask_node_feature')
1520
-
1521
1600
  if self._embed_context:
1522
- context_feature_dim = spec.context['feature'].shape[-1]
1523
1601
  self._context_dense = self.get_dense(self.dim)
1524
1602
 
1525
- if self._normalization:
1526
- if str(self._normalization).lower().startswith('batch'):
1603
+ if self._normalize:
1604
+ if str(self._normalize).lower().startswith('batch'):
1527
1605
  self._norm = keras.layers.BatchNormalization(
1528
1606
  name='output_batch_norm'
1529
1607
  )
@@ -1545,48 +1623,25 @@ class NodeEmbedding(GraphLayer):
1545
1623
  feature = ops.scatter_update(feature, tensor.node['super'], context_feature)
1546
1624
  tensor = tensor.update({'context': {'feature': None}})
1547
1625
 
1548
- if (
1549
- self._allow_masking and
1550
- self._masking_rate is not None and
1551
- self._masking_rate > 0
1552
- ):
1553
- random = keras.random.uniform(shape=[tensor.num_nodes])
1554
- mask = random <= self._masking_rate
1555
- if self._has_super:
1556
- mask = keras.ops.logical_and(
1557
- mask, keras.ops.logical_not(tensor.node['super'])
1558
- )
1559
- mask = keras.ops.expand_dims(mask, -1)
1626
+ apply_mask = (self._allow_masking and 'mask' in tensor.node)
1627
+ if apply_mask:
1628
+ mask = keras.ops.expand_dims(tensor.node['mask'], -1)
1560
1629
  feature = keras.ops.where(mask, self._mask_feature, feature)
1561
1630
  elif self._allow_masking:
1562
- # Slience warning of 'no gradients for variables'
1563
1631
  feature = feature + (self._mask_feature * 0.0)
1564
1632
 
1565
- if self._normalization:
1633
+ if self._normalize:
1566
1634
  feature = self._norm(feature)
1567
1635
 
1568
1636
  if not self._allow_reconstruction:
1569
1637
  return tensor.update({'node': {'feature': feature}})
1570
1638
  return tensor.update({'node': {'feature': feature, 'target_feature': feature}})
1571
-
1572
- @property
1573
- def masking_rate(self):
1574
- return self._masking_rate
1575
-
1576
- @masking_rate.setter
1577
- def masking_rate(self, rate: float):
1578
- if not self._allow_masking and rate is not None:
1579
- raise ValueError(
1580
- f'Cannot set `masking_rate` for layer {self} '
1581
- 'as `allow_masking` was set to `False`.'
1582
- )
1583
- self._masking_rate = float(rate)
1584
1639
 
1585
1640
  def get_config(self) -> dict:
1586
1641
  config = super().get_config()
1587
1642
  config.update({
1588
1643
  'dim': self.dim,
1589
- 'normalization': self._normalization,
1644
+ 'normalize': self._normalize,
1590
1645
  'embed_context': self._embed_context,
1591
1646
  'allow_masking': self._allow_masking,
1592
1647
  'allow_reconstruction': self._allow_reconstruction,
@@ -1605,13 +1660,13 @@ class EdgeEmbedding(GraphLayer):
1605
1660
  def __init__(
1606
1661
  self,
1607
1662
  dim: int = None,
1608
- normalization: bool = False,
1663
+ normalize: bool = False,
1609
1664
  allow_masking: bool = True,
1610
1665
  **kwargs
1611
1666
  ) -> None:
1612
1667
  super().__init__(**kwargs)
1613
1668
  self.dim = dim
1614
- self._normalization = normalization
1669
+ self._normalize = normalize
1615
1670
  self._masking_rate = None
1616
1671
  self._allow_masking = allow_masking
1617
1672
 
@@ -1622,13 +1677,16 @@ class EdgeEmbedding(GraphLayer):
1622
1677
  self._edge_dense = self.get_dense(self.dim)
1623
1678
 
1624
1679
  self._has_super = 'super' in spec.edge
1680
+ self._has_self_loop = 'self_loop' in spec.edge
1625
1681
  if self._has_super:
1626
1682
  self._super_feature = self.get_weight(shape=[self.dim], name='super_edge_feature')
1683
+ if self._has_self_loop:
1684
+ self._self_loop_feature = self.get_weight(shape=[self.dim], name='self_loop_edge_feature')
1627
1685
  if self._allow_masking:
1628
1686
  self._mask_feature = self.get_weight(shape=[self.dim], name='mask_edge_feature')
1629
1687
 
1630
- if self._normalization:
1631
- if str(self._normalization).lower().startswith('batch'):
1688
+ if self._normalize:
1689
+ if str(self._normalize).lower().startswith('batch'):
1632
1690
  self._norm = keras.layers.BatchNormalization(
1633
1691
  name='output_batch_norm'
1634
1692
  )
@@ -1641,10 +1699,13 @@ class EdgeEmbedding(GraphLayer):
1641
1699
  feature = self._edge_dense(tensor.edge['feature'])
1642
1700
 
1643
1701
  if self._has_super:
1644
- super_feature = self._super_feature
1645
1702
  super_mask = keras.ops.expand_dims(tensor.edge['super'], 1)
1646
- feature = keras.ops.where(super_mask, super_feature, feature)
1703
+ feature = keras.ops.where(super_mask, self._super_feature, feature)
1647
1704
 
1705
+ if self._has_self_loop:
1706
+ self_loop_mask = keras.ops.expand_dims(tensor.edge['self_loop'], 1)
1707
+ feature = keras.ops.where(self_loop_mask, self._self_loop_feature, feature)
1708
+
1648
1709
  if (
1649
1710
  self._allow_masking and
1650
1711
  self._masking_rate is not None and
@@ -1659,10 +1720,10 @@ class EdgeEmbedding(GraphLayer):
1659
1720
  mask = keras.ops.expand_dims(mask, -1)
1660
1721
  feature = keras.ops.where(mask, self._mask_feature, feature)
1661
1722
  elif self._allow_masking:
1662
- # Slience warning of 'no gradients for variables'
1663
- feature = feature + (self._mask_feature * 0.0)
1723
+ # Simply added to silence warning ('no gradients for variables ...')
1724
+ feature += (0.0 * self._mask_feature)
1664
1725
 
1665
- if self._normalization:
1726
+ if self._normalize:
1666
1727
  feature = self._norm(feature)
1667
1728
 
1668
1729
  return tensor.update({'edge': {'feature': feature, 'embedding': feature}})
@@ -1684,7 +1745,7 @@ class EdgeEmbedding(GraphLayer):
1684
1745
  config = super().get_config()
1685
1746
  config.update({
1686
1747
  'dim': self.dim,
1687
- 'normalization': self._normalization,
1748
+ 'normalize': self._normalize,
1688
1749
  'allow_masking': self._allow_masking
1689
1750
  })
1690
1751
  return config
@@ -1883,6 +1944,56 @@ class GaussianDistance(GraphLayer):
1883
1944
  return config
1884
1945
 
1885
1946
 
1947
+ @keras.saving.register_keras_serializable(package='molcraft')
1948
+ class GaussianParams(keras.layers.Dense):
1949
+ '''Gaussian parameters.
1950
+
1951
+ Computes loc and scale via a dense layer. Should be used
1952
+ as the last layer in a model and paired with `losses.GaussianNLL`.
1953
+
1954
+ The loc and scale parameters (resulting from this layer) are concatenated
1955
+ together along the last axis, resulting in a single output tensor.
1956
+
1957
+ Args:
1958
+ events (int):
1959
+ The number of events. If the model makes a single prediction per example,
1960
+ then the number of events should be 1. If the model makes multiple predictions
1961
+ per example, then the number of events should be greater than 1.
1962
+ Default to 1.
1963
+ kwargs:
1964
+ See `keras.layers.Dense` documentation. `activation` will be applied
1965
+ to `loc` only. `scale` is automatically softplus activated.
1966
+ '''
1967
+ def __init__(self, events: int = 1, **kwargs):
1968
+ units = kwargs.pop('units', None)
1969
+ activation = kwargs.pop('activation', None)
1970
+ if units:
1971
+ if units % 2 != 0:
1972
+ raise ValueError(
1973
+ '`units` needs to be divisible by 2 as `units` = 2 x `events`.'
1974
+ )
1975
+ else:
1976
+ units = int(events * 2)
1977
+ super().__init__(units=units, **kwargs)
1978
+ self.events = events
1979
+ self.loc_activation = keras.activations.get(activation)
1980
+
1981
+ def call(self, inputs, **kwargs):
1982
+ loc_and_scale = super().call(inputs, **kwargs)
1983
+ loc = loc_and_scale[..., :self.events]
1984
+ scale = loc_and_scale[..., self.events:]
1985
+ scale = keras.ops.softplus(scale) + keras.backend.epsilon()
1986
+ loc = self.loc_activation(loc)
1987
+ return keras.ops.concatenate([loc, scale], axis=-1)
1988
+
1989
+ def get_config(self):
1990
+ config = super().get_config()
1991
+ config['events'] = self.events
1992
+ config['units'] = None
1993
+ config['activation'] = keras.activations.serialize(self.loc_activation)
1994
+ return config
1995
+
1996
+
1886
1997
  def Input(spec: tensors.GraphTensor.Spec) -> dict:
1887
1998
  """Used to specify inputs to model.
1888
1999
 
@@ -1914,9 +2025,11 @@ def Input(spec: tensors.GraphTensor.Spec) -> dict:
1914
2025
  for outer_field, data in spec.__dict__.items():
1915
2026
  inputs[outer_field] = {}
1916
2027
  for inner_field, nested_spec in data.items():
1917
- if inner_field in ['label', 'weight']:
1918
- if outer_field == 'context':
1919
- continue
2028
+ if outer_field == 'context' and inner_field in ['label', 'weight']:
2029
+ # Remove context label and weight from the symbolic input
2030
+ # as a functional model is strict about what input can be passed.
2031
+ # (We want to train and predict with the model.)
2032
+ continue
1920
2033
  kwargs = {
1921
2034
  'shape': nested_spec.shape[1:],
1922
2035
  'dtype': nested_spec.dtype,
@@ -1941,23 +2054,6 @@ def warn(message: str) -> None:
1941
2054
  stacklevel=1
1942
2055
  )
1943
2056
 
1944
- def _match_functional_input(functional_input, inputs):
1945
- matching_inputs = {}
1946
- for outer_field, data in functional_input.items():
1947
- matching_inputs[outer_field] = {}
1948
- for inner_field, _ in data.items():
1949
- call_input = inputs[outer_field].pop(inner_field)
1950
- matching_inputs[outer_field][inner_field] = call_input
1951
- unmatching_inputs = inputs
1952
- return matching_inputs, unmatching_inputs
1953
-
1954
- def _add_left_out_inputs(outputs, inputs):
1955
- for outer_field, data in inputs.items():
1956
- for inner_field, value in data.items():
1957
- if inner_field in ['label', 'weight']:
1958
- outputs[outer_field][inner_field] = value
1959
- return outputs
1960
-
1961
2057
  def _serialize_spec(spec: tensors.GraphTensor.Spec) -> dict:
1962
2058
  serialized_spec = {}
1963
2059
  for outer_field, data in spec.__dict__.items():