PyPI - brainstate - Versions diffs - 0.1.8__py2.py3-none-any.whl → 0.1.9__py2.py3-none-any.whl - Mend

brainstate 0.1.8py2.py3-none-any.whl → 0.1.9py2.py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (133) hide show

brainstate/__init__.py +58 -51
brainstate/_compatible_import.py +148 -148
brainstate/_state.py +1605 -1663
brainstate/_state_test.py +52 -52
brainstate/_utils.py +47 -47
brainstate/augment/__init__.py +30 -30
brainstate/augment/_autograd.py +778 -778
brainstate/augment/_autograd_test.py +1289 -1289
brainstate/augment/_eval_shape.py +99 -99
brainstate/augment/_eval_shape_test.py +38 -38
brainstate/augment/_mapping.py +1060 -1060
brainstate/augment/_mapping_test.py +597 -597
brainstate/augment/_random.py +151 -151
brainstate/compile/__init__.py +38 -38
brainstate/compile/_ad_checkpoint.py +204 -204
brainstate/compile/_ad_checkpoint_test.py +49 -49
brainstate/compile/_conditions.py +256 -256
brainstate/compile/_conditions_test.py +220 -220
brainstate/compile/_error_if.py +92 -92
brainstate/compile/_error_if_test.py +52 -52
brainstate/compile/_jit.py +346 -346
brainstate/compile/_jit_test.py +143 -143
brainstate/compile/_loop_collect_return.py +536 -536
brainstate/compile/_loop_collect_return_test.py +58 -58
brainstate/compile/_loop_no_collection.py +184 -184
brainstate/compile/_loop_no_collection_test.py +50 -50
brainstate/compile/_make_jaxpr.py +888 -888
brainstate/compile/_make_jaxpr_test.py +156 -156
brainstate/compile/_progress_bar.py +202 -202
brainstate/compile/_unvmap.py +159 -159
brainstate/compile/_util.py +147 -147
brainstate/environ.py +563 -563
brainstate/environ_test.py +62 -62
brainstate/functional/__init__.py +27 -26
brainstate/graph/__init__.py +29 -29
brainstate/graph/_graph_node.py +244 -244
brainstate/graph/_graph_node_test.py +73 -73
brainstate/graph/_graph_operation.py +1738 -1738
brainstate/graph/_graph_operation_test.py +563 -563
brainstate/init/__init__.py +26 -26
brainstate/init/_base.py +52 -52
brainstate/init/_generic.py +244 -244
brainstate/init/_random_inits.py +553 -553
brainstate/init/_random_inits_test.py +149 -149
brainstate/init/_regular_inits.py +105 -105
brainstate/init/_regular_inits_test.py +50 -50
brainstate/mixin.py +365 -363
brainstate/mixin_test.py +77 -73
brainstate/nn/__init__.py +135 -131
brainstate/{functional → nn}/_activations.py +808 -813
brainstate/{functional → nn}/_activations_test.py +331 -331
brainstate/nn/_collective_ops.py +514 -514
brainstate/nn/_collective_ops_test.py +43 -43
brainstate/nn/_common.py +178 -178
brainstate/nn/_conv.py +501 -501
brainstate/nn/_conv_test.py +238 -238
brainstate/nn/_delay.py +509 -502
brainstate/nn/_delay_test.py +238 -184
brainstate/nn/_dropout.py +426 -426
brainstate/nn/_dropout_test.py +100 -100
brainstate/nn/_dynamics.py +1343 -1343
brainstate/nn/_dynamics_test.py +78 -78
brainstate/nn/_elementwise.py +1119 -1119
brainstate/nn/_elementwise_test.py +169 -169
brainstate/nn/_embedding.py +58 -58
brainstate/nn/_exp_euler.py +92 -92
brainstate/nn/_exp_euler_test.py +35 -35
brainstate/nn/_fixedprob.py +239 -239
brainstate/nn/_fixedprob_test.py +114 -114
brainstate/nn/_inputs.py +608 -608
brainstate/nn/_linear.py +424 -424
brainstate/nn/_linear_mv.py +83 -83
brainstate/nn/_linear_mv_test.py +120 -120
brainstate/nn/_linear_test.py +107 -107
brainstate/nn/_ltp.py +28 -28
brainstate/nn/_module.py +377 -377
brainstate/nn/_module_test.py +40 -40
brainstate/nn/_neuron.py +705 -705
brainstate/nn/_neuron_test.py +161 -161
brainstate/nn/_normalizations.py +975 -918
brainstate/nn/_normalizations_test.py +73 -73
brainstate/{functional → nn}/_others.py +46 -46
brainstate/nn/_poolings.py +1177 -1177
brainstate/nn/_poolings_test.py +217 -217
brainstate/nn/_projection.py +486 -486
brainstate/nn/_rate_rnns.py +554 -554
brainstate/nn/_rate_rnns_test.py +63 -63
brainstate/nn/_readout.py +209 -209
brainstate/nn/_readout_test.py +53 -53
brainstate/nn/_stp.py +236 -236
brainstate/nn/_synapse.py +505 -505
brainstate/nn/_synapse_test.py +131 -131
brainstate/nn/_synaptic_projection.py +423 -423
brainstate/nn/_synouts.py +162 -162
brainstate/nn/_synouts_test.py +57 -57
brainstate/nn/_utils.py +89 -89
brainstate/nn/metrics.py +388 -388
brainstate/optim/__init__.py +38 -38
brainstate/optim/_base.py +64 -64
brainstate/optim/_lr_scheduler.py +448 -448
brainstate/optim/_lr_scheduler_test.py +50 -50
brainstate/optim/_optax_optimizer.py +152 -152
brainstate/optim/_optax_optimizer_test.py +53 -53
brainstate/optim/_sgd_optimizer.py +1104 -1104
brainstate/random/__init__.py +24 -24
brainstate/random/_rand_funs.py +3616 -3616
brainstate/random/_rand_funs_test.py +567 -567
brainstate/random/_rand_seed.py +210 -210
brainstate/random/_rand_seed_test.py +48 -48
brainstate/random/_rand_state.py +1409 -1409
brainstate/random/_random_for_unit.py +52 -52
brainstate/surrogate.py +1957 -1957
brainstate/transform.py +23 -23
brainstate/typing.py +304 -304
brainstate/util/__init__.py +50 -50
brainstate/util/caller.py +98 -98
brainstate/util/error.py +55 -55
brainstate/util/filter.py +469 -469
brainstate/util/others.py +540 -540
brainstate/util/pretty_pytree.py +945 -945
brainstate/util/pretty_pytree_test.py +159 -159
brainstate/util/pretty_repr.py +328 -328
brainstate/util/pretty_table.py +2954 -2954
brainstate/util/scaling.py +258 -258
brainstate/util/struct.py +523 -523
{brainstate-0.1.8.dist-info → brainstate-0.1.9.dist-info}/METADATA +91 -99
brainstate-0.1.9.dist-info/RECORD +130 -0
{brainstate-0.1.8.dist-info → brainstate-0.1.9.dist-info}/WHEEL +1 -1
{brainstate-0.1.8.dist-info → brainstate-0.1.9.dist-info/licenses}/LICENSE +202 -202
brainstate/functional/_normalization.py +0 -81
brainstate/functional/_spikes.py +0 -204
brainstate-0.1.8.dist-info/RECORD +0 -132
{brainstate-0.1.8.dist-info → brainstate-0.1.9.dist-info}/top_level.txt +0 -0

brainstate/nn/_conv.py CHANGED Viewed

@@ -1,501 +1,501 @@
-# Copyright 2024 BDP Ecosystem Limited. All Rights Reserved.
-#
-# Licensed under the Apache License, Version 2.0 (the "License");
-# you may not use this file except in compliance with the License.
-# You may obtain a copy of the License at
-#
-#     http://www.apache.org/licenses/LICENSE-2.0
-#
-# Unless required by applicable law or agreed to in writing, software
-# distributed under the License is distributed on an "AS IS" BASIS,
-# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
-# See the License for the specific language governing permissions and
-# limitations under the License.
-# ==============================================================================
-# -*- coding: utf-8 -*-
-import collections.abc
-from typing import Callable, Tuple, Union, Sequence, Optional, TypeVar
-import jax
-import jax.numpy as jnp
-from brainstate import init, functional
-from brainstate._state import ParamState
-from brainstate.typing import ArrayLike
-from ._module import Module
-T = TypeVar('T')
-__all__ = [
-    'Conv1d', 'Conv2d', 'Conv3d',
-    'ScaledWSConv1d', 'ScaledWSConv2d', 'ScaledWSConv3d',
-]
-def to_dimension_numbers(
-    num_spatial_dims: int,
-    channels_last: bool,
-    transpose: bool
-) -> jax.lax.ConvDimensionNumbers:
-    """Create a `lax.ConvDimensionNumbers` for the given inputs."""
-    num_dims = num_spatial_dims + 2
-    if channels_last:
-        spatial_dims = tuple(range(1, num_dims - 1))
-        image_dn = (0, num_dims - 1) + spatial_dims
-    else:
-        spatial_dims = tuple(range(2, num_dims))
-        image_dn = (0, 1) + spatial_dims
-    if transpose:
-        kernel_dn = (num_dims - 2, num_dims - 1) + tuple(range(num_dims - 2))
-    else:
-        kernel_dn = (num_dims - 1, num_dims - 2) + tuple(range(num_dims - 2))
-    return jax.lax.ConvDimensionNumbers(lhs_spec=image_dn,
-                                        rhs_spec=kernel_dn,
-                                        out_spec=image_dn)
-def replicate(
-    element: Union[T, Sequence[T]],
-    num_replicate: int,
-    name: str,
-) -> Tuple[T, ...]:
-    """Replicates entry in `element` `num_replicate` if needed."""
-    if isinstance(element, (str, bytes)) or not isinstance(element, collections.abc.Sequence):
-        return (element,) * num_replicate
-    elif len(element) == 1:
-        return tuple(list(element) * num_replicate)
-    elif len(element) == num_replicate:
-        return tuple(element)
-    else:
-        raise TypeError(f"{name} must be a scalar or sequence of length 1 or "
-                        f"sequence of length {num_replicate}.")
-class _BaseConv(Module):
-    # the number of spatial dimensions
-    num_spatial_dims: int
-    # the weight and its operations
-    weight: ParamState
-    def __init__(
-        self,
-        in_size: Sequence[int],
-        out_channels: int,
-        kernel_size: Union[int, Tuple[int, ...]],
-        stride: Union[int, Tuple[int, ...]] = 1,
-        padding: Union[str, int, Tuple[int, int], Sequence[Tuple[int, int]]] = 'SAME',
-        lhs_dilation: Union[int, Tuple[int, ...]] = 1,
-        rhs_dilation: Union[int, Tuple[int, ...]] = 1,
-        groups: int = 1,
-        w_mask: Optional[Union[ArrayLike, Callable]] = None,
-        name: str = None,
-    ):
-        super().__init__(name=name)
-        # general parameters
-        assert self.num_spatial_dims + 1 == len(in_size)
-        self.in_size = tuple(in_size)
-        self.in_channels = in_size[-1]
-        self.out_channels = out_channels
-        self.stride = replicate(stride, self.num_spatial_dims, 'stride')
-        self.kernel_size = replicate(kernel_size, self.num_spatial_dims, 'kernel_size')
-        self.lhs_dilation = replicate(lhs_dilation, self.num_spatial_dims, 'lhs_dilation')
-        self.rhs_dilation = replicate(rhs_dilation, self.num_spatial_dims, 'rhs_dilation')
-        self.groups = groups
-        self.dimension_numbers = to_dimension_numbers(self.num_spatial_dims, channels_last=True, transpose=False)
-        # the padding parameter
-        if isinstance(padding, str):
-            assert padding in ['SAME', 'VALID']
-        elif isinstance(padding, int):
-            padding = tuple((padding, padding) for _ in range(self.num_spatial_dims))
-        elif isinstance(padding, (tuple, list)):
-            if isinstance(padding[0], int):
-                padding = (padding,) * self.num_spatial_dims
-            elif isinstance(padding[0], (tuple, list)):
-                if len(padding) == 1:
-                    padding = tuple(padding) * self.num_spatial_dims
-                else:
-                    if len(padding) != self.num_spatial_dims:
-                        raise ValueError(
-                            f"Padding {padding} must be a Tuple[int, int], "
-                            f"or sequence of Tuple[int, int] with length 1, "
-                            f"or sequence of Tuple[int, int] with length {self.num_spatial_dims}."
-                        )
-                    padding = tuple(padding)
-        else:
-            raise ValueError
-        self.padding = padding
-        # the number of in-/out-channels
-        assert self.out_channels % self.groups == 0, '"out_channels" should be divisible by groups'
-        assert self.in_channels % self.groups == 0, '"in_channels" should be divisible by groups'
-        # kernel shape and w_mask
-        kernel_shape = tuple(self.kernel_size) + (self.in_channels // self.groups, self.out_channels)
-        self.kernel_shape = kernel_shape
-        self.w_mask = init.param(w_mask, kernel_shape, allow_none=True)
-    def _check_input_dim(self, x):
-        if x.ndim == self.num_spatial_dims + 2:
-            x_shape = x.shape[1:]
-        elif x.ndim == self.num_spatial_dims + 1:
-            x_shape = x.shape
-        else:
-            raise ValueError(f"expected {self.num_spatial_dims + 2}D (with batch) or "
-                             f"{self.num_spatial_dims + 1}D (without batch) input (got {x.ndim}D input, {x.shape})")
-        if self.in_size != x_shape:
-            raise ValueError(f"The expected input shape is {self.in_size}, while we got {x_shape}.")
-    def update(self, x):
-        self._check_input_dim(x)
-        non_batching = False
-        if x.ndim == self.num_spatial_dims + 1:
-            x = jnp.expand_dims(x, 0)
-            non_batching = True
-        y = self._conv_op(x, self.weight.value)
-        return y[0] if non_batching else y
-    def _conv_op(self, x, params):
-        raise NotImplementedError
-    def __repr__(self):
-        return (f'{self.__class__.__name__}('
-                f'in_channels={self.in_channels}, '
-                f'out_channels={self.out_channels}, '
-                f'kernel_size={self.kernel_size}, '
-                f'stride={self.stride}, '
-                f'padding={self.padding}, '
-                f'groups={self.groups})')
-class _Conv(_BaseConv):
-    num_spatial_dims: int = None
-    def __init__(
-        self,
-        in_size: Sequence[int],
-        out_channels: int,
-        kernel_size: Union[int, Tuple[int, ...]],
-        stride: Union[int, Tuple[int, ...]] = 1,
-        padding: Union[str, int, Tuple[int, int], Sequence[Tuple[int, int]]] = 'SAME',
-        lhs_dilation: Union[int, Tuple[int, ...]] = 1,
-        rhs_dilation: Union[int, Tuple[int, ...]] = 1,
-        groups: int = 1,
-        w_init: Union[Callable, ArrayLike] = init.XavierNormal(),
-        b_init: Optional[Union[Callable, ArrayLike]] = None,
-        w_mask: Optional[Union[ArrayLike, Callable]] = None,
-        name: str = None,
-        param_type: type = ParamState,
-    ):
-        super().__init__(
-            in_size=in_size,
-            out_channels=out_channels,
-            kernel_size=kernel_size,
-            stride=stride,
-            padding=padding,
-            lhs_dilation=lhs_dilation,
-            rhs_dilation=rhs_dilation,
-            groups=groups,
-            w_mask=w_mask,
-            name=name
-        )
-        self.w_initializer = w_init
-        self.b_initializer = b_init
-        # --- weights --- #
-        weight = init.param(self.w_initializer, self.kernel_shape, allow_none=False)
-        params = dict(weight=weight)
-        if self.b_initializer is not None:
-            bias_shape = (1,) * len(self.kernel_size) + (self.out_channels,)
-            bias = init.param(self.b_initializer, bias_shape, allow_none=True)
-            params['bias'] = bias
-        # The weight operation
-        self.weight = param_type(params)
-        # Evaluate the output shape
-        abstract_y = jax.eval_shape(
-            self._conv_op,
-            jax.ShapeDtypeStruct((128,) + self.in_size, weight.dtype),
-            params
-        )
-        y_shape = abstract_y.shape[1:]
-        self.out_size = y_shape
-    def _conv_op(self, x, params):
-        w = params['weight']
-        if self.w_mask is not None:
-            w = w * self.w_mask
-        y = jax.lax.conv_general_dilated(
-            lhs=x,
-            rhs=w,
-            window_strides=self.stride,
-            padding=self.padding,
-            lhs_dilation=self.lhs_dilation,
-            rhs_dilation=self.rhs_dilation,
-            feature_group_count=self.groups,
-            dimension_numbers=self.dimension_numbers
-        )
-        if 'bias' in params:
-            y = y + params['bias']
-        return y
-class Conv1d(_Conv):
-    """One-dimensional convolution.
-    The input should be a 3d array with the shape of ``[B, H, C]``.
-    Parameters
-    ----------
-    %s
-    """
-    __module__ = 'brainstate.nn'
-    num_spatial_dims: int = 1
-class Conv2d(_Conv):
-    """Two-dimensional convolution.
-    The input should be a 4d array with the shape of ``[B, H, W, C]``.
-    Parameters
-    ----------
-    %s
-    """
-    __module__ = 'brainstate.nn'
-    num_spatial_dims: int = 2
-class Conv3d(_Conv):
-    """Three-dimensional convolution.
-    The input should be a 5d array with the shape of ``[B, H, W, D, C]``.
-    Parameters
-    ----------
-    %s
-    """
-    __module__ = 'brainstate.nn'
-    num_spatial_dims: int = 3
-_conv_doc = '''
-  in_size: tuple of int
-    The input shape, without the batch size. This argument is important, since it is
-    used to evaluate the shape of the output.
-  out_channels: int
-    The number of output channels.
-  kernel_size: int, sequence of int
-    The shape of the convolutional kernel.
-    For 1D convolution, the kernel size can be passed as an integer.
-    For all other cases, it must be a sequence of integers.
-  stride: int, sequence of int
-    An integer or a sequence of `n` integers, representing the inter-window strides (default: 1).
-  padding: str, int, sequence of int, sequence of tuple
-    Either the string `'SAME'`, the string `'VALID'`, or a sequence of n `(low,
-    high)` integer pairs that give the padding to apply before and after each
-    spatial dimension.
-  lhs_dilation: int, sequence of int
-    An integer or a sequence of `n` integers, giving the
-    dilation factor to apply in each spatial dimension of `inputs`
-    (default: 1). Convolution with input dilation `d` is equivalent to
-    transposed convolution with stride `d`.
-  rhs_dilation: int, sequence of int
-    An integer or a sequence of `n` integers, giving the
-    dilation factor to apply in each spatial dimension of the convolution
-    kernel (default: 1). Convolution with kernel dilation
-    is also known as 'atrous convolution'.
-  groups: int
-    If specified, divides the input features into groups. default 1.
-  w_init: Callable, ArrayLike, Initializer
-    The initializer for the convolutional kernel.
-  b_init: Optional, Callable, ArrayLike, Initializer
-    The initializer for the bias.
-  w_mask: ArrayLike, Callable, Optional
-    The optional mask of the weights.
-  mode: Mode
-    The computation mode of the current object. Default it is `training`.
-  name: str, Optional
-    The name of the object.
-'''
-Conv1d.__doc__ = Conv1d.__doc__ % _conv_doc
-Conv2d.__doc__ = Conv2d.__doc__ % _conv_doc
-Conv3d.__doc__ = Conv3d.__doc__ % _conv_doc
-class _ScaledWSConv(_BaseConv):
-    def __init__(
-        self,
-        in_size: Sequence[int],
-        out_channels: int,
-        kernel_size: Union[int, Tuple[int, ...]],
-        stride: Union[int, Tuple[int, ...]] = 1,
-        padding: Union[str, int, Tuple[int, int], Sequence[Tuple[int, int]]] = 'SAME',
-        lhs_dilation: Union[int, Tuple[int, ...]] = 1,
-        rhs_dilation: Union[int, Tuple[int, ...]] = 1,
-        groups: int = 1,
-        ws_gain: bool = True,
-        eps: float = 1e-4,
-        w_init: Union[Callable, ArrayLike] = init.XavierNormal(),
-        b_init: Optional[Union[Callable, ArrayLike]] = None,
-        w_mask: Optional[Union[ArrayLike, Callable]] = None,
-        name: str = None,
-        param_type: type = ParamState,
-    ):
-        super().__init__(in_size=in_size,
-                         out_channels=out_channels,
-                         kernel_size=kernel_size,
-                         stride=stride,
-                         padding=padding,
-                         lhs_dilation=lhs_dilation,
-                         rhs_dilation=rhs_dilation,
-                         groups=groups,
-                         w_mask=w_mask,
-                         name=name, )
-        self.w_initializer = w_init
-        self.b_initializer = b_init
-        # --- weights --- #
-        weight = init.param(self.w_initializer, self.kernel_shape, allow_none=False)
-        params = dict(weight=weight)
-        if self.b_initializer is not None:
-            bias_shape = (1,) * len(self.kernel_size) + (self.out_channels,)
-            bias = init.param(self.b_initializer, bias_shape, allow_none=True)
-            params['bias'] = bias
-        # gain
-        if ws_gain:
-            gain_size = (1,) * len(self.kernel_size) + (1, self.out_channels)
-            ws_gain = jnp.ones(gain_size, dtype=params['weight'].dtype)
-            params['gain'] = ws_gain
-        # Epsilon, a small constant to avoid dividing by zero.
-        self.eps = eps
-        # The weight operation
-        self.weight = param_type(params)
-        # Evaluate the output shape
-        abstract_y = jax.eval_shape(
-            self._conv_op,
-            jax.ShapeDtypeStruct((128,) + self.in_size, weight.dtype),
-            params
-        )
-        y_shape = abstract_y.shape[1:]
-        self.out_size = y_shape
-    def _conv_op(self, x, params):
-        w = params['weight']
-        w = functional.weight_standardization(w, self.eps, params.get('gain', None))
-        if self.w_mask is not None:
-            w = w * self.w_mask
-        y = jax.lax.conv_general_dilated(
-            lhs=x,
-            rhs=w,
-            window_strides=self.stride,
-            padding=self.padding,
-            lhs_dilation=self.lhs_dilation,
-            rhs_dilation=self.rhs_dilation,
-            feature_group_count=self.groups,
-            dimension_numbers=self.dimension_numbers
-        )
-        if 'bias' in params:
-            y = y + params['bias']
-        return y
-class ScaledWSConv1d(_ScaledWSConv):
-    """One-dimensional convolution with weight standardization.
-    The input should be a 3d array with the shape of ``[B, H, C]``.
-    Parameters
-    ----------
-    %s
-    """
-    __module__ = 'brainstate.nn'
-    num_spatial_dims: int = 1
-class ScaledWSConv2d(_ScaledWSConv):
-    """Two-dimensional convolution with weight standardization.
-    The input should be a 4d array with the shape of ``[B, H, W, C]``.
-    Parameters
-    ----------
-    %s
-    """
-    __module__ = 'brainstate.nn'
-    num_spatial_dims: int = 2
-class ScaledWSConv3d(_ScaledWSConv):
-    """Three-dimensional convolution with weight standardization.
-    The input should be a 5d array with the shape of ``[B, H, W, D, C]``.
-    Parameters
-    ----------
-    %s
-    """
-    __module__ = 'brainstate.nn'
-    num_spatial_dims: int = 3
-_ws_conv_doc = '''
-  in_size: tuple of int
-    The input shape, without the batch size. This argument is important, since it is
-    used to evaluate the shape of the output.
-  out_channels: int
-    The number of output channels.
-  kernel_size: int, sequence of int
-    The shape of the convolutional kernel.
-    For 1D convolution, the kernel size can be passed as an integer.
-    For all other cases, it must be a sequence of integers.
-  stride: int, sequence of int
-    An integer or a sequence of `n` integers, representing the inter-window strides (default: 1).
-  padding: str, int, sequence of int, sequence of tuple
-    Either the string `'SAME'`, the string `'VALID'`, or a sequence of n `(low,
-    high)` integer pairs that give the padding to apply before and after each
-    spatial dimension.
-  lhs_dilation: int, sequence of int
-    An integer or a sequence of `n` integers, giving the
-    dilation factor to apply in each spatial dimension of `inputs`
-    (default: 1). Convolution with input dilation `d` is equivalent to
-    transposed convolution with stride `d`.
-  rhs_dilation: int, sequence of int
-    An integer or a sequence of `n` integers, giving the
-    dilation factor to apply in each spatial dimension of the convolution
-    kernel (default: 1). Convolution with kernel dilation
-    is also known as 'atrous convolution'.
-  groups: int
-    If specified, divides the input features into groups. default 1.
-  w_init: Callable, ArrayLike, Initializer
-    The initializer for the convolutional kernel.
-  b_init: Optional, Callable, ArrayLike, Initializer
-    The initializer for the bias.
-  ws_gain: bool
-    Whether to add a gain term for the weight standarization. The default is `True`.
-  eps: float
-    The epsilon value for numerical stability.
-  w_mask: ArrayLike, Callable, Optional
-    The optional mask of the weights.
-  mode: Mode
-    The computation mode of the current object. Default it is `training`.
-  name: str, Optional
-    The name of the object.
-'''
-ScaledWSConv1d.__doc__ = ScaledWSConv1d.__doc__ % _ws_conv_doc
-ScaledWSConv2d.__doc__ = ScaledWSConv2d.__doc__ % _ws_conv_doc
-ScaledWSConv3d.__doc__ = ScaledWSConv3d.__doc__ % _ws_conv_doc
+# Copyright 2024 BDP Ecosystem Limited. All Rights Reserved.
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#     http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+# ==============================================================================
+# -*- coding: utf-8 -*-
+import collections.abc
+from typing import Callable, Tuple, Union, Sequence, Optional, TypeVar
+import jax
+import jax.numpy as jnp
+from brainstate import init, functional
+from brainstate._state import ParamState
+from brainstate.typing import ArrayLike
+from ._module import Module
+T = TypeVar('T')
+__all__ = [
+    'Conv1d', 'Conv2d', 'Conv3d',
+    'ScaledWSConv1d', 'ScaledWSConv2d', 'ScaledWSConv3d',
+]
+def to_dimension_numbers(
+    num_spatial_dims: int,
+    channels_last: bool,
+    transpose: bool
+) -> jax.lax.ConvDimensionNumbers:
+    """Create a `lax.ConvDimensionNumbers` for the given inputs."""
+    num_dims = num_spatial_dims + 2
+    if channels_last:
+        spatial_dims = tuple(range(1, num_dims - 1))
+        image_dn = (0, num_dims - 1) + spatial_dims
+    else:
+        spatial_dims = tuple(range(2, num_dims))
+        image_dn = (0, 1) + spatial_dims
+    if transpose:
+        kernel_dn = (num_dims - 2, num_dims - 1) + tuple(range(num_dims - 2))
+    else:
+        kernel_dn = (num_dims - 1, num_dims - 2) + tuple(range(num_dims - 2))
+    return jax.lax.ConvDimensionNumbers(lhs_spec=image_dn,
+                                        rhs_spec=kernel_dn,
+                                        out_spec=image_dn)
+def replicate(
+    element: Union[T, Sequence[T]],
+    num_replicate: int,
+    name: str,
+) -> Tuple[T, ...]:
+    """Replicates entry in `element` `num_replicate` if needed."""
+    if isinstance(element, (str, bytes)) or not isinstance(element, collections.abc.Sequence):
+        return (element,) * num_replicate
+    elif len(element) == 1:
+        return tuple(list(element) * num_replicate)
+    elif len(element) == num_replicate:
+        return tuple(element)
+    else:
+        raise TypeError(f"{name} must be a scalar or sequence of length 1 or "
+                        f"sequence of length {num_replicate}.")
+class _BaseConv(Module):
+    # the number of spatial dimensions
+    num_spatial_dims: int
+    # the weight and its operations
+    weight: ParamState
+    def __init__(
+        self,
+        in_size: Sequence[int],
+        out_channels: int,
+        kernel_size: Union[int, Tuple[int, ...]],
+        stride: Union[int, Tuple[int, ...]] = 1,
+        padding: Union[str, int, Tuple[int, int], Sequence[Tuple[int, int]]] = 'SAME',
+        lhs_dilation: Union[int, Tuple[int, ...]] = 1,
+        rhs_dilation: Union[int, Tuple[int, ...]] = 1,
+        groups: int = 1,
+        w_mask: Optional[Union[ArrayLike, Callable]] = None,
+        name: str = None,
+    ):
+        super().__init__(name=name)
+        # general parameters
+        assert self.num_spatial_dims + 1 == len(in_size)
+        self.in_size = tuple(in_size)
+        self.in_channels = in_size[-1]
+        self.out_channels = out_channels
+        self.stride = replicate(stride, self.num_spatial_dims, 'stride')
+        self.kernel_size = replicate(kernel_size, self.num_spatial_dims, 'kernel_size')
+        self.lhs_dilation = replicate(lhs_dilation, self.num_spatial_dims, 'lhs_dilation')
+        self.rhs_dilation = replicate(rhs_dilation, self.num_spatial_dims, 'rhs_dilation')
+        self.groups = groups
+        self.dimension_numbers = to_dimension_numbers(self.num_spatial_dims, channels_last=True, transpose=False)
+        # the padding parameter
+        if isinstance(padding, str):
+            assert padding in ['SAME', 'VALID']
+        elif isinstance(padding, int):
+            padding = tuple((padding, padding) for _ in range(self.num_spatial_dims))
+        elif isinstance(padding, (tuple, list)):
+            if isinstance(padding[0], int):
+                padding = (padding,) * self.num_spatial_dims
+            elif isinstance(padding[0], (tuple, list)):
+                if len(padding) == 1:
+                    padding = tuple(padding) * self.num_spatial_dims
+                else:
+                    if len(padding) != self.num_spatial_dims:
+                        raise ValueError(
+                            f"Padding {padding} must be a Tuple[int, int], "
+                            f"or sequence of Tuple[int, int] with length 1, "
+                            f"or sequence of Tuple[int, int] with length {self.num_spatial_dims}."
+                        )
+                    padding = tuple(padding)
+        else:
+            raise ValueError
+        self.padding = padding
+        # the number of in-/out-channels
+        assert self.out_channels % self.groups == 0, '"out_channels" should be divisible by groups'
+        assert self.in_channels % self.groups == 0, '"in_channels" should be divisible by groups'
+        # kernel shape and w_mask
+        kernel_shape = tuple(self.kernel_size) + (self.in_channels // self.groups, self.out_channels)
+        self.kernel_shape = kernel_shape
+        self.w_mask = init.param(w_mask, kernel_shape, allow_none=True)
+    def _check_input_dim(self, x):
+        if x.ndim == self.num_spatial_dims + 2:
+            x_shape = x.shape[1:]
+        elif x.ndim == self.num_spatial_dims + 1:
+            x_shape = x.shape
+        else:
+            raise ValueError(f"expected {self.num_spatial_dims + 2}D (with batch) or "
+                             f"{self.num_spatial_dims + 1}D (without batch) input (got {x.ndim}D input, {x.shape})")
+        if self.in_size != x_shape:
+            raise ValueError(f"The expected input shape is {self.in_size}, while we got {x_shape}.")
+    def update(self, x):
+        self._check_input_dim(x)
+        non_batching = False
+        if x.ndim == self.num_spatial_dims + 1:
+            x = jnp.expand_dims(x, 0)
+            non_batching = True
+        y = self._conv_op(x, self.weight.value)
+        return y[0] if non_batching else y
+    def _conv_op(self, x, params):
+        raise NotImplementedError
+    def __repr__(self):
+        return (f'{self.__class__.__name__}('
+                f'in_channels={self.in_channels}, '
+                f'out_channels={self.out_channels}, '
+                f'kernel_size={self.kernel_size}, '
+                f'stride={self.stride}, '
+                f'padding={self.padding}, '
+                f'groups={self.groups})')
+class _Conv(_BaseConv):
+    num_spatial_dims: int = None
+    def __init__(
+        self,
+        in_size: Sequence[int],
+        out_channels: int,
+        kernel_size: Union[int, Tuple[int, ...]],
+        stride: Union[int, Tuple[int, ...]] = 1,
+        padding: Union[str, int, Tuple[int, int], Sequence[Tuple[int, int]]] = 'SAME',
+        lhs_dilation: Union[int, Tuple[int, ...]] = 1,
+        rhs_dilation: Union[int, Tuple[int, ...]] = 1,
+        groups: int = 1,
+        w_init: Union[Callable, ArrayLike] = init.XavierNormal(),
+        b_init: Optional[Union[Callable, ArrayLike]] = None,
+        w_mask: Optional[Union[ArrayLike, Callable]] = None,
+        name: str = None,
+        param_type: type = ParamState,
+    ):
+        super().__init__(
+            in_size=in_size,
+            out_channels=out_channels,
+            kernel_size=kernel_size,
+            stride=stride,
+            padding=padding,
+            lhs_dilation=lhs_dilation,
+            rhs_dilation=rhs_dilation,
+            groups=groups,
+            w_mask=w_mask,
+            name=name
+        )
+        self.w_initializer = w_init
+        self.b_initializer = b_init
+        # --- weights --- #
+        weight = init.param(self.w_initializer, self.kernel_shape, allow_none=False)
+        params = dict(weight=weight)
+        if self.b_initializer is not None:
+            bias_shape = (1,) * len(self.kernel_size) + (self.out_channels,)
+            bias = init.param(self.b_initializer, bias_shape, allow_none=True)
+            params['bias'] = bias
+        # The weight operation
+        self.weight = param_type(params)
+        # Evaluate the output shape
+        abstract_y = jax.eval_shape(
+            self._conv_op,
+            jax.ShapeDtypeStruct((128,) + self.in_size, weight.dtype),
+            params
+        )
+        y_shape = abstract_y.shape[1:]
+        self.out_size = y_shape
+    def _conv_op(self, x, params):
+        w = params['weight']
+        if self.w_mask is not None:
+            w = w * self.w_mask
+        y = jax.lax.conv_general_dilated(
+            lhs=x,
+            rhs=w,
+            window_strides=self.stride,
+            padding=self.padding,
+            lhs_dilation=self.lhs_dilation,
+            rhs_dilation=self.rhs_dilation,
+            feature_group_count=self.groups,
+            dimension_numbers=self.dimension_numbers
+        )
+        if 'bias' in params:
+            y = y + params['bias']
+        return y
+class Conv1d(_Conv):
+    # NOTE: this docstring is a template; its single ``%s`` placeholder is
+    # filled with the shared parameter text at import time, so it must not
+    # contain any other percent sign.
+    """One-dimensional convolution.
+    The input should be a 3d array with the shape of ``[B, H, C]``.
+    An input without the batch axis, ``[H, C]``, is also accepted.
+    Parameters
+    ----------
+    %s
+    """
+    # Make the class report ``brainstate.nn`` as its module.
+    __module__ = 'brainstate.nn'
+    # Number of spatial axes the convolution slides over.
+    num_spatial_dims: int = 1
+class Conv2d(_Conv):
+    # NOTE: this docstring is a template; its single ``%s`` placeholder is
+    # filled with the shared parameter text at import time, so it must not
+    # contain any other percent sign.
+    """Two-dimensional convolution.
+    The input should be a 4d array with the shape of ``[B, H, W, C]``.
+    An input without the batch axis, ``[H, W, C]``, is also accepted.
+    Parameters
+    ----------
+    %s
+    """
+    # Make the class report ``brainstate.nn`` as its module.
+    __module__ = 'brainstate.nn'
+    # Number of spatial axes the convolution slides over.
+    num_spatial_dims: int = 2
+class Conv3d(_Conv):
+    # NOTE: this docstring is a template; its single ``%s`` placeholder is
+    # filled with the shared parameter text at import time, so it must not
+    # contain any other percent sign.
+    """Three-dimensional convolution.
+    The input should be a 5d array with the shape of ``[B, H, W, D, C]``.
+    An input without the batch axis, ``[H, W, D, C]``, is also accepted.
+    Parameters
+    ----------
+    %s
+    """
+    # Make the class report ``brainstate.nn`` as its module.
+    __module__ = 'brainstate.nn'
+    # Number of spatial axes the convolution slides over.
+    num_spatial_dims: int = 3
+_conv_doc = '''
+  in_size: tuple of int
+    The input shape, without the batch size. This argument is important, since it is
+    used to evaluate the shape of the output.
+  out_channels: int
+    The number of output channels.
+  kernel_size: int, sequence of int
+    The shape of the convolutional kernel.
+    For 1D convolution, the kernel size can be passed as an integer.
+    For all other cases, it must be a sequence of integers.
+  stride: int, sequence of int
+    An integer or a sequence of `n` integers, representing the inter-window strides (default: 1).
+  padding: str, int, sequence of int, sequence of tuple
+    Either the string `'SAME'`, the string `'VALID'`, or a sequence of n `(low,
+    high)` integer pairs that give the padding to apply before and after each
+    spatial dimension.
+  lhs_dilation: int, sequence of int
+    An integer or a sequence of `n` integers, giving the
+    dilation factor to apply in each spatial dimension of `inputs`
+    (default: 1). Convolution with input dilation `d` is equivalent to
+    transposed convolution with stride `d`.
+  rhs_dilation: int, sequence of int
+    An integer or a sequence of `n` integers, giving the
+    dilation factor to apply in each spatial dimension of the convolution
+    kernel (default: 1). Convolution with kernel dilation
+    is also known as 'atrous convolution'.
+  groups: int
+    If specified, divides the input features into groups. default 1.
+  w_init: Callable, ArrayLike, Initializer
+    The initializer for the convolutional kernel.
+  b_init: Optional, Callable, ArrayLike, Initializer
+    The initializer for the bias.
+  w_mask: ArrayLike, Callable, Optional
+    The optional mask of the weights.
+  mode: Mode
+    The computation mode of the current object. Default it is `training`.
+  name: str, Optional
+    The name of the object.
+'''
+Conv1d.__doc__ = Conv1d.__doc__ % _conv_doc
+Conv2d.__doc__ = Conv2d.__doc__ % _conv_doc
+Conv3d.__doc__ = Conv3d.__doc__ % _conv_doc
+class _ScaledWSConv(_BaseConv):
+    def __init__(
+        self,
+        in_size: Sequence[int],
+        out_channels: int,
+        kernel_size: Union[int, Tuple[int, ...]],
+        stride: Union[int, Tuple[int, ...]] = 1,
+        padding: Union[str, int, Tuple[int, int], Sequence[Tuple[int, int]]] = 'SAME',
+        lhs_dilation: Union[int, Tuple[int, ...]] = 1,
+        rhs_dilation: Union[int, Tuple[int, ...]] = 1,
+        groups: int = 1,
+        ws_gain: bool = True,
+        eps: float = 1e-4,
+        w_init: Union[Callable, ArrayLike] = init.XavierNormal(),
+        b_init: Optional[Union[Callable, ArrayLike]] = None,
+        w_mask: Optional[Union[ArrayLike, Callable]] = None,
+        name: str = None,
+        param_type: type = ParamState,
+    ):
+        super().__init__(in_size=in_size,
+                         out_channels=out_channels,
+                         kernel_size=kernel_size,
+                         stride=stride,
+                         padding=padding,
+                         lhs_dilation=lhs_dilation,
+                         rhs_dilation=rhs_dilation,
+                         groups=groups,
+                         w_mask=w_mask,
+                         name=name, )
+        self.w_initializer = w_init
+        self.b_initializer = b_init
+        # --- weights --- #
+        weight = init.param(self.w_initializer, self.kernel_shape, allow_none=False)
+        params = dict(weight=weight)
+        if self.b_initializer is not None:
+            bias_shape = (1,) * len(self.kernel_size) + (self.out_channels,)
+            bias = init.param(self.b_initializer, bias_shape, allow_none=True)
+            params['bias'] = bias
+        # gain
+        if ws_gain:
+            gain_size = (1,) * len(self.kernel_size) + (1, self.out_channels)
+            ws_gain = jnp.ones(gain_size, dtype=params['weight'].dtype)
+            params['gain'] = ws_gain
+        # Epsilon, a small constant to avoid dividing by zero.
+        self.eps = eps
+        # The weight operation
+        self.weight = param_type(params)
+        # Evaluate the output shape
+        abstract_y = jax.eval_shape(
+            self._conv_op,
+            jax.ShapeDtypeStruct((128,) + self.in_size, weight.dtype),
+            params
+        )
+        y_shape = abstract_y.shape[1:]
+        self.out_size = y_shape
+    def _conv_op(self, x, params):
+        w = params['weight']
+        w = functional.weight_standardization(w, self.eps, params.get('gain', None))
+        if self.w_mask is not None:
+            w = w * self.w_mask
+        y = jax.lax.conv_general_dilated(
+            lhs=x,
+            rhs=w,
+            window_strides=self.stride,
+            padding=self.padding,
+            lhs_dilation=self.lhs_dilation,
+            rhs_dilation=self.rhs_dilation,
+            feature_group_count=self.groups,
+            dimension_numbers=self.dimension_numbers
+        )
+        if 'bias' in params:
+            y = y + params['bias']
+        return y
+class ScaledWSConv1d(_ScaledWSConv):
+    # NOTE: this docstring is a template; its single ``%s`` placeholder is
+    # filled with the shared parameter text at import time, so it must not
+    # contain any other percent sign.
+    """One-dimensional convolution with weight standardization.
+    The input should be a 3d array with the shape of ``[B, H, C]``.
+    An input without the batch axis, ``[H, C]``, is also accepted.
+    Parameters
+    ----------
+    %s
+    """
+    # Make the class report ``brainstate.nn`` as its module.
+    __module__ = 'brainstate.nn'
+    # Number of spatial axes the convolution slides over.
+    num_spatial_dims: int = 1
+class ScaledWSConv2d(_ScaledWSConv):
+    # NOTE: this docstring is a template; its single ``%s`` placeholder is
+    # filled with the shared parameter text at import time, so it must not
+    # contain any other percent sign.
+    """Two-dimensional convolution with weight standardization.
+    The input should be a 4d array with the shape of ``[B, H, W, C]``.
+    An input without the batch axis, ``[H, W, C]``, is also accepted.
+    Parameters
+    ----------
+    %s
+    """
+    # Make the class report ``brainstate.nn`` as its module.
+    __module__ = 'brainstate.nn'
+    # Number of spatial axes the convolution slides over.
+    num_spatial_dims: int = 2
+class ScaledWSConv3d(_ScaledWSConv):
+    # NOTE: this docstring is a template; its single ``%s`` placeholder is
+    # filled with the shared parameter text at import time, so it must not
+    # contain any other percent sign.
+    """Three-dimensional convolution with weight standardization.
+    The input should be a 5d array with the shape of ``[B, H, W, D, C]``.
+    An input without the batch axis, ``[H, W, D, C]``, is also accepted.
+    Parameters
+    ----------
+    %s
+    """
+    # Make the class report ``brainstate.nn`` as its module.
+    __module__ = 'brainstate.nn'
+    # Number of spatial axes the convolution slides over.
+    num_spatial_dims: int = 3
+_ws_conv_doc = '''
+  in_size: tuple of int
+    The input shape, without the batch size. This argument is important, since it is
+    used to evaluate the shape of the output.
+  out_channels: int
+    The number of output channels.
+  kernel_size: int, sequence of int
+    The shape of the convolutional kernel.
+    For 1D convolution, the kernel size can be passed as an integer.
+    For all other cases, it must be a sequence of integers.
+  stride: int, sequence of int
+    An integer or a sequence of `n` integers, representing the inter-window strides (default: 1).
+  padding: str, int, sequence of int, sequence of tuple
+    Either the string `'SAME'`, the string `'VALID'`, or a sequence of n `(low,
+    high)` integer pairs that give the padding to apply before and after each
+    spatial dimension.
+  lhs_dilation: int, sequence of int
+    An integer or a sequence of `n` integers, giving the
+    dilation factor to apply in each spatial dimension of `inputs`
+    (default: 1). Convolution with input dilation `d` is equivalent to
+    transposed convolution with stride `d`.
+  rhs_dilation: int, sequence of int
+    An integer or a sequence of `n` integers, giving the
+    dilation factor to apply in each spatial dimension of the convolution
+    kernel (default: 1). Convolution with kernel dilation
+    is also known as 'atrous convolution'.
+  groups: int
+    If specified, divides the input features into groups. default 1.
+  w_init: Callable, ArrayLike, Initializer
+    The initializer for the convolutional kernel.
+  b_init: Optional, Callable, ArrayLike, Initializer
+    The initializer for the bias.
+  ws_gain: bool
+    Whether to add a gain term for the weight standarization. The default is `True`.
+  eps: float
+    The epsilon value for numerical stability.
+  w_mask: ArrayLike, Callable, Optional
+    The optional mask of the weights.
+  mode: Mode
+    The computation mode of the current object. Default it is `training`.
+  name: str, Optional
+    The name of the object.
+'''
+ScaledWSConv1d.__doc__ = ScaledWSConv1d.__doc__ % _ws_conv_doc
+ScaledWSConv2d.__doc__ = ScaledWSConv2d.__doc__ % _ws_conv_doc
+ScaledWSConv3d.__doc__ = ScaledWSConv3d.__doc__ % _ws_conv_doc

brainstate 0.1.8__py2.py3-none-any.whl → 0.1.9__py2.py3-none-any.whl

brainstate 0.1.8py2.py3-none-any.whl → 0.1.9py2.py3-none-any.whl