PyPI - brainstate - Versions diffs - 0.1.10__py2.py3-none-any.whl → 0.2.0__py2.py3-none-any.whl - Mend

brainstate 0.1.10__py2.py3-none-any.whl → 0.2.0__py2.py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (163)

brainstate/__init__.py +130 -19
brainstate/_compatible_import.py +201 -9
brainstate/_compatible_import_test.py +681 -0
brainstate/_deprecation.py +210 -0
brainstate/_deprecation_test.py +2319 -0
brainstate/{util/error.py → _error.py} +10 -20
brainstate/_state.py +94 -47
brainstate/_state_test.py +1 -1
brainstate/_utils.py +1 -1
brainstate/environ.py +1279 -347
brainstate/environ_test.py +1187 -26
brainstate/graph/__init__.py +6 -13
brainstate/graph/_node.py +240 -0
brainstate/graph/_node_test.py +589 -0
brainstate/graph/{_graph_operation.py → _operation.py} +632 -746
brainstate/graph/_operation_test.py +1147 -0
brainstate/mixin.py +1209 -141
brainstate/mixin_test.py +991 -51
brainstate/nn/__init__.py +74 -72
brainstate/nn/_activations.py +587 -295
brainstate/nn/_activations_test.py +109 -86
brainstate/nn/_collective_ops.py +393 -274
brainstate/nn/_collective_ops_test.py +746 -15
brainstate/nn/_common.py +114 -66
brainstate/nn/_common_test.py +154 -0
brainstate/nn/_conv.py +1652 -143
brainstate/nn/_conv_test.py +838 -227
brainstate/nn/_delay.py +15 -28
brainstate/nn/_delay_test.py +25 -20
brainstate/nn/_dropout.py +359 -167
brainstate/nn/_dropout_test.py +429 -52
brainstate/nn/_dynamics.py +14 -90
brainstate/nn/_dynamics_test.py +1 -12
brainstate/nn/_elementwise.py +492 -313
brainstate/nn/_elementwise_test.py +806 -145
brainstate/nn/_embedding.py +369 -19
brainstate/nn/_embedding_test.py +156 -0
brainstate/nn/{_fixedprob.py → _event_fixedprob.py} +10 -16
brainstate/nn/{_fixedprob_test.py → _event_fixedprob_test.py} +6 -5
brainstate/nn/{_linear_mv.py → _event_linear.py} +2 -2
brainstate/nn/{_linear_mv_test.py → _event_linear_test.py} +6 -5
brainstate/nn/_exp_euler.py +200 -38
brainstate/nn/_exp_euler_test.py +350 -8
brainstate/nn/_linear.py +391 -71
brainstate/nn/_linear_test.py +427 -59
brainstate/nn/_metrics.py +1070 -0
brainstate/nn/_metrics_test.py +611 -0
brainstate/nn/_module.py +10 -3
brainstate/nn/_module_test.py +1 -1
brainstate/nn/_normalizations.py +688 -329
brainstate/nn/_normalizations_test.py +663 -37
brainstate/nn/_paddings.py +1020 -0
brainstate/nn/_paddings_test.py +723 -0
brainstate/nn/_poolings.py +1404 -342
brainstate/nn/_poolings_test.py +828 -92
brainstate/nn/{_rate_rnns.py → _rnns.py} +446 -54
brainstate/nn/_rnns_test.py +593 -0
brainstate/nn/_utils.py +132 -5
brainstate/nn/_utils_test.py +402 -0
brainstate/{init/_random_inits.py → nn/init.py} +301 -45
brainstate/{init/_random_inits_test.py → nn/init_test.py} +51 -20
brainstate/random/__init__.py +247 -1
brainstate/random/_rand_funs.py +668 -346
brainstate/random/_rand_funs_test.py +74 -1
brainstate/random/_rand_seed.py +541 -76
brainstate/random/_rand_seed_test.py +1 -1
brainstate/random/_rand_state.py +601 -393
brainstate/random/_rand_state_test.py +551 -0
brainstate/transform/__init__.py +59 -0
brainstate/transform/_ad_checkpoint.py +176 -0
brainstate/{compile → transform}/_ad_checkpoint_test.py +1 -1
brainstate/{augment → transform}/_autograd.py +360 -113
brainstate/{augment → transform}/_autograd_test.py +2 -2
brainstate/transform/_conditions.py +316 -0
brainstate/{compile → transform}/_conditions_test.py +11 -11
brainstate/{compile → transform}/_error_if.py +22 -20
brainstate/{compile → transform}/_error_if_test.py +1 -1
brainstate/transform/_eval_shape.py +145 -0
brainstate/{augment → transform}/_eval_shape_test.py +1 -1
brainstate/{compile → transform}/_jit.py +99 -46
brainstate/{compile → transform}/_jit_test.py +3 -3
brainstate/{compile → transform}/_loop_collect_return.py +219 -80
brainstate/{compile → transform}/_loop_collect_return_test.py +1 -1
brainstate/{compile → transform}/_loop_no_collection.py +133 -34
brainstate/{compile → transform}/_loop_no_collection_test.py +2 -2
brainstate/transform/_make_jaxpr.py +2016 -0
brainstate/transform/_make_jaxpr_test.py +1510 -0
brainstate/transform/_mapping.py +529 -0
brainstate/transform/_mapping_test.py +194 -0
brainstate/{compile → transform}/_progress_bar.py +78 -25
brainstate/{augment → transform}/_random.py +65 -45
brainstate/{compile → transform}/_unvmap.py +102 -5
brainstate/transform/_util.py +286 -0
brainstate/typing.py +594 -61
brainstate/typing_test.py +780 -0
brainstate/util/__init__.py +9 -32
brainstate/util/_others.py +1025 -0
brainstate/util/_others_test.py +962 -0
brainstate/util/_pretty_pytree.py +1301 -0
brainstate/util/_pretty_pytree_test.py +675 -0
brainstate/util/{pretty_repr.py → _pretty_repr.py} +161 -27
brainstate/util/_pretty_repr_test.py +696 -0
brainstate/util/filter.py +557 -81
brainstate/util/filter_test.py +912 -0
brainstate/util/struct.py +769 -382
brainstate/util/struct_test.py +602 -0
{brainstate-0.1.10.dist-info → brainstate-0.2.0.dist-info}/METADATA +34 -17
brainstate-0.2.0.dist-info/RECORD +111 -0
brainstate/augment/__init__.py +0 -30
brainstate/augment/_eval_shape.py +0 -99
brainstate/augment/_mapping.py +0 -1060
brainstate/augment/_mapping_test.py +0 -597
brainstate/compile/__init__.py +0 -38
brainstate/compile/_ad_checkpoint.py +0 -204
brainstate/compile/_conditions.py +0 -256
brainstate/compile/_make_jaxpr.py +0 -888
brainstate/compile/_make_jaxpr_test.py +0 -156
brainstate/compile/_util.py +0 -147
brainstate/functional/__init__.py +0 -27
brainstate/graph/_graph_node.py +0 -244
brainstate/graph/_graph_node_test.py +0 -73
brainstate/graph/_graph_operation_test.py +0 -563
brainstate/init/__init__.py +0 -26
brainstate/init/_base.py +0 -52
brainstate/init/_generic.py +0 -244
brainstate/init/_regular_inits.py +0 -105
brainstate/init/_regular_inits_test.py +0 -50
brainstate/nn/_inputs.py +0 -608
brainstate/nn/_ltp.py +0 -28
brainstate/nn/_neuron.py +0 -705
brainstate/nn/_neuron_test.py +0 -161
brainstate/nn/_others.py +0 -46
brainstate/nn/_projection.py +0 -486
brainstate/nn/_rate_rnns_test.py +0 -63
brainstate/nn/_readout.py +0 -209
brainstate/nn/_readout_test.py +0 -53
brainstate/nn/_stp.py +0 -236
brainstate/nn/_synapse.py +0 -505
brainstate/nn/_synapse_test.py +0 -131
brainstate/nn/_synaptic_projection.py +0 -423
brainstate/nn/_synouts.py +0 -162
brainstate/nn/_synouts_test.py +0 -57
brainstate/nn/metrics.py +0 -388
brainstate/optim/__init__.py +0 -38
brainstate/optim/_base.py +0 -64
brainstate/optim/_lr_scheduler.py +0 -448
brainstate/optim/_lr_scheduler_test.py +0 -50
brainstate/optim/_optax_optimizer.py +0 -152
brainstate/optim/_optax_optimizer_test.py +0 -53
brainstate/optim/_sgd_optimizer.py +0 -1104
brainstate/random/_random_for_unit.py +0 -52
brainstate/surrogate.py +0 -1957
brainstate/transform.py +0 -23
brainstate/util/caller.py +0 -98
brainstate/util/others.py +0 -540
brainstate/util/pretty_pytree.py +0 -945
brainstate/util/pretty_pytree_test.py +0 -159
brainstate/util/pretty_table.py +0 -2954
brainstate/util/scaling.py +0 -258
brainstate-0.1.10.dist-info/RECORD +0 -130
{brainstate-0.1.10.dist-info → brainstate-0.2.0.dist-info}/WHEEL +0 -0
{brainstate-0.1.10.dist-info → brainstate-0.2.0.dist-info}/licenses/LICENSE +0 -0
{brainstate-0.1.10.dist-info → brainstate-0.2.0.dist-info}/top_level.txt +0 -0

brainstate/{init/_random_inits.py → nn/init.py} RENAMED

@@ -1,4 +1,4 @@
-# Copyright 2024 BDP Ecosystem Limited. All Rights Reserved.
+# Copyright 2025 BrainX Ecosystem Limited. All Rights Reserved.
 #
 # Licensed under the Apache License, Version 2.0 (the "License");
 # you may not use this file except in compliance with the License.
@@ -13,19 +13,27 @@
 # limitations under the License.
 # ==============================================================================
-# -*- coding: utf-8 -*-
 import math
+from typing import Optional, Tuple
+from typing import Union, Callable, Sequence
 import brainunit as u
+import jax
 import jax.numpy as jnp
 import numpy as np
 from brainstate import environ, random
-from brainstate.typing import ArrayLike, SeedOrKey, DTypeLike
-from ._base import Initializer, to_size
+from brainstate._state import State
+from brainstate._utils import set_module_as
+from brainstate.typing import ArrayLike, SeedOrKey
+from brainstate.util import PrettyRepr, PrettyType, PrettyAttr
 __all__ = [
+    'param',
+    'calculate_init_gain',
+    'ZeroInit',
+    'Constant',
+    'Identity',
     'Normal',
     'TruncatedNormal',
     'Uniform',
@@ -41,7 +49,170 @@ __all__ = [
 ]
-def calculate_gain(nonlinearity, param=None):
+class Initializer(PrettyRepr):
+    """
+    Base class for initializers.
+    """
+    __module__ = 'brainstate.nn'
+    def __call__(self, *args, **kwargs):
+        raise NotImplementedError
+    def __pretty_repr__(self):
+        """
+        Pretty repr for the object.
+        """
+        yield PrettyType(type=type(self))
+        for name, value in vars(self).items():
+            if name.startswith('_'):
+                continue
+            yield PrettyAttr(name, repr(value))
+def to_size(x) -> Optional[Tuple[int]]:
+    if isinstance(x, (tuple, list)):
+        return tuple(x)
+    if isinstance(x, (int, np.integer)):
+        return (x,)
+    if x is None:
+        return x
+    raise ValueError(f'Cannot make a size for {x}')
+def _is_scalar(x):
+    return u.math.isscalar(x)
+def are_broadcastable_shapes(shape1, shape2):
+    """
+    Check if two shapes are broadcastable.
+    Parameters:
+    - shape1: Tuple[int], the shape of the first array.
+    - shape2: Tuple[int], the shape of the second array.
+    Returns:
+    - bool: True if shapes are broadcastable, False otherwise.
+    """
+    # Reverse the shapes to compare from the last dimension
+    shape1_reversed = shape1[::-1]
+    shape2_reversed = shape2[::-1]
+    # Iterate over the dimensions of the shorter shape
+    for dim1, dim2 in zip(shape1_reversed, shape2_reversed):
+        # Check if the dimensions are not equal and neither is 1
+        if dim1 != dim2 and 1 not in (dim1, dim2):
+            return False
+    # If all dimensions are compatible, the shapes are broadcastable
+    return True
+def _expand_params_to_match_sizes(params, sizes):
+    """
+    Expand the dimensions of params to match the dimensions of sizes.
+    Parameters:
+    - params: jax.Array or np.ndarray, the parameter array to be expanded.
+    - sizes: tuple[int] or list[int], the target shape dimensions.
+    Returns:
+    - Expanded params with dimensions matching sizes.
+    """
+    params_dim = params.ndim
+    sizes_dim = len(sizes)
+    dim_diff = sizes_dim - params_dim
+    # Add new axes to params if it has fewer dimensions than sizes
+    for _ in range(dim_diff):
+        params = u.math.expand_dims(params, axis=0)  # Add new axis at the last dimension
+    return params
+@set_module_as('brainstate.nn')
+def param(
+    parameter: Union[Callable, ArrayLike, State],
+    sizes: Union[int, Sequence[int]],
+    batch_size: Optional[int] = None,
+    allow_none: bool = True,
+    allow_scalar: bool = True,
+):
+    """Initialize parameters.
+    Parameters
+    ----------
+    parameter: callable, ArrayLike, State
+      The initialization of the parameter.
+      - If it is None, the created parameter will be None.
+      - If it is a callable function :math:`f`, the ``f(size)`` will be returned.
+      - If it is an instance of :py:class:`init.Initializer``, the ``f(size)`` will be returned.
+      - If it is a tensor, then this function check whether ``tensor.shape`` is equal to the given ``size``.
+    sizes: int, sequence of int
+      The shape of the parameter.
+    batch_size: int
+      The batch size.
+    allow_none: bool
+      Whether allow the parameter is None.
+    allow_scalar: bool
+      Whether allow the parameter is a scalar value.
+    Returns
+    -------
+    param: ArrayType, float, int, bool, None
+      The initialized parameter.
+    See Also
+    --------
+    noise, state
+    """
+    # Check if the parameter is None
+    if parameter is None:
+        if allow_none:
+            return None
+        else:
+            raise ValueError(f'Expect a parameter with type of float, ArrayType, Initializer, or '
+                             f'Callable function, but we got None. ')
+    # Check if the parameter is a scalar value
+    if allow_scalar and _is_scalar(parameter):
+        return parameter
+    # Convert sizes to a tuple
+    sizes = tuple(to_size(sizes))
+    # Check if the parameter is a callable function
+    if callable(parameter):
+        if batch_size is not None:
+            sizes = (batch_size,) + sizes
+        return parameter(sizes)
+    elif isinstance(parameter, (np.ndarray, jax.Array, u.Quantity, State)):
+        parameter = parameter
+    else:
+        raise ValueError(f'Unknown parameter type: {type(parameter)}')
+    # Check if the shape of the parameter matches the given size
+    if not are_broadcastable_shapes(parameter.shape, sizes):
+        raise ValueError(f'The shape of the parameter {parameter.shape} does not match with the given size {sizes}')
+    # Expand the parameter to match the given batch size
+    param_value = parameter.value if isinstance(parameter, State) else parameter
+    if batch_size is not None:
+        if param_value.ndim <= len(sizes):
+            # add a new axis to the params so that it matches the dimensionality of the given shape ``sizes``
+            param_value = _expand_params_to_match_sizes(param_value, sizes)
+            param_value = u.math.repeat(
+                u.math.expand_dims(param_value, axis=0),
+                batch_size,
+                axis=0
+            )
+        else:
+            if param_value.shape[0] != batch_size:
+                raise ValueError(f'The batch size of the parameter {param_value.shape[0]} '
+                                 f'does not match with the given batch size {batch_size}')
+    return type(parameter)(param_value) if isinstance(parameter, State) else param_value
+def calculate_init_gain(nonlinearity, param=None):
     r"""Return the recommended gain value for the given nonlinearity function.
     The values are as follows:
@@ -123,7 +294,7 @@ class Normal(Initializer):
       The gain of the derivation of the normal distribution.
     """
-    __module__ = 'brainstate.init'
+    __module__ = 'brainstate.nn'
     def __init__(
         self,
@@ -138,10 +309,11 @@ class Normal(Initializer):
         self.rng = random.default_rng(seed)
         self.unit = unit
-    def __call__(self, shape, dtype: DTypeLike = None):
+    def __call__(self, shape, **kwargs):
         shape = to_size(shape)
-        dtype = dtype or environ.dftype()
-        weights = self.rng.normal(size=shape, loc=self.mean, scale=self.scale, dtype=dtype)
+        dtype = kwargs.get('dtype', environ.dftype())
+        rng = kwargs.get('rng', self.rng)
+        weights = rng.normal(size=shape, loc=self.mean, scale=self.scale, dtype=dtype)
         return u.maybe_decimal(u.Quantity(weights, unit=self.unit))
@@ -164,7 +336,7 @@ class TruncatedNormal(Initializer):
       truncation. Must be broadcast-compatible with ``lower``.
     """
-    __module__ = 'brainstate.init'
+    __module__ = 'brainstate.nn'
     def __init__(
         self,
@@ -184,9 +356,10 @@ class TruncatedNormal(Initializer):
         self.rng = random.default_rng(seed)
         self.unit = unit
-    def __call__(self, shape, dtype: DTypeLike = None, ):
-        dtype = dtype or environ.dftype()
-        weights = self.rng.truncated_normal(
+    def __call__(self, shape, **kwargs):
+        dtype = kwargs.get('dtype', environ.dftype())
+        rng = kwargs.get('rng', self.rng)
+        weights = rng.truncated_normal(
             size=shape,
             scale=self.scale,
             lower=self.lower,
@@ -208,7 +381,7 @@ class Gamma(Initializer):
       The gain of the derivation of the Gamma distribution.
     """
-    __module__ = 'brainstate.init'
+    __module__ = 'brainstate.nn'
     def __init__(
         self,
@@ -222,10 +395,11 @@ class Gamma(Initializer):
         self.rng = random.default_rng(seed)
         self.unit = unit
-    def __call__(self, shape, dtype: DTypeLike = None, ):
+    def __call__(self, shape, **kwargs):
         shape = to_size(shape)
-        dtype = dtype or environ.dftype()
-        weights = self.rng.gamma(self.shape, scale=self.scale, size=shape, dtype=dtype)
+        dtype = kwargs.get('dtype', environ.dftype())
+        rng = kwargs.get('rng', self.rng)
+        weights = rng.gamma(self.shape, scale=self.scale, size=shape, dtype=dtype)
         return u.maybe_decimal(u.Quantity(weights, unit=self.unit))
@@ -238,7 +412,7 @@ class Exponential(Initializer):
       The gain of the derivation of the Exponential distribution.
     """
-    __module__ = 'brainstate.init'
+    __module__ = 'brainstate.nn'
     def __init__(
         self,
@@ -250,10 +424,11 @@ class Exponential(Initializer):
         self.rng = random.default_rng(seed)
         self.unit = unit
-    def __call__(self, shape, dtype: DTypeLike = None, ):
+    def __call__(self, shape, **kwargs):
         shape = to_size(shape)
-        dtype = dtype or environ.dftype()
-        weights = self.rng.exponential(scale=self.scale, size=shape, dtype=dtype)
+        dtype = kwargs.get('dtype', environ.dftype())
+        rng = kwargs.get('rng', self.rng)
+        weights = rng.exponential(scale=self.scale, size=shape, dtype=dtype)
         return u.maybe_decimal(u.Quantity(weights, unit=self.unit))
@@ -267,7 +442,7 @@ class Uniform(Initializer):
     max_val : float
       The upper limit of the uniform distribution.
     """
-    __module__ = 'brainstate.init'
+    __module__ = 'brainstate.nn'
     def __init__(
         self,
@@ -282,15 +457,16 @@ class Uniform(Initializer):
         self.rng = random.default_rng(seed)
         self.unit = unit
-    def __call__(self, shape, dtype: DTypeLike = None, ):
+    def __call__(self, shape, **kwargs):
         shape = to_size(shape)
-        dtype = dtype or environ.dftype()
-        weights = self.rng.uniform(low=self.min_val, high=self.max_val, size=shape, dtype=dtype)
+        dtype = kwargs.get('dtype', environ.dftype())
+        rng = kwargs.get('rng', self.rng)
+        weights = rng.uniform(low=self.min_val, high=self.max_val, size=shape, dtype=dtype)
         return u.maybe_decimal(u.Quantity(weights, unit=self.unit))
 class VarianceScaling(Initializer):
-    __module__ = 'brainstate.init'
+    __module__ = 'brainstate.nn'
     def __init__(
         self,
@@ -312,9 +488,10 @@ class VarianceScaling(Initializer):
         self.rng = random.default_rng(seed)
         self.unit = unit
-    def __call__(self, shape, dtype: DTypeLike = None, ):
+    def __call__(self, shape, **kwargs):
         shape = to_size(shape)
-        dtype = dtype or environ.dftype()
+        dtype = kwargs.get('dtype', environ.dftype())
+        rng = kwargs.get('rng', self.rng)
         fan_in, fan_out = _compute_fans(shape, in_axis=self.in_axis, out_axis=self.out_axis)
         if self.mode == "fan_in":
             denominator = fan_in
@@ -327,11 +504,11 @@ class VarianceScaling(Initializer):
         variance = (self.scale / denominator).astype(dtype)
         if self.distribution == "truncated_normal":
             stddev = (jnp.sqrt(variance) / .87962566103423978).astype(dtype)
-            res = self.rng.truncated_normal(-2, 2, shape, dtype=dtype) * stddev
+            res = rng.truncated_normal(-2, 2, shape, dtype=dtype) * stddev
         elif self.distribution == "normal":
-            res = self.rng.randn(*shape, dtype=dtype) * jnp.sqrt(variance).astype(dtype)
+            res = rng.randn(*shape, dtype=dtype) * jnp.sqrt(variance).astype(dtype)
         elif self.distribution == "uniform":
-            res = (self.rng.uniform(low=-1, high=1, size=shape, dtype=dtype) *
+            res = (rng.uniform(low=-1, high=1, size=shape, dtype=dtype) *
                    jnp.sqrt(3 * variance).astype(dtype))
         else:
             raise ValueError("invalid distribution for variance scaling initializer")
@@ -339,7 +516,7 @@ class VarianceScaling(Initializer):
 class KaimingUniform(VarianceScaling):
-    __module__ = 'brainstate.init'
+    __module__ = 'brainstate.nn'
     def __init__(
         self,
@@ -361,7 +538,7 @@ class KaimingUniform(VarianceScaling):
 class KaimingNormal(VarianceScaling):
-    __module__ = 'brainstate.init'
+    __module__ = 'brainstate.nn'
     def __init__(
         self,
@@ -383,7 +560,7 @@ class KaimingNormal(VarianceScaling):
 class XavierUniform(VarianceScaling):
-    __module__ = 'brainstate.init'
+    __module__ = 'brainstate.nn'
     def __init__(
         self,
@@ -405,7 +582,7 @@ class XavierUniform(VarianceScaling):
 class XavierNormal(VarianceScaling):
-    __module__ = 'brainstate.init'
+    __module__ = 'brainstate.nn'
     def __init__(
         self,
@@ -427,7 +604,7 @@ class XavierNormal(VarianceScaling):
 class LecunUniform(VarianceScaling):
-    __module__ = 'brainstate.init'
+    __module__ = 'brainstate.nn'
     def __init__(
         self,
@@ -449,7 +626,7 @@ class LecunUniform(VarianceScaling):
 class LecunNormal(VarianceScaling):
-    __module__ = 'brainstate.init'
+    __module__ = 'brainstate.nn'
     def __init__(
         self,
@@ -477,7 +654,7 @@ class Orthogonal(Initializer):
     If the shape is not square, the matrix will have orthonormal rows or columns
     depending on which side is smaller.
     """
-    __module__ = 'brainstate.init'
+    __module__ = 'brainstate.nn'
     def __init__(
         self,
@@ -492,13 +669,14 @@ class Orthogonal(Initializer):
         self.rng = random.default_rng(seed)
         self.unit = unit
-    def __call__(self, shape, dtype: DTypeLike = None, ):
-        dtype = dtype or environ.dftype()
+    def __call__(self, shape, **kwargs):
+        dtype = kwargs.get('dtype', environ.dftype())
+        rng = kwargs.get('rng', self.rng)
         shape = to_size(shape)
         n_rows = shape[self.axis]
         n_cols = np.prod(shape) // n_rows
         matrix_shape = (n_rows, n_cols) if n_rows > n_cols else (n_cols, n_rows)
-        norm_dst = self.rng.normal(size=matrix_shape, dtype=dtype)
+        norm_dst = rng.normal(size=matrix_shape, dtype=dtype)
         q_mat, r_mat = jnp.linalg.qr(norm_dst)
         # Enforce Q is uniformly distributed
@@ -517,7 +695,7 @@ class DeltaOrthogonal(Initializer):
     The shape must be 3D, 4D or 5D.
     """
-    __module__ = 'brainstate.init'
+    __module__ = 'brainstate.nn'
     def __init__(
         self,
@@ -532,9 +710,9 @@ class DeltaOrthogonal(Initializer):
         self.orghogonal = Orthogonal(scale=scale, axis=axis, seed=seed)
         self.unit = unit
-    def __call__(self, shape, dtype: DTypeLike = None, ):
+    def __call__(self, shape, **kwargs):
         shape = to_size(shape)
-        dtype = dtype or environ.dftype()
+        dtype = kwargs.get('dtype', environ.dftype())
         if len(shape) not in [3, 4, 5]:
             raise ValueError("Delta orthogonal initializer requires a 3D, 4D or 5D shape.")
         if shape[-1] < shape[-2]:
@@ -551,3 +729,81 @@ class DeltaOrthogonal(Initializer):
             k1, k2, k3 = shape[:3]
             W = W.at[(k1 - 1) // 2, (k2 - 1) // 2, (k3 - 1) // 2].set(ortho_matrix)
         return u.maybe_decimal(u.Quantity(W.mantissa, unit=self.unit))
+class ZeroInit(Initializer):
+    """Zero initializer.
+    Initialize the weights with zeros.
+    """
+    __module__ = 'brainstate.nn'
+    def __init__(self, unit: u.Unit = u.UNITLESS):
+        super(ZeroInit, self).__init__()
+        self.unit = unit
+    def __call__(self, shape, **kwargs):
+        dtype = kwargs.get('dtype', environ.dftype())
+        shape = to_size(shape)
+        return u.maybe_decimal(u.math.zeros(shape, dtype=dtype, unit=self.unit))
+class Constant(Initializer):
+    """Constant initializer.
+    Initialize the weights with the given values.
+    Parameters
+    ----------
+    value : float, int, bm.ndarray
+      The value to specify.
+    """
+    __module__ = 'brainstate.nn'
+    def __init__(self, value=1., ):
+        super(Constant, self).__init__()
+        self.value = value
+    def __call__(self, shape, **kwargs):
+        dtype = kwargs.get('dtype', environ.dftype())
+        shape = to_size(shape)
+        return u.maybe_decimal(u.math.full(shape, self.value, dtype=dtype))
+class Identity(Initializer):
+    """Returns the identity matrix.
+    This initializer was proposed in (Le, et al., 2015) [1]_.
+    Parameters
+    ----------
+    value : float
+      The optional scaling factor.
+    Returns
+    -------
+    shape: tuple of int
+      The weight shape/size.
+    References
+    ----------
+    .. [1] Le, Quoc V., Navdeep Jaitly, and Geoffrey E. Hinton. "A simple way to
+           initialize recurrent networks of rectified linear units." arXiv preprint
+           arXiv:1504.00941 (2015).
+    """
+    __module__ = 'brainstate.nn'
+    def __init__(self, value=1., unit: u.Unit = u.UNITLESS):
+        super(Identity, self).__init__()
+        self.value = value
+        self.unit = unit
+    def __call__(self, shape, **kwargs):
+        dtype = kwargs.get('dtype', environ.dftype())
+        shape = to_size(shape)
+        if isinstance(shape, (tuple, list)):
+            if len(shape) > 2:
+                raise ValueError(f'Only support initialize 2D weights for {self.__class__.__name__}.')
+        r = u.math.eye(*shape, dtype=dtype)
+        r = u.math.fill_diagonal(r, self.value)
+        return u.maybe_decimal(u.Quantity(r, unit=self.unit))

brainstate 0.1.10__py2.py3-none-any.whl → 0.2.0__py2.py3-none-any.whl

brainstate 0.1.10__py2.py3-none-any.whl → 0.2.0__py2.py3-none-any.whl