PyPI - brainstate - Versions diffs - 0.0.2.post20241009__py2.py3-none-any.whl → 0.1.0__py2.py3-none-any.whl - Mend

brainstate-0.0.2.post20241009-py2.py3-none-any.whl → brainstate-0.1.0-py2.py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (175)

brainstate/__init__.py +31 -11
brainstate/_state.py +760 -316
brainstate/_state_test.py +41 -12
brainstate/_utils.py +31 -4
brainstate/augment/__init__.py +40 -0
brainstate/augment/_autograd.py +608 -0
brainstate/augment/_autograd_test.py +1193 -0
brainstate/augment/_eval_shape.py +102 -0
brainstate/augment/_eval_shape_test.py +40 -0
brainstate/augment/_mapping.py +525 -0
brainstate/augment/_mapping_test.py +210 -0
brainstate/augment/_random.py +99 -0
brainstate/{transform → compile}/__init__.py +25 -13
brainstate/compile/_ad_checkpoint.py +204 -0
brainstate/compile/_ad_checkpoint_test.py +51 -0
brainstate/compile/_conditions.py +259 -0
brainstate/compile/_conditions_test.py +221 -0
brainstate/compile/_error_if.py +94 -0
brainstate/compile/_error_if_test.py +54 -0
brainstate/compile/_jit.py +314 -0
brainstate/compile/_jit_test.py +143 -0
brainstate/compile/_loop_collect_return.py +516 -0
brainstate/compile/_loop_collect_return_test.py +59 -0
brainstate/compile/_loop_no_collection.py +185 -0
brainstate/compile/_loop_no_collection_test.py +51 -0
brainstate/compile/_make_jaxpr.py +756 -0
brainstate/compile/_make_jaxpr_test.py +134 -0
brainstate/compile/_progress_bar.py +111 -0
brainstate/compile/_unvmap.py +159 -0
brainstate/compile/_util.py +147 -0
brainstate/environ.py +408 -381
brainstate/environ_test.py +34 -32
brainstate/{nn/event → event}/__init__.py +6 -6
brainstate/event/_csr.py +308 -0
brainstate/event/_csr_test.py +118 -0
brainstate/event/_fixed_probability.py +271 -0
brainstate/event/_fixed_probability_test.py +128 -0
brainstate/event/_linear.py +219 -0
brainstate/event/_linear_test.py +112 -0
brainstate/{nn/event → event}/_misc.py +7 -7
brainstate/functional/_activations.py +521 -511
brainstate/functional/_activations_test.py +300 -300
brainstate/functional/_normalization.py +43 -43
brainstate/functional/_others.py +15 -15
brainstate/functional/_spikes.py +49 -49
brainstate/graph/__init__.py +33 -0
brainstate/graph/_graph_context.py +443 -0
brainstate/graph/_graph_context_test.py +65 -0
brainstate/graph/_graph_convert.py +246 -0
brainstate/graph/_graph_node.py +300 -0
brainstate/graph/_graph_node_test.py +75 -0
brainstate/graph/_graph_operation.py +1746 -0
brainstate/graph/_graph_operation_test.py +724 -0
brainstate/init/_base.py +28 -10
brainstate/init/_generic.py +175 -172
brainstate/init/_random_inits.py +470 -415
brainstate/init/_random_inits_test.py +150 -0
brainstate/init/_regular_inits.py +66 -69
brainstate/init/_regular_inits_test.py +51 -0
brainstate/mixin.py +236 -244
brainstate/mixin_test.py +44 -46
brainstate/nn/__init__.py +26 -51
brainstate/nn/_collective_ops.py +199 -0
brainstate/nn/_dyn_impl/__init__.py +46 -0
brainstate/nn/_dyn_impl/_dynamics_neuron.py +290 -0
brainstate/nn/_dyn_impl/_dynamics_neuron_test.py +162 -0
brainstate/nn/_dyn_impl/_dynamics_synapse.py +320 -0
brainstate/nn/_dyn_impl/_dynamics_synapse_test.py +132 -0
brainstate/nn/_dyn_impl/_inputs.py +154 -0
brainstate/nn/{_projection/__init__.py → _dyn_impl/_projection_alignpost.py} +6 -13
brainstate/nn/_dyn_impl/_rate_rnns.py +400 -0
brainstate/nn/_dyn_impl/_rate_rnns_test.py +64 -0
brainstate/nn/_dyn_impl/_readout.py +128 -0
brainstate/nn/_dyn_impl/_readout_test.py +54 -0
brainstate/nn/_dynamics/__init__.py +37 -0
brainstate/nn/_dynamics/_dynamics_base.py +631 -0
brainstate/nn/_dynamics/_dynamics_base_test.py +79 -0
brainstate/nn/_dynamics/_projection_base.py +346 -0
brainstate/nn/_dynamics/_state_delay.py +453 -0
brainstate/nn/_dynamics/_synouts.py +161 -0
brainstate/nn/_dynamics/_synouts_test.py +58 -0
brainstate/nn/_elementwise/__init__.py +22 -0
brainstate/nn/_elementwise/_dropout.py +418 -0
brainstate/nn/_elementwise/_dropout_test.py +100 -0
brainstate/nn/_elementwise/_elementwise.py +1122 -0
brainstate/nn/_elementwise/_elementwise_test.py +171 -0
brainstate/nn/_exp_euler.py +97 -0
brainstate/nn/_exp_euler_test.py +36 -0
brainstate/nn/_interaction/__init__.py +32 -0
brainstate/nn/_interaction/_connections.py +726 -0
brainstate/nn/_interaction/_connections_test.py +254 -0
brainstate/nn/_interaction/_embedding.py +59 -0
brainstate/nn/_interaction/_normalizations.py +388 -0
brainstate/nn/_interaction/_normalizations_test.py +75 -0
brainstate/nn/_interaction/_poolings.py +1179 -0
brainstate/nn/_interaction/_poolings_test.py +219 -0
brainstate/nn/_module.py +328 -0
brainstate/nn/_module_test.py +211 -0
brainstate/nn/metrics.py +309 -309
brainstate/optim/__init__.py +14 -2
brainstate/optim/_base.py +66 -0
brainstate/optim/_lr_scheduler.py +363 -400
brainstate/optim/_lr_scheduler_test.py +25 -24
brainstate/optim/_optax_optimizer.py +103 -176
brainstate/optim/_optax_optimizer_test.py +41 -1
brainstate/optim/_sgd_optimizer.py +950 -1025
brainstate/random/_rand_funs.py +3269 -3268
brainstate/random/_rand_funs_test.py +568 -0
brainstate/random/_rand_seed.py +149 -117
brainstate/random/_rand_seed_test.py +50 -0
brainstate/random/_rand_state.py +1360 -1318
brainstate/random/_random_for_unit.py +13 -13
brainstate/surrogate.py +1262 -1243
brainstate/{nn/_projection/_utils.py → transform.py} +1 -2
brainstate/typing.py +157 -130
brainstate/util/__init__.py +52 -0
brainstate/util/_caller.py +100 -0
brainstate/util/_dict.py +734 -0
brainstate/util/_dict_test.py +160 -0
brainstate/util/_error.py +28 -0
brainstate/util/_filter.py +178 -0
brainstate/util/_others.py +497 -0
brainstate/util/_pretty_repr.py +208 -0
brainstate/util/_scaling.py +260 -0
brainstate/util/_struct.py +524 -0
brainstate/util/_tracers.py +75 -0
brainstate/{_visualization.py → util/_visualization.py} +16 -16
{brainstate-0.0.2.post20241009.dist-info → brainstate-0.1.0.dist-info}/METADATA +11 -11
brainstate-0.1.0.dist-info/RECORD +135 -0
brainstate/_module.py +0 -1637
brainstate/_module_test.py +0 -207
brainstate/nn/_base.py +0 -251
brainstate/nn/_connections.py +0 -686
brainstate/nn/_dynamics.py +0 -426
brainstate/nn/_elementwise.py +0 -1438
brainstate/nn/_embedding.py +0 -66
brainstate/nn/_misc.py +0 -133
brainstate/nn/_normalizations.py +0 -389
brainstate/nn/_others.py +0 -101
brainstate/nn/_poolings.py +0 -1229
brainstate/nn/_poolings_test.py +0 -231
brainstate/nn/_projection/_align_post.py +0 -546
brainstate/nn/_projection/_align_pre.py +0 -599
brainstate/nn/_projection/_delta.py +0 -241
brainstate/nn/_projection/_vanilla.py +0 -101
brainstate/nn/_rate_rnns.py +0 -410
brainstate/nn/_readout.py +0 -136
brainstate/nn/_synouts.py +0 -166
brainstate/nn/event/csr.py +0 -312
brainstate/nn/event/csr_test.py +0 -118
brainstate/nn/event/fixed_probability.py +0 -276
brainstate/nn/event/fixed_probability_test.py +0 -127
brainstate/nn/event/linear.py +0 -220
brainstate/nn/event/linear_test.py +0 -111
brainstate/random/random_test.py +0 -593
brainstate/transform/_autograd.py +0 -585
brainstate/transform/_autograd_test.py +0 -1181
brainstate/transform/_conditions.py +0 -334
brainstate/transform/_conditions_test.py +0 -220
brainstate/transform/_error_if.py +0 -94
brainstate/transform/_error_if_test.py +0 -55
brainstate/transform/_jit.py +0 -265
brainstate/transform/_jit_test.py +0 -118
brainstate/transform/_loop_collect_return.py +0 -502
brainstate/transform/_loop_no_collection.py +0 -170
brainstate/transform/_make_jaxpr.py +0 -739
brainstate/transform/_make_jaxpr_test.py +0 -131
brainstate/transform/_mapping.py +0 -109
brainstate/transform/_progress_bar.py +0 -111
brainstate/transform/_unvmap.py +0 -143
brainstate/util.py +0 -746
brainstate-0.0.2.post20241009.dist-info/RECORD +0 -87
{brainstate-0.0.2.post20241009.dist-info → brainstate-0.1.0.dist-info}/LICENSE +0 -0
{brainstate-0.0.2.post20241009.dist-info → brainstate-0.1.0.dist-info}/WHEEL +0 -0
{brainstate-0.0.2.post20241009.dist-info → brainstate-0.1.0.dist-info}/top_level.txt +0 -0

brainstate/init/_random_inits.py CHANGED

@@ -14,486 +14,541 @@
 # ==============================================================================
 # -*- coding: utf-8 -*-
+from __future__ import annotations
 import math
-import brainunit as bu
+import brainunit as u
 import jax.numpy as jnp
 import numpy as np
 from brainstate import environ, random
-from brainstate.typing import ArrayLike
+from brainstate.typing import ArrayLike, SeedOrKey, DTypeLike
 from ._base import Initializer, to_size
 __all__ = [
-  'Normal',
-  'TruncatedNormal',
-  'Uniform',
-  'VarianceScaling',
-  'KaimingUniform',
-  'KaimingNormal',
-  'XavierUniform',
-  'XavierNormal',
-  'LecunUniform',
-  'LecunNormal',
-  'Orthogonal',
-  'DeltaOrthogonal',
+    'Normal',
+    'TruncatedNormal',
+    'Uniform',
+    'VarianceScaling',
+    'KaimingUniform',
+    'KaimingNormal',
+    'XavierUniform',
+    'XavierNormal',
+    'LecunUniform',
+    'LecunNormal',
+    'Orthogonal',
+    'DeltaOrthogonal',
 ]
 def calculate_gain(nonlinearity, param=None):
-  r"""Return the recommended gain value for the given nonlinearity function.
-  The values are as follows:
-  ================= ====================================================
-  nonlinearity      gain
-  ================= ====================================================
-  Linear / Identity :math:`1`
-  Conv{1,2,3}D      :math:`1`
-  Sigmoid           :math:`1`
-  Tanh              :math:`\frac{5}{3}`
-  ReLU              :math:`\sqrt{2}`
-  Leaky Relu        :math:`\sqrt{\frac{2}{1 + \text{negative\_slope}^2}}`
-  SELU              :math:`\frac{3}{4}`
-  ================= ====================================================
-  .. warning::
-      In order to implement `Self-Normalizing Neural Networks`_ ,
-      you should use ``nonlinearity='linear'`` instead of ``nonlinearity='selu'``.
-      This gives the initial weights a variance of ``1 / N``,
-      which is necessary to induce a stable fixed point in the forward pass.
-      In contrast, the default gain for ``SELU`` sacrifices the normalisation
-      effect for more stable gradient flow in rectangular layers.
-  Args:
-      nonlinearity: the non-linear function (`nn.functional` name)
-      param: optional parameter for the non-linear function
-  .. _Self-Normalizing Neural Networks: https://papers.nips.cc/paper/2017/hash/5d44ee6f2c3f71b73125876103c8f6c4-Abstract.html
-  """
-  linear_fns = ['linear', 'conv1d', 'conv2d', 'conv3d', 'conv_transpose1d', 'conv_transpose2d', 'conv_transpose3d']
-  if nonlinearity in linear_fns or nonlinearity == 'sigmoid':
-    return 1
-  elif nonlinearity == 'tanh':
-    return 5.0 / 3
-  elif nonlinearity == 'relu':
-    return math.sqrt(2.0)
-  elif nonlinearity == 'leaky_relu':
-    if param is None:
-      negative_slope = 0.01
-    elif not isinstance(param, bool) and isinstance(param, int) or isinstance(param, float):
-      # True/False are instances of int, hence check above
-      negative_slope = param
+    r"""Return the recommended gain value for the given nonlinearity function.
+    The values are as follows:
+    ================= ====================================================
+    nonlinearity      gain
+    ================= ====================================================
+    Linear / Identity :math:`1`
+    Conv{1,2,3}D      :math:`1`
+    Sigmoid           :math:`1`
+    Tanh              :math:`\frac{5}{3}`
+    ReLU              :math:`\sqrt{2}`
+    Leaky Relu        :math:`\sqrt{\frac{2}{1 + \text{negative\_slope}^2}}`
+    SELU              :math:`\frac{3}{4}`
+    ================= ====================================================
+    .. warning::
+        In order to implement `Self-Normalizing Neural Networks`_ ,
+        you should use ``nonlinearity='linear'`` instead of ``nonlinearity='selu'``.
+        This gives the initial weights a variance of ``1 / N``,
+        which is necessary to induce a stable fixed point in the forward pass.
+        In contrast, the default gain for ``SELU`` sacrifices the normalisation
+        effect for more stable gradient flow in rectangular layers.
+    Args:
+        nonlinearity: the non-linear function (`nn.functional` name)
+        param: optional parameter for the non-linear function
+    .. _Self-Normalizing Neural Networks: https://papers.nips.cc/paper/2017/hash/5d44ee6f2c3f71b73125876103c8f6c4-Abstract.html
+    """
+    linear_fns = ['linear', 'conv1d', 'conv2d', 'conv3d', 'conv_transpose1d', 'conv_transpose2d', 'conv_transpose3d']
+    if nonlinearity in linear_fns or nonlinearity == 'sigmoid':
+        return 1
+    elif nonlinearity == 'tanh':
+        return 5.0 / 3
+    elif nonlinearity == 'relu':
+        return math.sqrt(2.0)
+    elif nonlinearity == 'leaky_relu':
+        if param is None:
+            negative_slope = 0.01
+        elif not isinstance(param, bool) and isinstance(param, int) or isinstance(param, float):
+            # True/False are instances of int, hence check above
+            negative_slope = param
+        else:
+            raise ValueError("negative_slope {} not a valid number".format(param))
+        return math.sqrt(2.0 / (1 + negative_slope ** 2))
+    elif nonlinearity == 'selu':
+        return 3.0 / 4
     else:
-      raise ValueError("negative_slope {} not a valid number".format(param))
-    return math.sqrt(2.0 / (1 + negative_slope ** 2))
-  elif nonlinearity == 'selu':
-    return 3.0 / 4
-  else:
-    raise ValueError("Unsupported nonlinearity {}".format(nonlinearity))
+        raise ValueError("Unsupported nonlinearity {}".format(nonlinearity))
 def _format_shape(shape):
-  if isinstance(shape, int):
-    return (shape,)
-  if len(shape) == 0:
-    raise ValueError('Please provide shape.')
-  if len(shape) == 1:
-    if isinstance(shape[0], (tuple, list)):
-      return shape[0]
+    if isinstance(shape, int):
+        return (shape,)
+    if len(shape) == 0:
+        raise ValueError('Please provide shape.')
+    if len(shape) == 1:
+        if isinstance(shape[0], (tuple, list)):
+            return shape[0]
+        else:
+            return shape
     else:
-      return shape
-  else:
-    return shape
+        return shape
 def _compute_fans(shape, in_axis=-2, out_axis=-1):
-  receptive_field_size = np.prod(shape) / shape[in_axis] / shape[out_axis]
-  fan_in = shape[in_axis] * receptive_field_size
-  fan_out = shape[out_axis] * receptive_field_size
-  return fan_in, fan_out
+    receptive_field_size = np.prod(shape) / shape[in_axis] / shape[out_axis]
+    fan_in = shape[in_axis] * receptive_field_size
+    fan_out = shape[out_axis] * receptive_field_size
+    return fan_in, fan_out
 class Normal(Initializer):
-  """Initialize weights with normal distribution.
-  Parameters
-  ----------
-  scale : float
-    The gain of the derivation of the normal distribution.
-  """
-  def __init__(self, mean=0., scale=1., dtype=None):
-    super(Normal, self).__init__()
-    self.scale = scale
-    self.mean = mean
-    self.dtype = dtype or environ.dftype()
-  def __call__(self, shape):
-    shape = to_size(shape)
-    weights = random.normal(size=shape, loc=self.mean, scale=self.scale, dtype=self.dtype)
-    return weights
-  def __repr__(self):
-    return f'{self.__class__.__name__}(scale={self.scale}, dtype={self.dtype})'
+    """Initialize weights with normal distribution.
+    Parameters
+    ----------
+    scale : float
+      The gain of the derivation of the normal distribution.
+    """
+    __module__ = 'brainstate.init'
+    def __init__(
+        self,
+        mean: ArrayLike = 0.,
+        scale: ArrayLike = 1.,
+        unit: u.Unit = u.UNITLESS,
+        seed: SeedOrKey = None
+    ):
+        super().__init__()
+        self.scale = scale
+        self.mean = mean
+        self.rng = random.default_rng(seed)
+        self.unit = unit
+    def __call__(self, shape, dtype: DTypeLike = None):
+        shape = to_size(shape)
+        dtype = dtype or environ.dftype()
+        weights = self.rng.normal(size=shape, loc=self.mean, scale=self.scale, dtype=dtype)
+        return u.maybe_decimal(u.Quantity(weights, unit=self.unit))
 class TruncatedNormal(Initializer):
-  """Initialize weights with truncated normal distribution.
-  Parameters
-  ----------
-  loc : float, ndarray
-    Mean ("centre") of the distribution before truncating. Note that
-    the mean of the truncated distribution will not be exactly equal
-    to ``loc``.
-  scale : float
-    The standard deviation of the normal distribution before truncating.
-  lower : float, ndarray
-    A float or array of floats representing the lower bound for
-      truncation. Must be broadcast-compatible with ``upper``.
-  upper : float, ndarray
-    A float or array of floats representing the  upper bound for
-    truncation. Must be broadcast-compatible with ``lower``.
-  """
-  def __init__(self, loc=0., scale=1., lower=None, upper=None, dtype=None):
-    super(TruncatedNormal, self).__init__()
-    assert scale > 0, '`scale` must be positive.'
-    self.scale = scale
-    self.loc = loc
-    self.lower = lower
-    self.upper = upper
-    self.dtype = dtype or environ.dftype()
-  def __call__(self, shape):
-    weights = random.truncated_normal(
-      size=shape,
-      scale=self.scale,
-      lower=self.lower,
-      upper=self.upper,
-      loc=self.loc,
-      dtype=self.dtype
-    )
-    return weights
-  def __repr__(self):
-    return (f'{self.__class__.__name__}(loc={self.loc}, scale={self.scale}, '
-            f'lower={self.lower}, upper={self.upper}, dtype={self.dtype})')
+    """Initialize weights with truncated normal distribution.
+    Parameters
+    ----------
+    loc : float, ndarray
+      Mean ("centre") of the distribution before truncating. Note that
+      the mean of the truncated distribution will not be exactly equal
+      to ``loc``.
+    scale : float
+      The standard deviation of the normal distribution before truncating.
+    lower : float, ndarray
+      A float or array of floats representing the lower bound for
+        truncation. Must be broadcast-compatible with ``upper``.
+    upper : float, ndarray
+      A float or array of floats representing the  upper bound for
+      truncation. Must be broadcast-compatible with ``lower``.
+    """
+    __module__ = 'brainstate.init'
+    def __init__(
+        self,
+        loc: ArrayLike = 0.,
+        scale: ArrayLike = 1.,
+        unit: u.Unit = u.UNITLESS,
+        lower: ArrayLike = None,
+        upper: ArrayLike = None,
+        seed: SeedOrKey = None,
+    ):
+        super().__init__()
+        assert scale > 0, '`scale` must be positive.'
+        self.scale = scale
+        self.loc = loc
+        self.lower = lower
+        self.upper = upper
+        self.rng = random.default_rng(seed)
+        self.unit = unit
+    def __call__(self, shape, dtype: DTypeLike = None, ):
+        dtype = dtype or environ.dftype()
+        weights = self.rng.truncated_normal(
+            size=shape,
+            scale=self.scale,
+            lower=self.lower,
+            upper=self.upper,
+            loc=self.loc,
+            dtype=dtype
+        )
+        return u.maybe_decimal(u.Quantity(weights, unit=self.unit))
 class Gamma(Initializer):
-  """Initialize weights with Gamma distribution.
-  Parameters
-  ----------
-  shape: float, Array
-    Shape parameter.
-  scale: float, Array
-    The gain of the derivation of the Gamma distribution.
-  """
-  def __init__(self, shape, scale=None, dtype=None):
-    self.shape = shape
-    self.scale = scale
-    self.dtype = dtype or environ.dftype()
-  def __call__(self, shape):
-    shape = to_size(shape)
-    weights = random.gamma(self.shape, scale=self.scale, size=shape, dtype=self.dtype)
-    return weights
-  def __repr__(self):
-    return f'{self.__class__.__name__}(shape={self.shape}, scale={self.scale}, dtype={self.dtype})'
+    """Initialize weights with Gamma distribution.
+    Parameters
+    ----------
+    shape: float, Array
+      Shape parameter.
+    scale: float, Array
+      The gain of the derivation of the Gamma distribution.
+    """
+    __module__ = 'brainstate.init'
+    def __init__(
+        self,
+        shape: ArrayLike,
+        unit: u.Unit = u.UNITLESS,
+        scale: ArrayLike = None,
+        seed: SeedOrKey = None
+    ):
+        self.shape = shape
+        self.scale = scale
+        self.rng = random.default_rng(seed)
+        self.unit = unit
+    def __call__(self, shape, dtype: DTypeLike = None, ):
+        shape = to_size(shape)
+        dtype = dtype or environ.dftype()
+        weights = self.rng.gamma(self.shape, scale=self.scale, size=shape, dtype=dtype)
+        return u.maybe_decimal(u.Quantity(weights, unit=self.unit))
 class Exponential(Initializer):
-  """Initialize weights with Gamma distribution.
+    """Initialize weights with Gamma distribution.
-  Parameters
-  ----------
-  scale: float, Array
-    The gain of the derivation of the Exponential distribution.
+    Parameters
+    ----------
+    scale: float, Array
+      The gain of the derivation of the Exponential distribution.
-  """
+    """
+    __module__ = 'brainstate.init'
-  def __init__(self, scale=None, dtype=None):
-    self.scale = scale
-    self.dtype = dtype or environ.dftype()
+    def __init__(
+        self,
+        scale: ArrayLike = None,
+        seed: SeedOrKey = None,
+        unit: u.Unit = u.UNITLESS,
+    ):
+        self.scale = scale
+        self.rng = random.default_rng(seed)
+        self.unit = unit
-  def __call__(self, shape):
-    shape = to_size(shape)
-    weights = random.exponential(scale=self.scale, size=shape, dtype=self.dtype)
-    return weights
-  def __repr__(self):
-    return f'{self.__class__.__name__}(scale={self.scale}, dtype={self.dtype})'
+    def __call__(self, shape, dtype: DTypeLike = None, ):
+        shape = to_size(shape)
+        dtype = dtype or environ.dftype()
+        weights = self.rng.exponential(scale=self.scale, size=shape, dtype=dtype)
+        return u.maybe_decimal(u.Quantity(weights, unit=self.unit))
 class Uniform(Initializer):
-  """Initialize weights with uniform distribution.
-  Parameters
-  ----------
-  min_val : float
-    The lower limit of the uniform distribution.
-  max_val : float
-    The upper limit of the uniform distribution.
-  """
-  def __init__(self, min_val: float = 0., max_val: float = 1., dtype=None):
-    super(Uniform, self).__init__()
-    self.min_val = min_val
-    self.max_val = max_val
-    self.dtype = dtype or environ.dftype()
-  def __call__(self, shape):
-    shape = to_size(shape)
-    return random.uniform(low=self.min_val, high=self.max_val, size=shape, dtype=self.dtype)
-  def __repr__(self):
-    return (f'{self.__class__.__name__}(min_val={self.min_val}, '
-            f'max_val={self.max_val}, dtype={self.dtype})')
+    """Initialize weights with uniform distribution.
+    Parameters
+    ----------
+    min_val : float
+      The lower limit of the uniform distribution.
+    max_val : float
+      The upper limit of the uniform distribution.
+    """
+    __module__ = 'brainstate.init'
+    def __init__(
+        self,
+        min_val: ArrayLike = 0.,
+        max_val: ArrayLike = 1.,
+        seed: SeedOrKey = None,
+        unit: u.Unit = u.UNITLESS,
+    ):
+        super(Uniform, self).__init__()
+        self.min_val = min_val
+        self.max_val = max_val
+        self.rng = random.default_rng(seed)
+        self.unit = unit
+    def __call__(self, shape, dtype: DTypeLike = None, ):
+        shape = to_size(shape)
+        dtype = dtype or environ.dftype()
+        weights = self.rng.uniform(low=self.min_val, high=self.max_val, size=shape, dtype=dtype)
+        return u.maybe_decimal(u.Quantity(weights, unit=self.unit))
 class VarianceScaling(Initializer):
-  def __init__(
-      self,
-      scale: ArrayLike,
-      mode: str,
-      distribution: str,
-      in_axis: int = -2,
-      out_axis: int = -1,
-      dtype=None
-  ):
-    assert mode in ['fan_in', 'fan_out', 'fan_avg']
-    assert distribution in ['truncated_normal', 'normal', 'uniform']
-    self.scale = scale
-    self.mode = mode
-    self.in_axis = in_axis
-    self.out_axis = out_axis
-    self.distribution = distribution
-    self.dtype = dtype or environ.dftype()
-  def __call__(self, shape):
-    shape = to_size(shape)
-    fan_in, fan_out = _compute_fans(shape, in_axis=self.in_axis, out_axis=self.out_axis)
-    if self.mode == "fan_in":
-      denominator = fan_in
-    elif self.mode == "fan_out":
-      denominator = fan_out
-    elif self.mode == "fan_avg":
-      denominator = (fan_in + fan_out) / 2
-    else:
-      raise ValueError("invalid mode for variance scaling initializer: {}".format(self.mode))
-    scale = self.scale.mantissa if isinstance(self.scale, bu.Quantity) else self.scale
-    unit = bu.get_unit(self.scale)
-    variance = (scale / denominator).astype(self.dtype)
-    if self.distribution == "truncated_normal":
-      stddev = (jnp.sqrt(variance) / .87962566103423978).astype(self.dtype)
-      res = random.truncated_normal(-2, 2, shape, dtype=self.dtype) * stddev
-    elif self.distribution == "normal":
-      res = random.randn(*shape, dtype=self.dtype) * jnp.sqrt(variance).astype(self.dtype)
-    elif self.distribution == "uniform":
-      res = (random.uniform(low=-1, high=1, size=shape, dtype=self.dtype) *
-             jnp.sqrt(3 * variance).astype(self.dtype))
-    else:
-      raise ValueError("invalid distribution for variance scaling initializer")
-    return res if unit.is_unitless else bu.Quantity(res, unit=unit)
-  def __repr__(self):
-    name = self.__class__.__name__
-    blank = ' ' * len(name)
-    return (f'{name}(scale={self.scale}, mode={self.mode}, in_axis={self.in_axis}, \n'
-            f'{blank}out_axis={self.out_axis}, distribution={self.distribution}, dtype={self.dtype})')
+    __module__ = 'brainstate.init'
+    def __init__(
+        self,
+        scale: ArrayLike,
+        mode: str,
+        distribution: str,
+        in_axis: int = -2,
+        out_axis: int = -1,
+        seed: SeedOrKey = None,
+        unit: u.Unit = u.UNITLESS,
+    ):
+        assert mode in ['fan_in', 'fan_out', 'fan_avg']
+        assert distribution in ['truncated_normal', 'normal', 'uniform']
+        self.scale = scale
+        self.mode = mode
+        self.in_axis = in_axis
+        self.out_axis = out_axis
+        self.distribution = distribution
+        self.rng = random.default_rng(seed)
+        self.unit = unit
+    def __call__(self, shape, dtype: DTypeLike = None, ):
+        shape = to_size(shape)
+        dtype = dtype or environ.dftype()
+        fan_in, fan_out = _compute_fans(shape, in_axis=self.in_axis, out_axis=self.out_axis)
+        if self.mode == "fan_in":
+            denominator = fan_in
+        elif self.mode == "fan_out":
+            denominator = fan_out
+        elif self.mode == "fan_avg":
+            denominator = (fan_in + fan_out) / 2
+        else:
+            raise ValueError("invalid mode for variance scaling initializer: {}".format(self.mode))
+        variance = (self.scale / denominator).astype(dtype)
+        if self.distribution == "truncated_normal":
+            stddev = (jnp.sqrt(variance) / .87962566103423978).astype(dtype)
+            res = self.rng.truncated_normal(-2, 2, shape, dtype=dtype) * stddev
+        elif self.distribution == "normal":
+            res = self.rng.randn(*shape, dtype=dtype) * jnp.sqrt(variance).astype(dtype)
+        elif self.distribution == "uniform":
+            res = (self.rng.uniform(low=-1, high=1, size=shape, dtype=dtype) *
+                   jnp.sqrt(3 * variance).astype(dtype))
+        else:
+            raise ValueError("invalid distribution for variance scaling initializer")
+        return u.maybe_decimal(u.Quantity(res, unit=self.unit))
 class KaimingUniform(VarianceScaling):
-  def __init__(
-      self,
-      scale: float = 2.0,
-      mode: str = "fan_in",
-      distribution: str = "uniform",
-      in_axis: int = -2,
-      out_axis: int = -1,
-      dtype=None
-  ):
-    super().__init__(scale,
-                     mode,
-                     distribution,
-                     in_axis=in_axis,
-                     out_axis=out_axis,
-                     dtype=dtype)
+    __module__ = 'brainstate.init'
+    def __init__(
+        self,
+        scale: float = 2.0,
+        mode: str = "fan_in",
+        distribution: str = "uniform",
+        in_axis: int = -2,
+        out_axis: int = -1,
+        seed: SeedOrKey = None,
+        unit: u.Unit = u.UNITLESS,
+    ):
+        super().__init__(scale,
+                         mode,
+                         distribution,
+                         in_axis=in_axis,
+                         out_axis=out_axis,
+                         seed=seed,
+                         unit=unit)
 class KaimingNormal(VarianceScaling):
-  def __init__(
-      self,
-      scale: float = 2.0,
-      mode: str = "fan_in",
-      distribution: str = "truncated_normal",
-      in_axis: int = -2,
-      out_axis: int = -1,
-      dtype=None
-  ):
-    super().__init__(scale,
-                     mode,
-                     distribution,
-                     in_axis=in_axis,
-                     out_axis=out_axis,
-                     dtype=dtype)
+    __module__ = 'brainstate.init'
+    def __init__(
+        self,
+        scale: float = 2.0,
+        mode: str = "fan_in",
+        distribution: str = "truncated_normal",
+        in_axis: int = -2,
+        out_axis: int = -1,
+        seed: SeedOrKey = None,
+        unit: u.Unit = u.UNITLESS,
+    ):
+        super().__init__(scale,
+                         mode,
+                         distribution,
+                         in_axis=in_axis,
+                         out_axis=out_axis,
+                         seed=seed,
+                         unit=unit)
 class XavierUniform(VarianceScaling):
-  def __init__(
-      self,
-      scale: float = 1.0,
-      mode: str = "fan_avg",
-      distribution: str = "uniform",
-      in_axis: int = -2,
-      out_axis: int = -1,
-      dtype=None
-  ):
-    super().__init__(scale,
-                     mode,
-                     distribution,
-                     in_axis=in_axis,
-                     out_axis=out_axis,
-                     dtype=dtype)
+    __module__ = 'brainstate.init'
+    def __init__(
+        self,
+        scale: float = 1.0,
+        mode: str = "fan_avg",
+        distribution: str = "uniform",
+        in_axis: int = -2,
+        out_axis: int = -1,
+        seed: SeedOrKey = None,
+        unit: u.Unit = u.UNITLESS,
+    ):
+        super().__init__(scale,
+                         mode,
+                         distribution,
+                         in_axis=in_axis,
+                         out_axis=out_axis,
+                         seed=seed,
+                         unit=unit)
 class XavierNormal(VarianceScaling):
-  def __init__(
-      self,
-      scale: float = 1.0,
-      mode: str = "fan_avg",
-      distribution: str = "truncated_normal",
-      in_axis: int = -2,
-      out_axis: int = -1,
-      dtype=None
-  ):
-    super().__init__(scale,
-                     mode,
-                     distribution,
-                     in_axis=in_axis,
-                     out_axis=out_axis,
-                     dtype=dtype)
+    __module__ = 'brainstate.init'
+    def __init__(
+        self,
+        scale: float = 1.0,
+        mode: str = "fan_avg",
+        distribution: str = "truncated_normal",
+        in_axis: int = -2,
+        out_axis: int = -1,
+        seed: SeedOrKey = None,
+        unit: u.Unit = u.UNITLESS,
+    ):
+        super().__init__(scale,
+                         mode,
+                         distribution,
+                         in_axis=in_axis,
+                         out_axis=out_axis,
+                         seed=seed,
+                         unit=unit)
 class LecunUniform(VarianceScaling):
-  def __init__(
-      self,
-      scale: float = 1.0,
-      mode: str = "fan_in",
-      distribution: str = "uniform",
-      in_axis: int = -2,
-      out_axis: int = -1,
-      dtype=None
-  ):
-    super().__init__(scale,
-                     mode,
-                     distribution,
-                     in_axis=in_axis,
-                     out_axis=out_axis,
-                     dtype=dtype)
+    __module__ = 'brainstate.init'
+    def __init__(
+        self,
+        scale: float = 1.0,
+        mode: str = "fan_in",
+        distribution: str = "uniform",
+        in_axis: int = -2,
+        out_axis: int = -1,
+        seed: SeedOrKey = None,
+        unit: u.Unit = u.UNITLESS,
+    ):
+        super().__init__(scale,
+                         mode,
+                         distribution,
+                         in_axis=in_axis,
+                         out_axis=out_axis,
+                         seed=seed,
+                         unit=unit)
 class LecunNormal(VarianceScaling):
-  def __init__(
-      self,
-      scale: float = 1.0,
-      mode: str = "fan_in",
-      distribution: str = "truncated_normal",
-      in_axis: int = -2,
-      out_axis: int = -1,
-      dtype=None
-  ):
-    super().__init__(scale,
-                     mode,
-                     distribution,
-                     in_axis=in_axis,
-                     out_axis=out_axis,
-                     dtype=dtype)
+    __module__ = 'brainstate.init'
+    def __init__(
+        self,
+        scale: float = 1.0,
+        mode: str = "fan_in",
+        distribution: str = "truncated_normal",
+        in_axis: int = -2,
+        out_axis: int = -1,
+        seed: SeedOrKey = None,
+        unit: u.Unit = u.UNITLESS,
+    ):
+        super().__init__(scale,
+                         mode,
+                         distribution,
+                         in_axis=in_axis,
+                         out_axis=out_axis,
+                         seed=seed,
+                         unit=unit)
 class Orthogonal(Initializer):
-  """
-  Construct an initializer for uniformly distributed orthogonal matrices.
-  If the shape is not square, the matrix will have orthonormal rows or columns
-  depending on which side is smaller.
-  """
-  def __init__(
-      self,
-      scale: ArrayLike = 1.,
-      axis: int = -1,
-      dtype=None
-  ):
-    super().__init__()
-    self.scale = scale
-    self.axis = axis
-    self.dtype = dtype or environ.dftype()
-  def __call__(self, shape):
-    shape = to_size(shape)
-    n_rows = shape[self.axis]
-    n_cols = np.prod(shape) // n_rows
-    matrix_shape = (n_rows, n_cols) if n_rows > n_cols else (n_cols, n_rows)
-    norm_dst = random.normal(size=matrix_shape, dtype=self.dtype)
-    scale = self.scale.mantissa if isinstance(self.scale, bu.Quantity) else self.scale
-    unit = bu.get_unit(self.scale)
-    q_mat, r_mat = jnp.linalg.qr(norm_dst)
-    # Enforce Q is uniformly distributed
-    q_mat *= jnp.sign(jnp.diag(r_mat))
-    if n_rows < n_cols:
-      q_mat = q_mat.T
-    q_mat = jnp.reshape(q_mat, (n_rows,) + tuple(np.delete(shape, self.axis)))
-    q_mat = jnp.moveaxis(q_mat, 0, self.axis)
-    r = jnp.asarray(scale, dtype=self.dtype) * q_mat
-    return r if unit.is_unitless else bu.Quantity(r, unit=unit)
-  def __repr__(self):
-    return f'{self.__class__.__name__}(scale={self.scale}, axis={self.axis}, dtype={self.dtype})'
+    """
+    Construct an initializer for uniformly distributed orthogonal matrices.
+    If the shape is not square, the matrix will have orthonormal rows or columns
+    depending on which side is smaller.
+    """
+    __module__ = 'brainstate.init'
+    def __init__(
+        self,
+        scale: ArrayLike = 1.,
+        axis: int = -1,
+        seed: SeedOrKey = None,
+        unit: u.Unit = u.UNITLESS,
+    ):
+        super().__init__()
+        self.scale = scale
+        self.axis = axis
+        self.rng = random.default_rng(seed)
+        self.unit = unit
+    def __call__(self, shape, dtype: DTypeLike = None, ):
+        dtype = dtype or environ.dftype()
+        shape = to_size(shape)
+        n_rows = shape[self.axis]
+        n_cols = np.prod(shape) // n_rows
+        matrix_shape = (n_rows, n_cols) if n_rows > n_cols else (n_cols, n_rows)
+        norm_dst = self.rng.normal(size=matrix_shape, dtype=dtype)
+        q_mat, r_mat = jnp.linalg.qr(norm_dst)
+        # Enforce Q is uniformly distributed
+        q_mat *= jnp.sign(jnp.diag(r_mat))
+        if n_rows < n_cols:
+            q_mat = q_mat.T
+        q_mat = jnp.reshape(q_mat, (n_rows,) + tuple(np.delete(shape, self.axis)))
+        q_mat = jnp.moveaxis(q_mat, 0, self.axis)
+        r = jnp.asarray(self.scale, dtype=dtype) * q_mat
+        return u.maybe_decimal(u.Quantity(r, unit=self.unit))
 class DeltaOrthogonal(Initializer):
-  """
-  Construct an initializer for delta orthogonal kernels; see arXiv:1806.05393.
-  The shape must be 3D, 4D or 5D.
-  """
-  def __init__(self, scale=1.0, axis=-1, dtype=None):
-    super(DeltaOrthogonal, self).__init__()
-    self.scale = scale
-    self.axis = axis
-    self.dtype = dtype or environ.dftype()
-  def __call__(self, shape):
-    shape = to_size(shape)
-    if len(shape) not in [3, 4, 5]:
-      raise ValueError("Delta orthogonal initializer requires a 3D, 4D or 5D shape.")
-    if shape[-1] < shape[-2]:
-      raise ValueError("`fan_in` must be less or equal than `fan_out`. ")
-    scale = self.scale.mantissa if isinstance(self.scale, bu.Quantity) else self.scale
-    unit = bu.get_unit(self.scale)
-    ortho_matrix = Orthogonal(scale=scale, axis=self.axis, dtype=self.dtype)(*shape[-2:])
-    W = jnp.zeros(shape, dtype=self.dtype)
-    if len(shape) == 3:
-      k = shape[0]
-      W = W.at[(k - 1) // 2].set(ortho_matrix)
-    elif len(shape) == 4:
-      k1, k2 = shape[:2]
-      W = W.at[(k1 - 1) // 2, (k2 - 1) // 2].set(ortho_matrix)
-    else:
-      k1, k2, k3 = shape[:3]
-      W = W.at[(k1 - 1) // 2, (k2 - 1) // 2, (k3 - 1) // 2].set(ortho_matrix)
-    return W if unit.is_unitless else bu.Quantity(W, unit=unit)
-  def __repr__(self):
-    return f'{self.__class__.__name__}(scale={self.scale}, axis={self.axis}, dtype={self.dtype})'
+    """
+    Construct an initializer for delta orthogonal kernels; see arXiv:1806.05393.
+    The shape must be 3D, 4D or 5D.
+    """
+    __module__ = 'brainstate.init'
+    def __init__(
+        self,
+        scale: ArrayLike = 1.0,
+        axis: int = -1,
+        seed: SeedOrKey = None,
+        unit: u.Unit = u.UNITLESS,
+    ):
+        super().__init__()
+        self.scale = scale
+        self.axis = axis
+        self.orghogonal = Orthogonal(scale=scale, axis=axis, seed=seed)
+        self.unit = unit
+    def __call__(self, shape, dtype: DTypeLike = None, ):
+        shape = to_size(shape)
+        dtype = dtype or environ.dftype()
+        if len(shape) not in [3, 4, 5]:
+            raise ValueError("Delta orthogonal initializer requires a 3D, 4D or 5D shape.")
+        if shape[-1] < shape[-2]:
+            raise ValueError("`fan_in` must be less or equal than `fan_out`. ")
+        ortho_matrix = u.Quantity(self.orghogonal(shape[-2:]))
+        W = u.Quantity(u.math.zeros(shape, dtype=dtype), unit=u.get_unit(ortho_matrix))
+        if len(shape) == 3:
+            k = shape[0]
+            W = W.at[(k - 1) // 2].set(ortho_matrix)
+        elif len(shape) == 4:
+            k1, k2 = shape[:2]
+            W = W.at[(k1 - 1) // 2, (k2 - 1) // 2].set(ortho_matrix)
+        else:
+            k1, k2, k3 = shape[:3]
+            W = W.at[(k1 - 1) // 2, (k2 - 1) // 2, (k3 - 1) // 2].set(ortho_matrix)
+        return u.maybe_decimal(u.Quantity(W.mantissa, unit=self.unit))

brainstate 0.0.2.post20241009__py2.py3-none-any.whl → 0.1.0__py2.py3-none-any.whl

brainstate 0.0.2.post20241009__py2.py3-none-any.whl → 0.1.0__py2.py3-none-any.whl