brainstate 0.2.1__py2.py3-none-any.whl → 0.2.2__py2.py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (115)
  1. brainstate/__init__.py +167 -169
  2. brainstate/_compatible_import.py +340 -340
  3. brainstate/_compatible_import_test.py +681 -681
  4. brainstate/_deprecation.py +210 -210
  5. brainstate/_deprecation_test.py +2297 -2319
  6. brainstate/_error.py +45 -45
  7. brainstate/_state.py +2157 -1652
  8. brainstate/_state_test.py +1129 -52
  9. brainstate/_utils.py +47 -47
  10. brainstate/environ.py +1495 -1495
  11. brainstate/environ_test.py +1223 -1223
  12. brainstate/graph/__init__.py +22 -22
  13. brainstate/graph/_node.py +240 -240
  14. brainstate/graph/_node_test.py +589 -589
  15. brainstate/graph/_operation.py +1620 -1624
  16. brainstate/graph/_operation_test.py +1147 -1147
  17. brainstate/mixin.py +1447 -1433
  18. brainstate/mixin_test.py +1017 -1017
  19. brainstate/nn/__init__.py +146 -137
  20. brainstate/nn/_activations.py +1100 -1100
  21. brainstate/nn/_activations_test.py +354 -354
  22. brainstate/nn/_collective_ops.py +635 -633
  23. brainstate/nn/_collective_ops_test.py +774 -774
  24. brainstate/nn/_common.py +226 -226
  25. brainstate/nn/_common_test.py +134 -154
  26. brainstate/nn/_conv.py +2010 -2010
  27. brainstate/nn/_conv_test.py +849 -849
  28. brainstate/nn/_delay.py +575 -575
  29. brainstate/nn/_delay_test.py +243 -243
  30. brainstate/nn/_dropout.py +618 -618
  31. brainstate/nn/_dropout_test.py +480 -477
  32. brainstate/nn/_dynamics.py +870 -1267
  33. brainstate/nn/_dynamics_test.py +53 -67
  34. brainstate/nn/_elementwise.py +1298 -1298
  35. brainstate/nn/_elementwise_test.py +829 -829
  36. brainstate/nn/_embedding.py +408 -408
  37. brainstate/nn/_embedding_test.py +156 -156
  38. brainstate/nn/_event_fixedprob.py +233 -233
  39. brainstate/nn/_event_fixedprob_test.py +115 -115
  40. brainstate/nn/_event_linear.py +83 -83
  41. brainstate/nn/_event_linear_test.py +121 -121
  42. brainstate/nn/_exp_euler.py +254 -254
  43. brainstate/nn/_exp_euler_test.py +377 -377
  44. brainstate/nn/_linear.py +744 -744
  45. brainstate/nn/_linear_test.py +475 -475
  46. brainstate/nn/_metrics.py +1070 -1070
  47. brainstate/nn/_metrics_test.py +611 -611
  48. brainstate/nn/_module.py +391 -384
  49. brainstate/nn/_module_test.py +40 -40
  50. brainstate/nn/_normalizations.py +1334 -1334
  51. brainstate/nn/_normalizations_test.py +699 -699
  52. brainstate/nn/_paddings.py +1020 -1020
  53. brainstate/nn/_paddings_test.py +722 -722
  54. brainstate/nn/_poolings.py +2239 -2239
  55. brainstate/nn/_poolings_test.py +952 -952
  56. brainstate/nn/_rnns.py +946 -946
  57. brainstate/nn/_rnns_test.py +592 -592
  58. brainstate/nn/_utils.py +216 -216
  59. brainstate/nn/_utils_test.py +401 -401
  60. brainstate/nn/init.py +809 -809
  61. brainstate/nn/init_test.py +180 -180
  62. brainstate/random/__init__.py +270 -270
  63. brainstate/random/{_rand_funs.py → _fun.py} +3938 -3938
  64. brainstate/random/{_rand_funs_test.py → _fun_test.py} +638 -640
  65. brainstate/random/_impl.py +672 -0
  66. brainstate/random/{_rand_seed.py → _seed.py} +675 -675
  67. brainstate/random/{_rand_seed_test.py → _seed_test.py} +48 -48
  68. brainstate/random/{_rand_state.py → _state.py} +1320 -1617
  69. brainstate/random/{_rand_state_test.py → _state_test.py} +551 -551
  70. brainstate/transform/__init__.py +56 -59
  71. brainstate/transform/_ad_checkpoint.py +176 -176
  72. brainstate/transform/_ad_checkpoint_test.py +49 -49
  73. brainstate/transform/_autograd.py +1025 -1025
  74. brainstate/transform/_autograd_test.py +1289 -1289
  75. brainstate/transform/_conditions.py +316 -316
  76. brainstate/transform/_conditions_test.py +220 -220
  77. brainstate/transform/_error_if.py +94 -94
  78. brainstate/transform/_error_if_test.py +52 -52
  79. brainstate/transform/_find_state.py +200 -0
  80. brainstate/transform/_find_state_test.py +84 -0
  81. brainstate/transform/_jit.py +399 -399
  82. brainstate/transform/_jit_test.py +143 -143
  83. brainstate/transform/_loop_collect_return.py +675 -675
  84. brainstate/transform/_loop_collect_return_test.py +58 -58
  85. brainstate/transform/_loop_no_collection.py +283 -283
  86. brainstate/transform/_loop_no_collection_test.py +50 -50
  87. brainstate/transform/_make_jaxpr.py +2176 -2016
  88. brainstate/transform/_make_jaxpr_test.py +1634 -1510
  89. brainstate/transform/_mapping.py +607 -529
  90. brainstate/transform/_mapping_test.py +104 -194
  91. brainstate/transform/_progress_bar.py +255 -255
  92. brainstate/transform/_unvmap.py +256 -256
  93. brainstate/transform/_util.py +286 -286
  94. brainstate/typing.py +837 -837
  95. brainstate/typing_test.py +780 -780
  96. brainstate/util/__init__.py +27 -27
  97. brainstate/util/_others.py +1024 -1024
  98. brainstate/util/_others_test.py +962 -962
  99. brainstate/util/_pretty_pytree.py +1301 -1301
  100. brainstate/util/_pretty_pytree_test.py +675 -675
  101. brainstate/util/_pretty_repr.py +462 -462
  102. brainstate/util/_pretty_repr_test.py +696 -696
  103. brainstate/util/filter.py +945 -945
  104. brainstate/util/filter_test.py +911 -911
  105. brainstate/util/struct.py +910 -910
  106. brainstate/util/struct_test.py +602 -602
  107. {brainstate-0.2.1.dist-info → brainstate-0.2.2.dist-info}/METADATA +108 -108
  108. brainstate-0.2.2.dist-info/RECORD +111 -0
  109. {brainstate-0.2.1.dist-info → brainstate-0.2.2.dist-info}/licenses/LICENSE +202 -202
  110. brainstate/transform/_eval_shape.py +0 -145
  111. brainstate/transform/_eval_shape_test.py +0 -38
  112. brainstate/transform/_random.py +0 -171
  113. brainstate-0.2.1.dist-info/RECORD +0 -111
  114. {brainstate-0.2.1.dist-info → brainstate-0.2.2.dist-info}/WHEEL +0 -0
  115. {brainstate-0.2.1.dist-info → brainstate-0.2.2.dist-info}/top_level.txt +0 -0
brainstate/nn/_elementwise.py
@@ -1,1298 +1,1298 @@
1
- # Copyright 2024 BrainX Ecosystem Limited. All Rights Reserved.
2
- #
3
- # Licensed under the Apache License, Version 2.0 (the "License");
4
- # you may not use this file except in compliance with the License.
5
- # You may obtain a copy of the License at
6
- #
7
- # http://www.apache.org/licenses/LICENSE-2.0
8
- #
9
- # Unless required by applicable law or agreed to in writing, software
10
- # distributed under the License is distributed on an "AS IS" BASIS,
11
- # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12
- # See the License for the specific language governing permissions and
13
- # limitations under the License.
14
- # ==============================================================================
15
-
16
- # -*- coding: utf-8 -*-
17
-
18
- from typing import Optional
19
-
20
- import brainunit as u
21
- import jax.numpy as jnp
22
-
23
- from brainstate._state import ParamState
24
- from brainstate.typing import ArrayLike
25
- from . import _activations as F
26
- from ._module import ElementWiseBlock
27
-
28
- __all__ = [
29
- # activation functions
30
- 'Threshold', 'ReLU', 'RReLU', 'Hardtanh', 'ReLU6', 'Sigmoid', 'Hardsigmoid',
31
- 'Tanh', 'SiLU', 'Mish', 'Hardswish', 'ELU', 'CELU', 'SELU', 'GLU', 'GELU',
32
- 'Hardshrink', 'LeakyReLU', 'LogSigmoid', 'Softplus', 'Softshrink', 'PReLU',
33
- 'Softsign', 'Tanhshrink', 'Softmin', 'Softmax', 'Softmax2d', 'LogSoftmax',
34
-
35
- # others
36
- 'Identity', 'SpikeBitwise',
37
- ]
38
-
39
-
40
- class Threshold(ElementWiseBlock):
41
- r"""Thresholds each element of the input Tensor.
42
-
43
- Threshold is defined as:
44
-
45
- .. math::
46
- y =
47
- \begin{cases}
48
- x, &\text{ if } x > \text{threshold} \\
49
- \text{value}, &\text{ otherwise }
50
- \end{cases}
51
-
52
- Parameters
53
- ----------
54
- threshold : float
55
- The value to threshold at.
56
- value : float
57
- The value to replace with.
58
-
59
- Shape
60
- -----
61
- - Input: :math:`(*)`, where :math:`*` means any number of dimensions.
62
- - Output: :math:`(*)`, same shape as the input.
63
-
64
- Examples
65
- --------
66
- .. code-block:: python
67
-
68
- >>> import brainstate.nn as nn
69
- >>> import brainstate
70
- >>> m = nn.Threshold(0.1, 20)
71
- >>> x = brainstate.random.randn(2)
72
- >>> output = m(x)
73
- """
74
- __module__ = 'brainstate.nn'
75
- threshold: float
76
- value: float
77
-
78
- def __init__(self, threshold: float, value: float) -> None:
79
- super().__init__()
80
- self.threshold = threshold
81
- self.value = value
82
-
83
- def __call__(self, x: ArrayLike) -> ArrayLike:
84
- dtype = u.math.get_dtype(x)
85
- return jnp.where(x > jnp.asarray(self.threshold, dtype=dtype),
86
- x,
87
- jnp.asarray(self.value, dtype=dtype))
88
-
89
- def __repr__(self):
90
- return f'{self.__class__.__name__}(threshold={self.threshold}, value={self.value})'
91
-
92
-
93
- class ReLU(ElementWiseBlock):
94
- r"""Applies the rectified linear unit function element-wise.
95
-
96
- The ReLU function is defined as:
97
-
98
- .. math::
99
- \text{ReLU}(x) = (x)^+ = \max(0, x)
100
-
101
- Shape
102
- -----
103
- - Input: :math:`(*)`, where :math:`*` means any number of dimensions.
104
- - Output: :math:`(*)`, same shape as the input.
105
-
106
- Examples
107
- --------
108
- .. code-block:: python
109
-
110
- >>> import brainstate.nn as nn
111
- >>> import brainstate
112
- >>> m = nn.ReLU()
113
- >>> x = brainstate.random.randn(2)
114
- >>> output = m(x)
115
-
116
- An implementation of CReLU - https://arxiv.org/abs/1603.05201
117
-
118
- .. code-block:: python
119
-
120
- >>> import brainstate.nn as nn
121
- >>> import brainstate
122
- >>> import jax.numpy as jnp
123
- >>> m = nn.ReLU()
124
- >>> x = jnp.expand_dims(brainstate.random.randn(2), 0)
125
- >>> output = jnp.concat((m(x), m(-x)))
126
- """
127
- __module__ = 'brainstate.nn'
128
-
129
- def __call__(self, x: ArrayLike) -> ArrayLike:
130
- return F.relu(x)
131
-
132
- def __repr__(self):
133
- return f'{self.__class__.__name__}()'
134
-
135
-
136
- class RReLU(ElementWiseBlock):
137
- r"""Applies the randomized leaky rectified liner unit function, element-wise.
138
-
139
- As described in the paper `Empirical Evaluation of Rectified Activations in
140
- Convolutional Network`_.
141
-
142
- The function is defined as:
143
-
144
- .. math::
145
- \text{RReLU}(x) =
146
- \begin{cases}
147
- x & \text{if } x \geq 0 \\
148
- ax & \text{ otherwise }
149
- \end{cases}
150
-
151
- where :math:`a` is randomly sampled from uniform distribution
152
- :math:`\mathcal{U}(\text{lower}, \text{upper})`.
153
-
154
- Parameters
155
- ----------
156
- lower : float, optional
157
- Lower bound of the uniform distribution. Default: :math:`\frac{1}{8}`
158
- upper : float, optional
159
- Upper bound of the uniform distribution. Default: :math:`\frac{1}{3}`
160
-
161
- Shape
162
- -----
163
- - Input: :math:`(*)`, where :math:`*` means any number of dimensions.
164
- - Output: :math:`(*)`, same shape as the input.
165
-
166
- References
167
- ----------
168
- .. _`Empirical Evaluation of Rectified Activations in Convolutional Network`:
169
- https://arxiv.org/abs/1505.00853
170
-
171
- Examples
172
- --------
173
- .. code-block:: python
174
-
175
- >>> import brainstate.nn as nn
176
- >>> import brainstate
177
- >>> m = nn.RReLU(0.1, 0.3)
178
- >>> x = brainstate.random.randn(2)
179
- >>> output = m(x)
180
- """
181
- __module__ = 'brainstate.nn'
182
- lower: float
183
- upper: float
184
-
185
- def __init__(
186
- self,
187
- lower: float = 1. / 8,
188
- upper: float = 1. / 3,
189
- ):
190
- super().__init__()
191
- self.lower = lower
192
- self.upper = upper
193
-
194
- def __call__(self, x: ArrayLike) -> ArrayLike:
195
- return F.rrelu(x, self.lower, self.upper)
196
-
197
- def extra_repr(self):
198
- return f'{self.__class__.__name__}(lower={self.lower}, upper={self.upper})'
199
-
200
-
201
- class Hardtanh(ElementWiseBlock):
202
- r"""Applies the HardTanh function element-wise.
203
-
204
- HardTanh is defined as:
205
-
206
- .. math::
207
- \text{HardTanh}(x) = \begin{cases}
208
- \text{max\_val} & \text{ if } x > \text{ max\_val } \\
209
- \text{min\_val} & \text{ if } x < \text{ min\_val } \\
210
- x & \text{ otherwise } \\
211
- \end{cases}
212
-
213
- Parameters
214
- ----------
215
- min_val : float, optional
216
- Minimum value of the linear region range. Default: -1
217
- max_val : float, optional
218
- Maximum value of the linear region range. Default: 1
219
-
220
- Notes
221
- -----
222
- Keyword arguments :attr:`min_value` and :attr:`max_value`
223
- have been deprecated in favor of :attr:`min_val` and :attr:`max_val`.
224
-
225
- Shape
226
- -----
227
- - Input: :math:`(*)`, where :math:`*` means any number of dimensions.
228
- - Output: :math:`(*)`, same shape as the input.
229
-
230
- Examples
231
- --------
232
- .. code-block:: python
233
-
234
- >>> import brainstate.nn as nn
235
- >>> import brainstate
236
- >>> m = nn.Hardtanh(-2, 2)
237
- >>> x = brainstate.random.randn(2)
238
- >>> output = m(x)
239
- """
240
- __module__ = 'brainstate.nn'
241
- min_val: float
242
- max_val: float
243
-
244
- def __init__(
245
- self,
246
- min_val: float = -1.,
247
- max_val: float = 1.,
248
- ) -> None:
249
- super().__init__()
250
- self.min_val = min_val
251
- self.max_val = max_val
252
- assert self.max_val > self.min_val
253
-
254
- def __call__(self, x: ArrayLike) -> ArrayLike:
255
- return F.hard_tanh(x, self.min_val, self.max_val)
256
-
257
- def extra_repr(self) -> str:
258
- return f'{self.__class__.__name__}(min_val={self.min_val}, max_val={self.max_val})'
259
-
260
-
261
- class ReLU6(Hardtanh):
262
- r"""Applies the element-wise function.
263
-
264
- ReLU6 is defined as:
265
-
266
- .. math::
267
- \text{ReLU6}(x) = \min(\max(0,x), 6)
268
-
269
- Shape
270
- -----
271
- - Input: :math:`(*)`, where :math:`*` means any number of dimensions.
272
- - Output: :math:`(*)`, same shape as the input.
273
-
274
- Examples
275
- --------
276
- .. code-block:: python
277
-
278
- >>> import brainstate.nn as nn
279
- >>> import brainstate
280
- >>> m = nn.ReLU6()
281
- >>> x = brainstate.random.randn(2)
282
- >>> output = m(x)
283
- """
284
- __module__ = 'brainstate.nn'
285
-
286
- def __init__(self):
287
- super().__init__(0., 6.)
288
-
289
-
290
- class Sigmoid(ElementWiseBlock):
291
- r"""Applies the element-wise function.
292
-
293
- Sigmoid is defined as:
294
-
295
- .. math::
296
- \text{Sigmoid}(x) = \sigma(x) = \frac{1}{1 + \exp(-x)}
297
-
298
- Shape
299
- -----
300
- - Input: :math:`(*)`, where :math:`*` means any number of dimensions.
301
- - Output: :math:`(*)`, same shape as the input.
302
-
303
- Examples
304
- --------
305
- .. code-block:: python
306
-
307
- >>> import brainstate.nn as nn
308
- >>> import brainstate
309
- >>> m = nn.Sigmoid()
310
- >>> x = brainstate.random.randn(2)
311
- >>> output = m(x)
312
- """
313
- __module__ = 'brainstate.nn'
314
-
315
- def __call__(self, x: ArrayLike) -> ArrayLike:
316
- return F.sigmoid(x)
317
-
318
-
319
- class Hardsigmoid(ElementWiseBlock):
320
- r"""Applies the Hardsigmoid function element-wise.
321
-
322
- Hardsigmoid is defined as:
323
-
324
- .. math::
325
- \text{Hardsigmoid}(x) = \begin{cases}
326
- 0 & \text{if~} x \le -3, \\
327
- 1 & \text{if~} x \ge +3, \\
328
- x / 6 + 1 / 2 & \text{otherwise}
329
- \end{cases}
330
-
331
- Shape
332
- -----
333
- - Input: :math:`(*)`, where :math:`*` means any number of dimensions.
334
- - Output: :math:`(*)`, same shape as the input.
335
-
336
- Examples
337
- --------
338
- .. code-block:: python
339
-
340
- >>> import brainstate.nn as nn
341
- >>> import brainstate
342
- >>> m = nn.Hardsigmoid()
343
- >>> x = brainstate.random.randn(2)
344
- >>> output = m(x)
345
- """
346
- __module__ = 'brainstate.nn'
347
-
348
- def __call__(self, x: ArrayLike) -> ArrayLike:
349
- return F.hard_sigmoid(x)
350
-
351
-
352
- class Tanh(ElementWiseBlock):
353
- r"""Applies the Hyperbolic Tangent (Tanh) function element-wise.
354
-
355
- Tanh is defined as:
356
-
357
- .. math::
358
- \text{Tanh}(x) = \tanh(x) = \frac{\exp(x) - \exp(-x)} {\exp(x) + \exp(-x)}
359
-
360
- Shape
361
- -----
362
- - Input: :math:`(*)`, where :math:`*` means any number of dimensions.
363
- - Output: :math:`(*)`, same shape as the input.
364
-
365
- Examples
366
- --------
367
- .. code-block:: python
368
-
369
- >>> import brainstate.nn as nn
370
- >>> import brainstate
371
- >>> m = nn.Tanh()
372
- >>> x = brainstate.random.randn(2)
373
- >>> output = m(x)
374
- """
375
- __module__ = 'brainstate.nn'
376
-
377
- def __call__(self, x: ArrayLike) -> ArrayLike:
378
- return F.tanh(x)
379
-
380
-
381
- class SiLU(ElementWiseBlock):
382
- r"""Applies the Sigmoid Linear Unit (SiLU) function, element-wise.
383
-
384
- The SiLU function is also known as the swish function.
385
-
386
- .. math::
387
- \text{silu}(x) = x * \sigma(x), \text{where } \sigma(x) \text{ is the logistic sigmoid.}
388
-
389
- Notes
390
- -----
391
- See `Gaussian Error Linear Units (GELUs) <https://arxiv.org/abs/1606.08415>`_
392
- where the SiLU (Sigmoid Linear Unit) was originally coined, and see
393
- `Sigmoid-Weighted Linear Units for Neural Network Function Approximation
394
- in Reinforcement Learning <https://arxiv.org/abs/1702.03118>`_ and `Swish:
395
- a Self-Gated Activation Function <https://arxiv.org/abs/1710.05941v1>`_
396
- where the SiLU was experimented with later.
397
-
398
- Shape
399
- -----
400
- - Input: :math:`(*)`, where :math:`*` means any number of dimensions.
401
- - Output: :math:`(*)`, same shape as the input.
402
-
403
- Examples
404
- --------
405
- .. code-block:: python
406
-
407
- >>> import brainstate.nn as nn
408
- >>> import brainstate
409
- >>> m = nn.SiLU()
410
- >>> x = brainstate.random.randn(2)
411
- >>> output = m(x)
412
- """
413
- __module__ = 'brainstate.nn'
414
-
415
- def __call__(self, x: ArrayLike) -> ArrayLike:
416
- return F.silu(x)
417
-
418
-
419
- class Mish(ElementWiseBlock):
420
- r"""Applies the Mish function, element-wise.
421
-
422
- Mish: A Self Regularized Non-Monotonic Neural Activation Function.
423
-
424
- .. math::
425
- \text{Mish}(x) = x * \text{Tanh}(\text{Softplus}(x))
426
-
427
- Notes
428
- -----
429
- See `Mish: A Self Regularized Non-Monotonic Neural Activation Function
430
- <https://arxiv.org/abs/1908.08681>`_
431
-
432
- Shape
433
- -----
434
- - Input: :math:`(*)`, where :math:`*` means any number of dimensions.
435
- - Output: :math:`(*)`, same shape as the input.
436
-
437
- Examples
438
- --------
439
- .. code-block:: python
440
-
441
- >>> import brainstate.nn as nn
442
- >>> import brainstate
443
- >>> m = nn.Mish()
444
- >>> x = brainstate.random.randn(2)
445
- >>> output = m(x)
446
- """
447
- __module__ = 'brainstate.nn'
448
-
449
- def __call__(self, x: ArrayLike) -> ArrayLike:
450
- return F.mish(x)
451
-
452
-
453
- class Hardswish(ElementWiseBlock):
454
- r"""Applies the Hardswish function, element-wise.
455
-
456
- As described in the paper `Searching for MobileNetV3
457
- <https://arxiv.org/abs/1905.02244>`_.
458
-
459
- Hardswish is defined as:
460
-
461
- .. math::
462
- \text{Hardswish}(x) = \begin{cases}
463
- 0 & \text{if~} x \le -3, \\
464
- x & \text{if~} x \ge +3, \\
465
- x \cdot (x + 3) /6 & \text{otherwise}
466
- \end{cases}
467
-
468
- Shape
469
- -----
470
- - Input: :math:`(*)`, where :math:`*` means any number of dimensions.
471
- - Output: :math:`(*)`, same shape as the input.
472
-
473
- Examples
474
- --------
475
- .. code-block:: python
476
-
477
- >>> import brainstate.nn as nn
478
- >>> import brainstate
479
- >>> m = nn.Hardswish()
480
- >>> x = brainstate.random.randn(2)
481
- >>> output = m(x)
482
- """
483
- __module__ = 'brainstate.nn'
484
-
485
- def __call__(self, x: ArrayLike) -> ArrayLike:
486
- return F.hard_swish(x)
487
-
488
-
489
- class ELU(ElementWiseBlock):
490
- r"""Applies the Exponential Linear Unit (ELU) function, element-wise.
491
-
492
- As described in the paper: `Fast and Accurate Deep Network Learning by
493
- Exponential Linear Units (ELUs) <https://arxiv.org/abs/1511.07289>`__.
494
-
495
- ELU is defined as:
496
-
497
- .. math::
498
- \text{ELU}(x) = \begin{cases}
499
- x, & \text{ if } x > 0\\
500
- \alpha * (\exp(x) - 1), & \text{ if } x \leq 0
501
- \end{cases}
502
-
503
- Parameters
504
- ----------
505
- alpha : float, optional
506
- The :math:`\alpha` value for the ELU formulation. Default: 1.0
507
-
508
- Shape
509
- -----
510
- - Input: :math:`(*)`, where :math:`*` means any number of dimensions.
511
- - Output: :math:`(*)`, same shape as the input.
512
-
513
- Examples
514
- --------
515
- .. code-block:: python
516
-
517
- >>> import brainstate.nn as nn
518
- >>> import brainstate
519
- >>> m = nn.ELU()
520
- >>> x = brainstate.random.randn(2)
521
- >>> output = m(x)
522
- """
523
- __module__ = 'brainstate.nn'
524
- alpha: float
525
-
526
- def __init__(self, alpha: float = 1.) -> None:
527
- super().__init__()
528
- self.alpha = alpha
529
-
530
- def __call__(self, x: ArrayLike) -> ArrayLike:
531
- return F.elu(x, self.alpha)
532
-
533
- def extra_repr(self) -> str:
534
- return f'{self.__class__.__name__}(alpha={self.alpha})'
535
-
536
-
537
- class CELU(ElementWiseBlock):
538
- r"""Applies the element-wise function.
539
-
540
- .. math::
541
- \text{CELU}(x) = \max(0,x) + \min(0, \alpha * (\exp(x/\alpha) - 1))
542
-
543
- More details can be found in the paper `Continuously Differentiable Exponential
544
- Linear Units`_ .
545
-
546
- Parameters
547
- ----------
548
- alpha : float, optional
549
- The :math:`\alpha` value for the CELU formulation. Default: 1.0
550
-
551
- Shape
552
- -----
553
- - Input: :math:`(*)`, where :math:`*` means any number of dimensions.
554
- - Output: :math:`(*)`, same shape as the input.
555
-
556
- References
557
- ----------
558
- .. _`Continuously Differentiable Exponential Linear Units`:
559
- https://arxiv.org/abs/1704.07483
560
-
561
- Examples
562
- --------
563
- .. code-block:: python
564
-
565
- >>> import brainstate.nn as nn
566
- >>> import brainstate
567
- >>> m = nn.CELU()
568
- >>> x = brainstate.random.randn(2)
569
- >>> output = m(x)
570
- """
571
- __module__ = 'brainstate.nn'
572
- alpha: float
573
-
574
- def __init__(self, alpha: float = 1.) -> None:
575
- super().__init__()
576
- self.alpha = alpha
577
-
578
- def __call__(self, x: ArrayLike) -> ArrayLike:
579
- return F.celu(x, self.alpha)
580
-
581
- def extra_repr(self) -> str:
582
- return f'{self.__class__.__name__}(alpha={self.alpha})'
583
-
584
-
585
- class SELU(ElementWiseBlock):
586
- r"""Applied element-wise.
587
-
588
- .. math::
589
- \text{SELU}(x) = \text{scale} * (\max(0,x) + \min(0, \alpha * (\exp(x) - 1)))
590
-
591
- with :math:`\alpha = 1.6732632423543772848170429916717` and
592
- :math:`\text{scale} = 1.0507009873554804934193349852946`.
593
-
594
- More details can be found in the paper `Self-Normalizing Neural Networks`_ .
595
-
596
- Shape
597
- -----
598
- - Input: :math:`(*)`, where :math:`*` means any number of dimensions.
599
- - Output: :math:`(*)`, same shape as the input.
600
-
601
- References
602
- ----------
603
- .. _Self-Normalizing Neural Networks: https://arxiv.org/abs/1706.02515
604
-
605
- Examples
606
- --------
607
- .. code-block:: python
608
-
609
- >>> import brainstate.nn as nn
610
- >>> import brainstate
611
- >>> m = nn.SELU()
612
- >>> x = brainstate.random.randn(2)
613
- >>> output = m(x)
614
- """
615
- __module__ = 'brainstate.nn'
616
-
617
- def __call__(self, x: ArrayLike) -> ArrayLike:
618
- return F.selu(x)
619
-
620
-
621
- class GLU(ElementWiseBlock):
622
- r"""Applies the gated linear unit function.
623
-
624
- .. math::
625
- {GLU}(a, b)= a \otimes \sigma(b)
626
-
627
- where :math:`a` is the first half of the input matrices and :math:`b` is
628
- the second half.
629
-
630
- Parameters
631
- ----------
632
- dim : int, optional
633
- The dimension on which to split the input. Default: -1
634
-
635
- Shape
636
- -----
637
- - Input: :math:`(\ast_1, N, \ast_2)` where `*` means, any number of additional
638
- dimensions
639
- - Output: :math:`(\ast_1, M, \ast_2)` where :math:`M=N/2`
640
-
641
- Examples
642
- --------
643
- .. code-block:: python
644
-
645
- >>> import brainstate.nn as nn
646
- >>> import brainstate
647
- >>> m = nn.GLU()
648
- >>> x = brainstate.random.randn(4, 2)
649
- >>> output = m(x)
650
- """
651
- __module__ = 'brainstate.nn'
652
- dim: int
653
-
654
- def __init__(self, dim: int = -1) -> None:
655
- super().__init__()
656
- self.dim = dim
657
-
658
- def __call__(self, x: ArrayLike) -> ArrayLike:
659
- return F.glu(x, self.dim)
660
-
661
- def __repr__(self):
662
- return f'{self.__class__.__name__}(dim={self.dim})'
663
-
664
-
665
- class GELU(ElementWiseBlock):
666
- r"""Applies the Gaussian Error Linear Units function.
667
-
668
- .. math:: \text{GELU}(x) = x * \Phi(x)
669
-
670
- where :math:`\Phi(x)` is the Cumulative Distribution Function for Gaussian
671
- Distribution.
672
-
673
- When the approximate argument is True, Gelu is estimated with:
674
-
675
- .. math:: \text{GELU}(x) = 0.5 * x * (1 + \text{Tanh}(\sqrt(2 / \pi) * (x + 0.044715 * x^3)))
676
-
677
- Parameters
678
- ----------
679
- approximate : bool, optional
680
- Whether to use the tanh approximation algorithm. Default: False
681
-
682
- Shape
683
- -----
684
- - Input: :math:`(*)`, where :math:`*` means any number of dimensions.
685
- - Output: :math:`(*)`, same shape as the input.
686
-
687
- Examples
688
- --------
689
- .. code-block:: python
690
-
691
- >>> import brainstate.nn as nn
692
- >>> import brainstate
693
- >>> m = nn.GELU()
694
- >>> x = brainstate.random.randn(2)
695
- >>> output = m(x)
696
- """
697
- __module__ = 'brainstate.nn'
698
- approximate: bool
699
-
700
- def __init__(self, approximate: bool = False) -> None:
701
- super().__init__()
702
- self.approximate = approximate
703
-
704
- def __call__(self, x: ArrayLike) -> ArrayLike:
705
- return F.gelu(x, approximate=self.approximate)
706
-
707
- def __repr__(self):
708
- return f'{self.__class__.__name__}(approximate={self.approximate})'
709
-
710
-
711
- class Hardshrink(ElementWiseBlock):
712
- r"""Applies the Hard Shrinkage (Hardshrink) function element-wise.
713
-
714
- Hardshrink is defined as:
715
-
716
- .. math::
717
- \text{HardShrink}(x) =
718
- \begin{cases}
719
- x, & \text{ if } x > \lambda \\
720
- x, & \text{ if } x < -\lambda \\
721
- 0, & \text{ otherwise }
722
- \end{cases}
723
-
724
- Parameters
725
- ----------
726
- lambd : float, optional
727
- The :math:`\lambda` value for the Hardshrink formulation. Default: 0.5
728
-
729
- Shape
730
- -----
731
- - Input: :math:`(*)`, where :math:`*` means any number of dimensions.
732
- - Output: :math:`(*)`, same shape as the input.
733
-
734
- Examples
735
- --------
736
- .. code-block:: python
737
-
738
- >>> import brainstate.nn as nn
739
- >>> import brainstate
740
- >>> m = nn.Hardshrink()
741
- >>> x = brainstate.random.randn(2)
742
- >>> output = m(x)
743
- """
744
- __module__ = 'brainstate.nn'
745
- lambd: float
746
-
747
- def __init__(self, lambd: float = 0.5) -> None:
748
- super().__init__()
749
- self.lambd = lambd
750
-
751
- def __call__(self, x: ArrayLike) -> ArrayLike:
752
- return F.hard_shrink(x, self.lambd)
753
-
754
- def __repr__(self):
755
- return f'{self.__class__.__name__}(lambd={self.lambd})'
756
-
757
-
758
- class LeakyReLU(ElementWiseBlock):
759
- r"""Applies the element-wise function.
760
-
761
- .. math::
762
- \text{LeakyReLU}(x) = \max(0, x) + \text{negative\_slope} * \min(0, x)
763
-
764
- or
765
-
766
- .. math::
767
- \text{LeakyReLU}(x) =
768
- \begin{cases}
769
- x, & \text{ if } x \geq 0 \\
770
- \text{negative\_slope} \times x, & \text{ otherwise }
771
- \end{cases}
772
-
773
- Parameters
774
- ----------
775
- negative_slope : float, optional
776
- Controls the angle of the negative slope (which is used for
777
- negative input values). Default: 1e-2
778
-
779
- Shape
780
- -----
781
- - Input: :math:`(*)` where `*` means, any number of additional
782
- dimensions
783
- - Output: :math:`(*)`, same shape as the input
784
-
785
- Examples
786
- --------
787
- .. code-block:: python
788
-
789
- >>> import brainstate.nn as nn
790
- >>> import brainstate
791
- >>> m = nn.LeakyReLU(0.1)
792
- >>> x = brainstate.random.randn(2)
793
- >>> output = m(x)
794
- """
795
- __module__ = 'brainstate.nn'
796
- negative_slope: float
797
-
798
- def __init__(self, negative_slope: float = 1e-2) -> None:
799
- super().__init__()
800
- self.negative_slope = negative_slope
801
-
802
- def __call__(self, x: ArrayLike) -> ArrayLike:
803
- return F.leaky_relu(x, self.negative_slope)
804
-
805
- def __repr__(self):
806
- return f'{self.__class__.__name__}(negative_slope={self.negative_slope})'
807
-
808
-
809
- class LogSigmoid(ElementWiseBlock):
810
- r"""Applies the element-wise function.
811
-
812
- .. math::
813
- \text{LogSigmoid}(x) = \log\left(\frac{ 1 }{ 1 + \exp(-x)}\right)
814
-
815
- Shape
816
- -----
817
- - Input: :math:`(*)`, where :math:`*` means any number of dimensions.
818
- - Output: :math:`(*)`, same shape as the input.
819
-
820
- Examples
821
- --------
822
- .. code-block:: python
823
-
824
- >>> import brainstate.nn as nn
825
- >>> import brainstate
826
- >>> m = nn.LogSigmoid()
827
- >>> x = brainstate.random.randn(2)
828
- >>> output = m(x)
829
- """
830
- __module__ = 'brainstate.nn'
831
-
832
- def __call__(self, x: ArrayLike) -> ArrayLike:
833
- return F.log_sigmoid(x)
834
-
835
-
836
- class Softplus(ElementWiseBlock):
837
- r"""Applies the Softplus function element-wise.
838
-
839
- .. math::
840
- \text{Softplus}(x) = \frac{1}{\beta} * \log(1 + \exp(\beta * x))
841
-
842
- SoftPlus is a smooth approximation to the ReLU function and can be used
843
- to constrain the output of a machine to always be positive.
844
-
845
- For numerical stability the implementation reverts to the linear function
846
- when :math:`input \times \beta > threshold`.
847
-
848
- Shape
849
- -----
850
- - Input: :math:`(*)`, where :math:`*` means any number of dimensions.
851
- - Output: :math:`(*)`, same shape as the input.
852
-
853
- Examples
854
- --------
855
- .. code-block:: python
856
-
857
- >>> import brainstate.nn as nn
858
- >>> import brainstate
859
- >>> m = nn.Softplus()
860
- >>> x = brainstate.random.randn(2)
861
- >>> output = m(x)
862
- """
863
- __module__ = 'brainstate.nn'
864
-
865
- def __call__(self, x: ArrayLike) -> ArrayLike:
866
- return F.softplus(x)
867
-
868
-
869
- class Softshrink(ElementWiseBlock):
870
- r"""Applies the soft shrinkage function elementwise.
871
-
872
- .. math::
873
- \text{SoftShrinkage}(x) =
874
- \begin{cases}
875
- x - \lambda, & \text{ if } x > \lambda \\
876
- x + \lambda, & \text{ if } x < -\lambda \\
877
- 0, & \text{ otherwise }
878
- \end{cases}
879
-
880
- Parameters
881
- ----------
882
- lambd : float, optional
883
- The :math:`\lambda` (must be no less than zero) value for the
884
- Softshrink formulation. Default: 0.5
885
-
886
- Shape
887
- -----
888
- - Input: :math:`(*)`, where :math:`*` means any number of dimensions.
889
- - Output: :math:`(*)`, same shape as the input.
890
-
891
- Examples
892
- --------
893
- .. code-block:: python
894
-
895
- >>> import brainstate.nn as nn
896
- >>> import brainstate
897
- >>> m = nn.Softshrink()
898
- >>> x = brainstate.random.randn(2)
899
- >>> output = m(x)
900
- """
901
- __module__ = 'brainstate.nn'
902
- lambd: float
903
-
904
- def __init__(self, lambd: float = 0.5) -> None:
905
- super().__init__()
906
- self.lambd = lambd
907
-
908
- def __call__(self, x: ArrayLike) -> ArrayLike:
909
- return F.soft_shrink(x, self.lambd)
910
-
911
- def __repr__(self):
912
- return f'{self.__class__.__name__}(lambd={self.lambd})'
913
-
914
-
915
- class PReLU(ElementWiseBlock):
916
- r"""Applies the element-wise function.
917
-
918
- .. math::
919
- \text{PReLU}(x) = \max(0,x) + a * \min(0,x)
920
-
921
- or
922
-
923
- .. math::
924
- \text{PReLU}(x) =
925
- \begin{cases}
926
- x, & \text{ if } x \geq 0 \\
927
- ax, & \text{ otherwise }
928
- \end{cases}
929
-
930
- Here :math:`a` is a learnable parameter. When called without arguments,
931
- `nn.PReLU()` uses a single parameter :math:`a` across all input channels.
932
- If called with `nn.PReLU(nChannels)`, a separate :math:`a` is used for
933
- each input channel.
934
-
935
- Parameters
936
- ----------
937
- num_parameters : int, optional
938
- Number of :math:`a` to learn. Although it takes an int as input,
939
- only two values are legitimate: 1, or the number of channels
940
- at input. Default: 1
941
- init : float, optional
942
- The initial value of :math:`a`. Default: 0.25
943
- dtype : optional
944
- The data type for the weight parameter.
945
-
946
- Shape
947
- -----
948
- - Input: :math:`( *)` where `*` means, any number of additional dimensions.
949
- - Output: :math:`(*)`, same shape as the input.
950
-
951
- Attributes
952
- ----------
953
- weight : Tensor
954
- The learnable weights of shape (:attr:`num_parameters`).
955
-
956
- Notes
957
- -----
958
- - Weight decay should not be used when learning :math:`a` for good performance.
959
- - Channel dim is the 2nd dim of input. When input has dims < 2, then there is
960
- no channel dim and the number of channels = 1.
961
-
962
- Examples
963
- --------
964
- .. code-block:: python
965
-
966
- >>> import brainstate
967
- >>> m = brainstate.nn.PReLU()
968
- >>> x = brainstate.random.randn(2)
969
- >>> output = m(x)
970
- """
971
- __module__ = 'brainstate.nn'
972
- num_parameters: int
973
-
974
- def __init__(self, num_parameters: int = 1, init: float = 0.25, dtype=None) -> None:
975
- super().__init__()
976
- self.num_parameters = num_parameters
977
- self.weight = ParamState(jnp.ones(num_parameters, dtype=dtype) * init)
978
-
979
- def __call__(self, x: ArrayLike) -> ArrayLike:
980
- return F.prelu(x, self.weight.value)
981
-
982
- def __repr__(self):
983
- return f'{self.__class__.__name__}(num_parameters={self.num_parameters})'
984
-
985
-
986
- class Softsign(ElementWiseBlock):
987
- r"""Applies the element-wise function.
988
-
989
- .. math::
990
- \text{SoftSign}(x) = \frac{x}{ 1 + |x|}
991
-
992
- Shape
993
- -----
994
- - Input: :math:`(*)`, where :math:`*` means any number of dimensions.
995
- - Output: :math:`(*)`, same shape as the input.
996
-
997
- Examples
998
- --------
999
- .. code-block:: python
1000
-
1001
- >>> import brainstate.nn as nn
1002
- >>> import brainstate
1003
- >>> m = nn.Softsign()
1004
- >>> x = brainstate.random.randn(2)
1005
- >>> output = m(x)
1006
- """
1007
- __module__ = 'brainstate.nn'
1008
-
1009
- def __call__(self, x: ArrayLike) -> ArrayLike:
1010
- return F.soft_sign(x)
1011
-
1012
-
1013
- class Tanhshrink(ElementWiseBlock):
1014
- r"""Applies the element-wise function.
1015
-
1016
- .. math::
1017
- \text{Tanhshrink}(x) = x - \tanh(x)
1018
-
1019
- Shape
1020
- -----
1021
- - Input: :math:`(*)`, where :math:`*` means any number of dimensions.
1022
- - Output: :math:`(*)`, same shape as the input.
1023
-
1024
- Examples
1025
- --------
1026
- .. code-block:: python
1027
-
1028
- >>> import brainstate.nn as nn
1029
- >>> import brainstate
1030
- >>> m = nn.Tanhshrink()
1031
- >>> x = brainstate.random.randn(2)
1032
- >>> output = m(x)
1033
- """
1034
- __module__ = 'brainstate.nn'
1035
-
1036
- def __call__(self, x: ArrayLike) -> ArrayLike:
1037
- return F.tanh_shrink(x)
1038
-
1039
-
1040
- class Softmin(ElementWiseBlock):
1041
- r"""Applies the Softmin function to an n-dimensional input Tensor.
1042
-
1043
- Rescales the input so that the elements of the n-dimensional output Tensor
1044
- lie in the range `[0, 1]` and sum to 1.
1045
-
1046
- Softmin is defined as:
1047
-
1048
- .. math::
1049
- \text{Softmin}(x_{i}) = \frac{\exp(-x_i)}{\sum_j \exp(-x_j)}
1050
-
1051
- Parameters
1052
- ----------
1053
- dim : int, optional
1054
- A dimension along which Softmin will be computed (so every slice
1055
- along dim will sum to 1).
1056
-
1057
- Shape
1058
- -----
1059
- - Input: :math:`(*)` where `*` means, any number of additional dimensions
1060
- - Output: :math:`(*)`, same shape as the input
1061
-
1062
- Returns
1063
- -------
1064
- Tensor
1065
- A Tensor of the same dimension and shape as the input, with
1066
- values in the range [0, 1]
1067
-
1068
- Examples
1069
- --------
1070
- .. code-block:: python
1071
-
1072
- >>> import brainstate.nn as nn
1073
- >>> import brainstate
1074
- >>> m = nn.Softmin(dim=1)
1075
- >>> x = brainstate.random.randn(2, 3)
1076
- >>> output = m(x)
1077
- """
1078
- __module__ = 'brainstate.nn'
1079
- dim: Optional[int]
1080
-
1081
- def __init__(self, dim: Optional[int] = None) -> None:
1082
- super().__init__()
1083
- self.dim = dim
1084
-
1085
- def __call__(self, x: ArrayLike) -> ArrayLike:
1086
- return F.softmin(x, self.dim)
1087
-
1088
- def __repr__(self):
1089
- return f'{self.__class__.__name__}(dim={self.dim})'
1090
-
1091
-
1092
- class Softmax(ElementWiseBlock):
1093
- r"""Applies the Softmax function to an n-dimensional input Tensor.
1094
-
1095
- Rescales the input so that the elements of the n-dimensional output Tensor
1096
- lie in the range [0,1] and sum to 1.
1097
-
1098
- Softmax is defined as:
1099
-
1100
- .. math::
1101
- \text{Softmax}(x_{i}) = \frac{\exp(x_i)}{\sum_j \exp(x_j)}
1102
-
1103
- When the input Tensor is a sparse tensor then the unspecified
1104
- values are treated as ``-inf``.
1105
-
1106
- Parameters
1107
- ----------
1108
- dim : int, optional
1109
- A dimension along which Softmax will be computed (so every slice
1110
- along dim will sum to 1).
1111
-
1112
- Shape
1113
- -----
1114
- - Input: :math:`(*)` where `*` means, any number of additional dimensions
1115
- - Output: :math:`(*)`, same shape as the input
1116
-
1117
- Returns
1118
- -------
1119
- Tensor
1120
- A Tensor of the same dimension and shape as the input with
1121
- values in the range [0, 1]
1122
-
1123
- Notes
1124
- -----
1125
- This module doesn't work directly with NLLLoss, which expects the Log to be
1126
- computed between the Softmax and itself. Use `LogSoftmax` instead (it's
1127
- faster and has better numerical properties).
1128
-
1129
- Examples
1130
- --------
1131
- .. code-block:: python
1132
-
1133
- >>> import brainstate.nn as nn
1134
- >>> import brainstate
1135
- >>> m = nn.Softmax(dim=1)
1136
- >>> x = brainstate.random.randn(2, 3)
1137
- >>> output = m(x)
1138
- """
1139
- __module__ = 'brainstate.nn'
1140
- dim: Optional[int]
1141
-
1142
- def __init__(self, dim: Optional[int] = None) -> None:
1143
- super().__init__()
1144
- self.dim = dim
1145
-
1146
- def __call__(self, x: ArrayLike) -> ArrayLike:
1147
- return F.softmax(x, self.dim)
1148
-
1149
- def __repr__(self):
1150
- return f'{self.__class__.__name__}(dim={self.dim})'
1151
-
1152
-
1153
- class Softmax2d(ElementWiseBlock):
1154
- r"""Applies SoftMax over features to each spatial location.
1155
-
1156
- When given an image of ``Channels x Height x Width``, it will
1157
- apply `Softmax` to each location :math:`(Channels, h_i, w_j)`
1158
-
1159
- Shape
1160
- -----
1161
- - Input: :math:`(N, C, H, W)` or :math:`(C, H, W)`.
1162
- - Output: :math:`(N, C, H, W)` or :math:`(C, H, W)` (same shape as input)
1163
-
1164
- Returns
1165
- -------
1166
- Tensor
1167
- A Tensor of the same dimension and shape as the input with
1168
- values in the range [0, 1]
1169
-
1170
- Examples
1171
- --------
1172
- .. code-block:: python
1173
-
1174
- >>> import brainstate.nn as nn
1175
- >>> import brainstate
1176
- >>> m = nn.Softmax2d()
1177
- >>> # softmax is applied over the 2nd dimension (channels)
1178
- >>> x = brainstate.random.randn(2, 3, 12, 13)
1179
- >>> output = m(x)
1180
- """
1181
- __module__ = 'brainstate.nn'
1182
-
1183
- def __call__(self, x: ArrayLike) -> ArrayLike:
1184
- assert x.ndim == 4 or x.ndim == 3, 'Softmax2d requires a 3D or 4D tensor as input'
1185
- return F.softmax(x, -3)
1186
-
1187
-
1188
- class LogSoftmax(ElementWiseBlock):
1189
- r"""Applies the :math:`\log(\text{Softmax}(x))` function to an n-dimensional input Tensor.
1190
-
1191
- The LogSoftmax formulation can be simplified as:
1192
-
1193
- .. math::
1194
- \text{LogSoftmax}(x_{i}) = \log\left(\frac{\exp(x_i) }{ \sum_j \exp(x_j)} \right)
1195
-
1196
- Parameters
1197
- ----------
1198
- dim : int, optional
1199
- A dimension along which LogSoftmax will be computed.
1200
-
1201
- Shape
1202
- -----
1203
- - Input: :math:`(*)` where `*` means, any number of additional dimensions
1204
- - Output: :math:`(*)`, same shape as the input
1205
-
1206
- Returns
1207
- -------
1208
- Tensor
1209
- A Tensor of the same dimension and shape as the input with
1210
- values in the range [-inf, 0)
1211
-
1212
- Examples
1213
- --------
1214
- .. code-block:: python
1215
-
1216
- >>> import brainstate.nn as nn
1217
- >>> import brainstate
1218
- >>> m = nn.LogSoftmax(dim=1)
1219
- >>> x = brainstate.random.randn(2, 3)
1220
- >>> output = m(x)
1221
- """
1222
- __module__ = 'brainstate.nn'
1223
- dim: Optional[int]
1224
-
1225
- def __init__(self, dim: Optional[int] = None) -> None:
1226
- super().__init__()
1227
- self.dim = dim
1228
-
1229
- def __call__(self, x: ArrayLike) -> ArrayLike:
1230
- return F.log_softmax(x, self.dim)
1231
-
1232
- def __repr__(self):
1233
- return f'{self.__class__.__name__}(dim={self.dim})'
1234
-
1235
-
1236
- class Identity(ElementWiseBlock):
1237
- r"""A placeholder identity operator that is argument-insensitive.
1238
-
1239
- Examples
1240
- --------
1241
- .. code-block:: python
1242
-
1243
- >>> import brainstate.nn as nn
1244
- >>> m = nn.Identity()
1245
- >>> x = brainstate.random.randn(2, 3)
1246
- >>> output = m(x)
1247
- >>> assert (output == x).all()
1248
- """
1249
- __module__ = 'brainstate.nn'
1250
-
1251
- def __call__(self, x):
1252
- return x
1253
-
1254
-
1255
- class SpikeBitwise(ElementWiseBlock):
1256
- r"""Bitwise addition for the spiking inputs.
1257
-
1258
- .. math::
1259
-
1260
- \begin{array}{ccc}
1261
- \hline \text { Mode } & \text { Expression for } \mathrm{g}(\mathrm{x}, \mathrm{y}) & \text { Code for } \mathrm{g}(\mathrm{x}, \mathrm{y}) \\
1262
- \hline \text { ADD } & x+y & x+y \\
1263
- \text { AND } & x \cap y & x \cdot y \\
1264
- \text { IAND } & (\neg x) \cap y & (1-x) \cdot y \\
1265
- \text { OR } & x \cup y & (x+y)-(x \cdot y) \\
1266
- \hline
1267
- \end{array}
1268
-
1269
- Parameters
1270
- ----------
1271
- op : str, optional
1272
- The bitwise operation. Default: 'add'
1273
- name : str, optional
1274
- The name of the dynamic system.
1275
-
1276
- Examples
1277
- --------
1278
- .. code-block:: python
1279
-
1280
- >>> import brainstate.nn as nn
1281
- >>> m = nn.SpikeBitwise(op='and')
1282
- >>> x = brainstate.random.randn(2, 3) > 0
1283
- >>> y = brainstate.random.randn(2, 3) > 0
1284
- >>> output = m(x, y)
1285
- """
1286
- __module__ = 'brainstate.nn'
1287
-
1288
- def __init__(
1289
- self,
1290
- op: str = 'add',
1291
- name: Optional[str] = None
1292
- ) -> None:
1293
- super().__init__(name=name)
1294
- self.op = op
1295
-
1296
- def __call__(self, x, y):
1297
- import braintools
1298
- return braintools.spike_bitwise(x, y, self.op)
1
+ # Copyright 2024 BrainX Ecosystem Limited. All Rights Reserved.
2
+ #
3
+ # Licensed under the Apache License, Version 2.0 (the "License");
4
+ # you may not use this file except in compliance with the License.
5
+ # You may obtain a copy of the License at
6
+ #
7
+ # http://www.apache.org/licenses/LICENSE-2.0
8
+ #
9
+ # Unless required by applicable law or agreed to in writing, software
10
+ # distributed under the License is distributed on an "AS IS" BASIS,
11
+ # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12
+ # See the License for the specific language governing permissions and
13
+ # limitations under the License.
14
+ # ==============================================================================
15
+
16
+ # -*- coding: utf-8 -*-
17
+
18
+ from typing import Optional
19
+
20
+ import brainunit as u
21
+ import jax.numpy as jnp
22
+
23
+ from brainstate._state import ParamState
24
+ from brainstate.typing import ArrayLike
25
+ from . import _activations as F
26
+ from ._module import ElementWiseBlock
27
+
28
+ __all__ = [
29
+ # activation functions
30
+ 'Threshold', 'ReLU', 'RReLU', 'Hardtanh', 'ReLU6', 'Sigmoid', 'Hardsigmoid',
31
+ 'Tanh', 'SiLU', 'Mish', 'Hardswish', 'ELU', 'CELU', 'SELU', 'GLU', 'GELU',
32
+ 'Hardshrink', 'LeakyReLU', 'LogSigmoid', 'Softplus', 'Softshrink', 'PReLU',
33
+ 'Softsign', 'Tanhshrink', 'Softmin', 'Softmax', 'Softmax2d', 'LogSoftmax',
34
+
35
+ # others
36
+ 'Identity', 'SpikeBitwise',
37
+ ]
38
+
39
+
40
+ class Threshold(ElementWiseBlock):
41
+ r"""Thresholds each element of the input Tensor.
42
+
43
+ Threshold is defined as:
44
+
45
+ .. math::
46
+ y =
47
+ \begin{cases}
48
+ x, &\text{ if } x > \text{threshold} \\
49
+ \text{value}, &\text{ otherwise }
50
+ \end{cases}
51
+
52
+ Parameters
53
+ ----------
54
+ threshold : float
55
+ The value to threshold at.
56
+ value : float
57
+ The value to replace with.
58
+
59
+ Shape
60
+ -----
61
+ - Input: :math:`(*)`, where :math:`*` means any number of dimensions.
62
+ - Output: :math:`(*)`, same shape as the input.
63
+
64
+ Examples
65
+ --------
66
+ .. code-block:: python
67
+
68
+ >>> import brainstate.nn as nn
69
+ >>> import brainstate
70
+ >>> m = nn.Threshold(0.1, 20)
71
+ >>> x = brainstate.random.randn(2)
72
+ >>> output = m(x)
73
+ """
74
+ __module__ = 'brainstate.nn'
75
+ threshold: float
76
+ value: float
77
+
78
+ def __init__(self, threshold: float, value: float) -> None:
79
+ super().__init__()
80
+ self.threshold = threshold
81
+ self.value = value
82
+
83
+ def __call__(self, x: ArrayLike) -> ArrayLike:
84
+ dtype = u.math.get_dtype(x)
85
+ return jnp.where(x > jnp.asarray(self.threshold, dtype=dtype),
86
+ x,
87
+ jnp.asarray(self.value, dtype=dtype))
88
+
89
+ def __repr__(self):
90
+ return f'{self.__class__.__name__}(threshold={self.threshold}, value={self.value})'
91
+
92
+
93
+ class ReLU(ElementWiseBlock):
94
+ r"""Applies the rectified linear unit function element-wise.
95
+
96
+ The ReLU function is defined as:
97
+
98
+ .. math::
99
+ \text{ReLU}(x) = (x)^+ = \max(0, x)
100
+
101
+ Shape
102
+ -----
103
+ - Input: :math:`(*)`, where :math:`*` means any number of dimensions.
104
+ - Output: :math:`(*)`, same shape as the input.
105
+
106
+ Examples
107
+ --------
108
+ .. code-block:: python
109
+
110
+ >>> import brainstate.nn as nn
111
+ >>> import brainstate
112
+ >>> m = nn.ReLU()
113
+ >>> x = brainstate.random.randn(2)
114
+ >>> output = m(x)
115
+
116
+ An implementation of CReLU - https://arxiv.org/abs/1603.05201
117
+
118
+ .. code-block:: python
119
+
120
+ >>> import brainstate.nn as nn
121
+ >>> import brainstate
122
+ >>> import jax.numpy as jnp
123
+ >>> m = nn.ReLU()
124
+ >>> x = jnp.expand_dims(brainstate.random.randn(2), 0)
125
+ >>> output = jnp.concat((m(x), m(-x)))
126
+ """
127
+ __module__ = 'brainstate.nn'
128
+
129
+ def __call__(self, x: ArrayLike) -> ArrayLike:
130
+ return F.relu(x)
131
+
132
+ def __repr__(self):
133
+ return f'{self.__class__.__name__}()'
134
+
135
+
136
+ class RReLU(ElementWiseBlock):
137
+ r"""Applies the randomized leaky rectified liner unit function, element-wise.
138
+
139
+ As described in the paper `Empirical Evaluation of Rectified Activations in
140
+ Convolutional Network`_.
141
+
142
+ The function is defined as:
143
+
144
+ .. math::
145
+ \text{RReLU}(x) =
146
+ \begin{cases}
147
+ x & \text{if } x \geq 0 \\
148
+ ax & \text{ otherwise }
149
+ \end{cases}
150
+
151
+ where :math:`a` is randomly sampled from uniform distribution
152
+ :math:`\mathcal{U}(\text{lower}, \text{upper})`.
153
+
154
+ Parameters
155
+ ----------
156
+ lower : float, optional
157
+ Lower bound of the uniform distribution. Default: :math:`\frac{1}{8}`
158
+ upper : float, optional
159
+ Upper bound of the uniform distribution. Default: :math:`\frac{1}{3}`
160
+
161
+ Shape
162
+ -----
163
+ - Input: :math:`(*)`, where :math:`*` means any number of dimensions.
164
+ - Output: :math:`(*)`, same shape as the input.
165
+
166
+ References
167
+ ----------
168
+ .. _`Empirical Evaluation of Rectified Activations in Convolutional Network`:
169
+ https://arxiv.org/abs/1505.00853
170
+
171
+ Examples
172
+ --------
173
+ .. code-block:: python
174
+
175
+ >>> import brainstate.nn as nn
176
+ >>> import brainstate
177
+ >>> m = nn.RReLU(0.1, 0.3)
178
+ >>> x = brainstate.random.randn(2)
179
+ >>> output = m(x)
180
+ """
181
+ __module__ = 'brainstate.nn'
182
+ lower: float
183
+ upper: float
184
+
185
+ def __init__(
186
+ self,
187
+ lower: float = 1. / 8,
188
+ upper: float = 1. / 3,
189
+ ):
190
+ super().__init__()
191
+ self.lower = lower
192
+ self.upper = upper
193
+
194
+ def __call__(self, x: ArrayLike) -> ArrayLike:
195
+ return F.rrelu(x, self.lower, self.upper)
196
+
197
+ def extra_repr(self):
198
+ return f'{self.__class__.__name__}(lower={self.lower}, upper={self.upper})'
199
+
200
+
201
+ class Hardtanh(ElementWiseBlock):
202
+ r"""Applies the HardTanh function element-wise.
203
+
204
+ HardTanh is defined as:
205
+
206
+ .. math::
207
+ \text{HardTanh}(x) = \begin{cases}
208
+ \text{max\_val} & \text{ if } x > \text{ max\_val } \\
209
+ \text{min\_val} & \text{ if } x < \text{ min\_val } \\
210
+ x & \text{ otherwise } \\
211
+ \end{cases}
212
+
213
+ Parameters
214
+ ----------
215
+ min_val : float, optional
216
+ Minimum value of the linear region range. Default: -1
217
+ max_val : float, optional
218
+ Maximum value of the linear region range. Default: 1
219
+
220
+ Notes
221
+ -----
222
+ Keyword arguments :attr:`min_value` and :attr:`max_value`
223
+ have been deprecated in favor of :attr:`min_val` and :attr:`max_val`.
224
+
225
+ Shape
226
+ -----
227
+ - Input: :math:`(*)`, where :math:`*` means any number of dimensions.
228
+ - Output: :math:`(*)`, same shape as the input.
229
+
230
+ Examples
231
+ --------
232
+ .. code-block:: python
233
+
234
+ >>> import brainstate.nn as nn
235
+ >>> import brainstate
236
+ >>> m = nn.Hardtanh(-2, 2)
237
+ >>> x = brainstate.random.randn(2)
238
+ >>> output = m(x)
239
+ """
240
+ __module__ = 'brainstate.nn'
241
+ min_val: float
242
+ max_val: float
243
+
244
+ def __init__(
245
+ self,
246
+ min_val: float = -1.,
247
+ max_val: float = 1.,
248
+ ) -> None:
249
+ super().__init__()
250
+ self.min_val = min_val
251
+ self.max_val = max_val
252
+ assert self.max_val > self.min_val
253
+
254
+ def __call__(self, x: ArrayLike) -> ArrayLike:
255
+ return F.hard_tanh(x, self.min_val, self.max_val)
256
+
257
+ def extra_repr(self) -> str:
258
+ return f'{self.__class__.__name__}(min_val={self.min_val}, max_val={self.max_val})'
259
+
260
+
261
+ class ReLU6(Hardtanh):
262
+ r"""Applies the element-wise function.
263
+
264
+ ReLU6 is defined as:
265
+
266
+ .. math::
267
+ \text{ReLU6}(x) = \min(\max(0,x), 6)
268
+
269
+ Shape
270
+ -----
271
+ - Input: :math:`(*)`, where :math:`*` means any number of dimensions.
272
+ - Output: :math:`(*)`, same shape as the input.
273
+
274
+ Examples
275
+ --------
276
+ .. code-block:: python
277
+
278
+ >>> import brainstate.nn as nn
279
+ >>> import brainstate
280
+ >>> m = nn.ReLU6()
281
+ >>> x = brainstate.random.randn(2)
282
+ >>> output = m(x)
283
+ """
284
+ __module__ = 'brainstate.nn'
285
+
286
+ def __init__(self):
287
+ super().__init__(0., 6.)
288
+
289
+
290
+ class Sigmoid(ElementWiseBlock):
291
+ r"""Applies the element-wise function.
292
+
293
+ Sigmoid is defined as:
294
+
295
+ .. math::
296
+ \text{Sigmoid}(x) = \sigma(x) = \frac{1}{1 + \exp(-x)}
297
+
298
+ Shape
299
+ -----
300
+ - Input: :math:`(*)`, where :math:`*` means any number of dimensions.
301
+ - Output: :math:`(*)`, same shape as the input.
302
+
303
+ Examples
304
+ --------
305
+ .. code-block:: python
306
+
307
+ >>> import brainstate.nn as nn
308
+ >>> import brainstate
309
+ >>> m = nn.Sigmoid()
310
+ >>> x = brainstate.random.randn(2)
311
+ >>> output = m(x)
312
+ """
313
+ __module__ = 'brainstate.nn'
314
+
315
+ def __call__(self, x: ArrayLike) -> ArrayLike:
316
+ return F.sigmoid(x)
317
+
318
+
319
+ class Hardsigmoid(ElementWiseBlock):
320
+ r"""Applies the Hardsigmoid function element-wise.
321
+
322
+ Hardsigmoid is defined as:
323
+
324
+ .. math::
325
+ \text{Hardsigmoid}(x) = \begin{cases}
326
+ 0 & \text{if~} x \le -3, \\
327
+ 1 & \text{if~} x \ge +3, \\
328
+ x / 6 + 1 / 2 & \text{otherwise}
329
+ \end{cases}
330
+
331
+ Shape
332
+ -----
333
+ - Input: :math:`(*)`, where :math:`*` means any number of dimensions.
334
+ - Output: :math:`(*)`, same shape as the input.
335
+
336
+ Examples
337
+ --------
338
+ .. code-block:: python
339
+
340
+ >>> import brainstate.nn as nn
341
+ >>> import brainstate
342
+ >>> m = nn.Hardsigmoid()
343
+ >>> x = brainstate.random.randn(2)
344
+ >>> output = m(x)
345
+ """
346
+ __module__ = 'brainstate.nn'
347
+
348
+ def __call__(self, x: ArrayLike) -> ArrayLike:
349
+ return F.hard_sigmoid(x)
350
+
351
+
352
+ class Tanh(ElementWiseBlock):
353
+ r"""Applies the Hyperbolic Tangent (Tanh) function element-wise.
354
+
355
+ Tanh is defined as:
356
+
357
+ .. math::
358
+ \text{Tanh}(x) = \tanh(x) = \frac{\exp(x) - \exp(-x)} {\exp(x) + \exp(-x)}
359
+
360
+ Shape
361
+ -----
362
+ - Input: :math:`(*)`, where :math:`*` means any number of dimensions.
363
+ - Output: :math:`(*)`, same shape as the input.
364
+
365
+ Examples
366
+ --------
367
+ .. code-block:: python
368
+
369
+ >>> import brainstate.nn as nn
370
+ >>> import brainstate
371
+ >>> m = nn.Tanh()
372
+ >>> x = brainstate.random.randn(2)
373
+ >>> output = m(x)
374
+ """
375
+ __module__ = 'brainstate.nn'
376
+
377
+ def __call__(self, x: ArrayLike) -> ArrayLike:
378
+ return F.tanh(x)
379
+
380
+
381
+ class SiLU(ElementWiseBlock):
382
+ r"""Applies the Sigmoid Linear Unit (SiLU) function, element-wise.
383
+
384
+ The SiLU function is also known as the swish function.
385
+
386
+ .. math::
387
+ \text{silu}(x) = x * \sigma(x), \text{where } \sigma(x) \text{ is the logistic sigmoid.}
388
+
389
+ Notes
390
+ -----
391
+ See `Gaussian Error Linear Units (GELUs) <https://arxiv.org/abs/1606.08415>`_
392
+ where the SiLU (Sigmoid Linear Unit) was originally coined, and see
393
+ `Sigmoid-Weighted Linear Units for Neural Network Function Approximation
394
+ in Reinforcement Learning <https://arxiv.org/abs/1702.03118>`_ and `Swish:
395
+ a Self-Gated Activation Function <https://arxiv.org/abs/1710.05941v1>`_
396
+ where the SiLU was experimented with later.
397
+
398
+ Shape
399
+ -----
400
+ - Input: :math:`(*)`, where :math:`*` means any number of dimensions.
401
+ - Output: :math:`(*)`, same shape as the input.
402
+
403
+ Examples
404
+ --------
405
+ .. code-block:: python
406
+
407
+ >>> import brainstate.nn as nn
408
+ >>> import brainstate
409
+ >>> m = nn.SiLU()
410
+ >>> x = brainstate.random.randn(2)
411
+ >>> output = m(x)
412
+ """
413
+ __module__ = 'brainstate.nn'
414
+
415
+ def __call__(self, x: ArrayLike) -> ArrayLike:
416
+ return F.silu(x)
417
+
418
+
419
+ class Mish(ElementWiseBlock):
420
+ r"""Applies the Mish function, element-wise.
421
+
422
+ Mish: A Self Regularized Non-Monotonic Neural Activation Function.
423
+
424
+ .. math::
425
+ \text{Mish}(x) = x * \text{Tanh}(\text{Softplus}(x))
426
+
427
+ Notes
428
+ -----
429
+ See `Mish: A Self Regularized Non-Monotonic Neural Activation Function
430
+ <https://arxiv.org/abs/1908.08681>`_
431
+
432
+ Shape
433
+ -----
434
+ - Input: :math:`(*)`, where :math:`*` means any number of dimensions.
435
+ - Output: :math:`(*)`, same shape as the input.
436
+
437
+ Examples
438
+ --------
439
+ .. code-block:: python
440
+
441
+ >>> import brainstate.nn as nn
442
+ >>> import brainstate
443
+ >>> m = nn.Mish()
444
+ >>> x = brainstate.random.randn(2)
445
+ >>> output = m(x)
446
+ """
447
+ __module__ = 'brainstate.nn'
448
+
449
+ def __call__(self, x: ArrayLike) -> ArrayLike:
450
+ return F.mish(x)
451
+
452
+
453
+ class Hardswish(ElementWiseBlock):
454
+ r"""Applies the Hardswish function, element-wise.
455
+
456
+ As described in the paper `Searching for MobileNetV3
457
+ <https://arxiv.org/abs/1905.02244>`_.
458
+
459
+ Hardswish is defined as:
460
+
461
+ .. math::
462
+ \text{Hardswish}(x) = \begin{cases}
463
+ 0 & \text{if~} x \le -3, \\
464
+ x & \text{if~} x \ge +3, \\
465
+ x \cdot (x + 3) /6 & \text{otherwise}
466
+ \end{cases}
467
+
468
+ Shape
469
+ -----
470
+ - Input: :math:`(*)`, where :math:`*` means any number of dimensions.
471
+ - Output: :math:`(*)`, same shape as the input.
472
+
473
+ Examples
474
+ --------
475
+ .. code-block:: python
476
+
477
+ >>> import brainstate.nn as nn
478
+ >>> import brainstate
479
+ >>> m = nn.Hardswish()
480
+ >>> x = brainstate.random.randn(2)
481
+ >>> output = m(x)
482
+ """
483
+ __module__ = 'brainstate.nn'
484
+
485
+ def __call__(self, x: ArrayLike) -> ArrayLike:
486
+ return F.hard_swish(x)
487
+
488
+
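The piecewise definition above can be verified directly on a few sample points; this is an
illustrative sketch assuming ``jax.numpy`` is available alongside ``brainstate``:

.. code-block:: python

    >>> import jax.numpy as jnp
    >>> import brainstate
    >>> x = jnp.array([-4.0, -3.0, -1.0, 0.0, 1.0, 3.0, 4.0])
    >>> # 0 for x <= -3, x for x >= 3, x * (x + 3) / 6 otherwise
    >>> manual = jnp.where(x <= -3, 0.0, jnp.where(x >= 3, x, x * (x + 3) / 6))
    >>> assert jnp.allclose(brainstate.nn.Hardswish()(x), manual, atol=1e-6)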
489
+ class ELU(ElementWiseBlock):
490
+ r"""Applies the Exponential Linear Unit (ELU) function, element-wise.
491
+
492
+ As described in the paper: `Fast and Accurate Deep Network Learning by
493
+ Exponential Linear Units (ELUs) <https://arxiv.org/abs/1511.07289>`__.
494
+
495
+ ELU is defined as:
496
+
497
+ .. math::
498
+ \text{ELU}(x) = \begin{cases}
499
+ x, & \text{ if } x > 0\\
500
+ \alpha * (\exp(x) - 1), & \text{ if } x \leq 0
501
+ \end{cases}
502
+
503
+ Parameters
504
+ ----------
505
+ alpha : float, optional
506
+ The :math:`\alpha` value for the ELU formulation. Default: 1.0
507
+
508
+ Shape
509
+ -----
510
+ - Input: :math:`(*)`, where :math:`*` means any number of dimensions.
511
+ - Output: :math:`(*)`, same shape as the input.
512
+
513
+ Examples
514
+ --------
515
+ .. code-block:: python
516
+
517
+ >>> import brainstate.nn as nn
518
+ >>> import brainstate
519
+ >>> m = nn.ELU()
520
+ >>> x = brainstate.random.randn(2)
521
+ >>> output = m(x)
522
+ """
523
+ __module__ = 'brainstate.nn'
524
+ alpha: float
525
+
526
+ def __init__(self, alpha: float = 1.) -> None:
527
+ super().__init__()
528
+ self.alpha = alpha
529
+
530
+ def __call__(self, x: ArrayLike) -> ArrayLike:
531
+ return F.elu(x, self.alpha)
532
+
533
+ def extra_repr(self) -> str:
534
+ return f'{self.__class__.__name__}(alpha={self.alpha})'
535
+
536
+
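Only the negative branch of ELU is affected by ``alpha``; the sketch below (illustrative
only, assuming ``jax.numpy`` is available alongside ``brainstate``) checks the piecewise
formula for a few values of :math:`\alpha`:

.. code-block:: python

    >>> import jax.numpy as jnp
    >>> import brainstate
    >>> x = jnp.array([-2.0, -0.5, 0.0, 1.5])
    >>> for alpha in (0.5, 1.0, 2.0):
    ...     m = brainstate.nn.ELU(alpha=alpha)
    ...     manual = jnp.where(x > 0, x, alpha * (jnp.exp(x) - 1.0))
    ...     assert jnp.allclose(m(x), manual, atol=1e-6)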
537
+ class CELU(ElementWiseBlock):
538
+ r"""Applies the element-wise function.
539
+
540
+ .. math::
541
+ \text{CELU}(x) = \max(0,x) + \min(0, \alpha * (\exp(x/\alpha) - 1))
542
+
543
+ More details can be found in the paper `Continuously Differentiable Exponential
544
+ Linear Units`_ .
545
+
546
+ Parameters
547
+ ----------
548
+ alpha : float, optional
549
+ The :math:`\alpha` value for the CELU formulation. Default: 1.0
550
+
551
+ Shape
552
+ -----
553
+ - Input: :math:`(*)`, where :math:`*` means any number of dimensions.
554
+ - Output: :math:`(*)`, same shape as the input.
555
+
556
+ References
557
+ ----------
558
+ .. _`Continuously Differentiable Exponential Linear Units`:
559
+ https://arxiv.org/abs/1704.07483
560
+
561
+ Examples
562
+ --------
563
+ .. code-block:: python
564
+
565
+ >>> import brainstate.nn as nn
566
+ >>> import brainstate
567
+ >>> m = nn.CELU()
568
+ >>> x = brainstate.random.randn(2)
569
+ >>> output = m(x)
570
+ """
571
+ __module__ = 'brainstate.nn'
572
+ alpha: float
573
+
574
+ def __init__(self, alpha: float = 1.) -> None:
575
+ super().__init__()
576
+ self.alpha = alpha
577
+
578
+ def __call__(self, x: ArrayLike) -> ArrayLike:
579
+ return F.celu(x, self.alpha)
580
+
581
+ def extra_repr(self) -> str:
582
+ return f'{self.__class__.__name__}(alpha={self.alpha})'
583
+
584
+
585
+ class SELU(ElementWiseBlock):
586
+ r"""Applied element-wise.
587
+
588
+ .. math::
589
+ \text{SELU}(x) = \text{scale} * (\max(0,x) + \min(0, \alpha * (\exp(x) - 1)))
590
+
591
+ with :math:`\alpha = 1.6732632423543772848170429916717` and
592
+ :math:`\text{scale} = 1.0507009873554804934193349852946`.
593
+
594
+ More details can be found in the paper `Self-Normalizing Neural Networks`_ .
595
+
596
+ Shape
597
+ -----
598
+ - Input: :math:`(*)`, where :math:`*` means any number of dimensions.
599
+ - Output: :math:`(*)`, same shape as the input.
600
+
601
+ References
602
+ ----------
603
+ .. _Self-Normalizing Neural Networks: https://arxiv.org/abs/1706.02515
604
+
605
+ Examples
606
+ --------
607
+ .. code-block:: python
608
+
609
+ >>> import brainstate.nn as nn
610
+ >>> import brainstate
611
+ >>> m = nn.SELU()
612
+ >>> x = brainstate.random.randn(2)
613
+ >>> output = m(x)
614
+ """
615
+ __module__ = 'brainstate.nn'
616
+
617
+ def __call__(self, x: ArrayLike) -> ArrayLike:
618
+ return F.selu(x)
619
+
620
+
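The fixed constants quoted above can be plugged into the formula and compared against the
module output; an illustrative sketch assuming ``jax.numpy`` is available alongside
``brainstate``:

.. code-block:: python

    >>> import jax.numpy as jnp
    >>> import brainstate
    >>> alpha = 1.6732632423543772848170429916717
    >>> scale = 1.0507009873554804934193349852946
    >>> x = brainstate.random.randn(16)
    >>> manual = scale * jnp.where(x > 0, x, alpha * (jnp.exp(x) - 1.0))
    >>> assert jnp.allclose(brainstate.nn.SELU()(x), manual, atol=1e-5)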
621
+ class GLU(ElementWiseBlock):
622
+ r"""Applies the gated linear unit function.
623
+
624
+ .. math::
625
+         \text{GLU}(a, b) = a \otimes \sigma(b)
+
+     where :math:`a` is the first half of the input matrix and :math:`b` is
+     the second half, split along the dimension ``dim``.
629
+
630
+ Parameters
631
+ ----------
632
+ dim : int, optional
633
+ The dimension on which to split the input. Default: -1
634
+
635
+ Shape
636
+ -----
637
+     - Input: :math:`(\ast_1, N, \ast_2)`, where :math:`*` means any number of
+         additional dimensions
639
+ - Output: :math:`(\ast_1, M, \ast_2)` where :math:`M=N/2`
640
+
641
+ Examples
642
+ --------
643
+ .. code-block:: python
644
+
645
+ >>> import brainstate.nn as nn
646
+ >>> import brainstate
647
+ >>> m = nn.GLU()
648
+ >>> x = brainstate.random.randn(4, 2)
649
+ >>> output = m(x)
650
+ """
651
+ __module__ = 'brainstate.nn'
652
+ dim: int
653
+
654
+ def __init__(self, dim: int = -1) -> None:
655
+ super().__init__()
656
+ self.dim = dim
657
+
658
+ def __call__(self, x: ArrayLike) -> ArrayLike:
659
+ return F.glu(x, self.dim)
660
+
661
+ def __repr__(self):
662
+ return f'{self.__class__.__name__}(dim={self.dim})'
663
+
664
+
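GLU halves the size of the chosen dimension: the second half, passed through a sigmoid,
gates the first half. The sketch below is illustrative only and assumes ``jax.numpy`` is
available alongside ``brainstate``:

.. code-block:: python

    >>> import jax.numpy as jnp
    >>> import brainstate
    >>> x = brainstate.random.randn(4, 6)
    >>> out = brainstate.nn.GLU(dim=-1)(x)
    >>> assert out.shape == (4, 3)                  # the split dimension is halved
    >>> a, b = jnp.split(x, 2, axis=-1)             # a: first half, b: second half
    >>> sigmoid_b = 1.0 / (1.0 + jnp.exp(-b))
    >>> assert jnp.allclose(out, a * sigmoid_b, atol=1e-6)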
665
+ class GELU(ElementWiseBlock):
666
+ r"""Applies the Gaussian Error Linear Units function.
667
+
668
+ .. math:: \text{GELU}(x) = x * \Phi(x)
669
+
670
+     where :math:`\Phi(x)` is the cumulative distribution function of the standard
+     Gaussian distribution.
+
+     When ``approximate`` is ``True``, GELU is estimated with:
+
+     .. math:: \text{GELU}(x) = 0.5 * x * (1 + \text{Tanh}(\sqrt{2 / \pi} * (x + 0.044715 * x^3)))
676
+
677
+ Parameters
678
+ ----------
679
+ approximate : bool, optional
680
+ Whether to use the tanh approximation algorithm. Default: False
681
+
682
+ Shape
683
+ -----
684
+ - Input: :math:`(*)`, where :math:`*` means any number of dimensions.
685
+ - Output: :math:`(*)`, same shape as the input.
686
+
687
+ Examples
688
+ --------
689
+ .. code-block:: python
690
+
691
+ >>> import brainstate.nn as nn
692
+ >>> import brainstate
693
+ >>> m = nn.GELU()
694
+ >>> x = brainstate.random.randn(2)
695
+ >>> output = m(x)
696
+ """
697
+ __module__ = 'brainstate.nn'
698
+ approximate: bool
699
+
700
+ def __init__(self, approximate: bool = False) -> None:
701
+ super().__init__()
702
+ self.approximate = approximate
703
+
704
+ def __call__(self, x: ArrayLike) -> ArrayLike:
705
+ return F.gelu(x, approximate=self.approximate)
706
+
707
+ def __repr__(self):
708
+ return f'{self.__class__.__name__}(approximate={self.approximate})'
709
+
710
+
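The tanh approximation is close to, but not identical with, the exact form; the comparison
below is an illustrative sketch assuming ``jax.numpy`` is available alongside ``brainstate``:

.. code-block:: python

    >>> import jax.numpy as jnp
    >>> import brainstate
    >>> x = brainstate.random.randn(1000)
    >>> exact = brainstate.nn.GELU(approximate=False)(x)
    >>> approx = brainstate.nn.GELU(approximate=True)(x)
    >>> # the two variants agree to within roughly 1e-2 element-wise
    >>> assert jnp.max(jnp.abs(exact - approx)) < 1e-2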
711
+ class Hardshrink(ElementWiseBlock):
712
+ r"""Applies the Hard Shrinkage (Hardshrink) function element-wise.
713
+
714
+ Hardshrink is defined as:
715
+
716
+ .. math::
717
+ \text{HardShrink}(x) =
718
+ \begin{cases}
719
+ x, & \text{ if } x > \lambda \\
720
+ x, & \text{ if } x < -\lambda \\
721
+ 0, & \text{ otherwise }
722
+ \end{cases}
723
+
724
+ Parameters
725
+ ----------
726
+ lambd : float, optional
727
+ The :math:`\lambda` value for the Hardshrink formulation. Default: 0.5
728
+
729
+ Shape
730
+ -----
731
+ - Input: :math:`(*)`, where :math:`*` means any number of dimensions.
732
+ - Output: :math:`(*)`, same shape as the input.
733
+
734
+ Examples
735
+ --------
736
+ .. code-block:: python
737
+
738
+ >>> import brainstate.nn as nn
739
+ >>> import brainstate
740
+ >>> m = nn.Hardshrink()
741
+ >>> x = brainstate.random.randn(2)
742
+ >>> output = m(x)
743
+ """
744
+ __module__ = 'brainstate.nn'
745
+ lambd: float
746
+
747
+ def __init__(self, lambd: float = 0.5) -> None:
748
+ super().__init__()
749
+ self.lambd = lambd
750
+
751
+ def __call__(self, x: ArrayLike) -> ArrayLike:
752
+ return F.hard_shrink(x, self.lambd)
753
+
754
+ def __repr__(self):
755
+ return f'{self.__class__.__name__}(lambd={self.lambd})'
756
+
757
+
758
+ class LeakyReLU(ElementWiseBlock):
759
+ r"""Applies the element-wise function.
760
+
761
+ .. math::
762
+ \text{LeakyReLU}(x) = \max(0, x) + \text{negative\_slope} * \min(0, x)
763
+
764
+ or
765
+
766
+ .. math::
767
+ \text{LeakyReLU}(x) =
768
+ \begin{cases}
769
+ x, & \text{ if } x \geq 0 \\
770
+ \text{negative\_slope} \times x, & \text{ otherwise }
771
+ \end{cases}
772
+
773
+ Parameters
774
+ ----------
775
+ negative_slope : float, optional
776
+ Controls the angle of the negative slope (which is used for
777
+ negative input values). Default: 1e-2
778
+
779
+ Shape
780
+ -----
781
+     - Input: :math:`(*)`, where :math:`*` means any number of additional
+         dimensions
783
+ - Output: :math:`(*)`, same shape as the input
784
+
785
+ Examples
786
+ --------
787
+ .. code-block:: python
788
+
789
+ >>> import brainstate.nn as nn
790
+ >>> import brainstate
791
+ >>> m = nn.LeakyReLU(0.1)
792
+ >>> x = brainstate.random.randn(2)
793
+ >>> output = m(x)
794
+ """
795
+ __module__ = 'brainstate.nn'
796
+ negative_slope: float
797
+
798
+ def __init__(self, negative_slope: float = 1e-2) -> None:
799
+ super().__init__()
800
+ self.negative_slope = negative_slope
801
+
802
+ def __call__(self, x: ArrayLike) -> ArrayLike:
803
+ return F.leaky_relu(x, self.negative_slope)
804
+
805
+ def __repr__(self):
806
+ return f'{self.__class__.__name__}(negative_slope={self.negative_slope})'
807
+
808
+
809
+ class LogSigmoid(ElementWiseBlock):
810
+ r"""Applies the element-wise function.
811
+
812
+ .. math::
813
+ \text{LogSigmoid}(x) = \log\left(\frac{ 1 }{ 1 + \exp(-x)}\right)
814
+
815
+ Shape
816
+ -----
817
+ - Input: :math:`(*)`, where :math:`*` means any number of dimensions.
818
+ - Output: :math:`(*)`, same shape as the input.
819
+
820
+ Examples
821
+ --------
822
+ .. code-block:: python
823
+
824
+ >>> import brainstate.nn as nn
825
+ >>> import brainstate
826
+ >>> m = nn.LogSigmoid()
827
+ >>> x = brainstate.random.randn(2)
828
+ >>> output = m(x)
829
+ """
830
+ __module__ = 'brainstate.nn'
831
+
832
+ def __call__(self, x: ArrayLike) -> ArrayLike:
833
+ return F.log_sigmoid(x)
834
+
835
+
836
+ class Softplus(ElementWiseBlock):
837
+ r"""Applies the Softplus function element-wise.
838
+
839
+ .. math::
840
+ \text{Softplus}(x) = \frac{1}{\beta} * \log(1 + \exp(\beta * x))
841
+
842
+ SoftPlus is a smooth approximation to the ReLU function and can be used
843
+ to constrain the output of a machine to always be positive.
844
+
845
+ For numerical stability the implementation reverts to the linear function
846
+ when :math:`input \times \beta > threshold`.
847
+
848
+ Shape
849
+ -----
850
+ - Input: :math:`(*)`, where :math:`*` means any number of dimensions.
851
+ - Output: :math:`(*)`, same shape as the input.
852
+
853
+ Examples
854
+ --------
855
+ .. code-block:: python
856
+
857
+ >>> import brainstate.nn as nn
858
+ >>> import brainstate
859
+ >>> m = nn.Softplus()
860
+ >>> x = brainstate.random.randn(2)
861
+ >>> output = m(x)
862
+ """
863
+ __module__ = 'brainstate.nn'
864
+
865
+ def __call__(self, x: ArrayLike) -> ArrayLike:
866
+ return F.softplus(x)
867
+
868
+
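Softplus is a smooth upper bound of ReLU that approaches it for large :math:`|x|`; the
sketch below is illustrative only and assumes ``jax.numpy`` is available alongside
``brainstate``:

.. code-block:: python

    >>> import jax.numpy as jnp
    >>> import brainstate
    >>> x = jnp.linspace(-5.0, 5.0, 11)
    >>> sp = brainstate.nn.Softplus()(x)
    >>> relu = jnp.maximum(x, 0.0)
    >>> assert jnp.all(sp >= relu)                         # softplus never falls below ReLU
    >>> assert jnp.allclose(sp[-1], relu[-1], atol=1e-2)   # nearly identical at x = 5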
869
+ class Softshrink(ElementWiseBlock):
870
+ r"""Applies the soft shrinkage function elementwise.
871
+
872
+ .. math::
873
+ \text{SoftShrinkage}(x) =
874
+ \begin{cases}
875
+ x - \lambda, & \text{ if } x > \lambda \\
876
+ x + \lambda, & \text{ if } x < -\lambda \\
877
+ 0, & \text{ otherwise }
878
+ \end{cases}
879
+
880
+ Parameters
881
+ ----------
882
+ lambd : float, optional
883
+         The :math:`\lambda` value (must be non-negative) for the
+         Softshrink formulation. Default: 0.5
885
+
886
+ Shape
887
+ -----
888
+ - Input: :math:`(*)`, where :math:`*` means any number of dimensions.
889
+ - Output: :math:`(*)`, same shape as the input.
890
+
891
+ Examples
892
+ --------
893
+ .. code-block:: python
894
+
895
+ >>> import brainstate.nn as nn
896
+ >>> import brainstate
897
+ >>> m = nn.Softshrink()
898
+ >>> x = brainstate.random.randn(2)
899
+ >>> output = m(x)
900
+ """
901
+ __module__ = 'brainstate.nn'
902
+ lambd: float
903
+
904
+ def __init__(self, lambd: float = 0.5) -> None:
905
+ super().__init__()
906
+ self.lambd = lambd
907
+
908
+ def __call__(self, x: ArrayLike) -> ArrayLike:
909
+ return F.soft_shrink(x, self.lambd)
910
+
911
+ def __repr__(self):
912
+ return f'{self.__class__.__name__}(lambd={self.lambd})'
913
+
914
+
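Hardshrink and Softshrink zero out the same band :math:`[-\lambda, \lambda]`, but Softshrink
additionally shifts the surviving values toward zero by :math:`\lambda`. An illustrative
sketch, assuming ``jax.numpy`` is available alongside ``brainstate``:

.. code-block:: python

    >>> import jax.numpy as jnp
    >>> import brainstate
    >>> x = jnp.array([-1.0, -0.3, 0.0, 0.3, 1.0])
    >>> hard = brainstate.nn.Hardshrink(lambd=0.5)(x)
    >>> soft = brainstate.nn.Softshrink(lambd=0.5)(x)
    >>> assert jnp.allclose(hard, jnp.array([-1.0, 0.0, 0.0, 0.0, 1.0]))
    >>> assert jnp.allclose(soft, jnp.array([-0.5, 0.0, 0.0, 0.0, 0.5]))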
915
+ class PReLU(ElementWiseBlock):
916
+ r"""Applies the element-wise function.
917
+
918
+ .. math::
919
+ \text{PReLU}(x) = \max(0,x) + a * \min(0,x)
920
+
921
+ or
922
+
923
+ .. math::
924
+ \text{PReLU}(x) =
925
+ \begin{cases}
926
+ x, & \text{ if } x \geq 0 \\
927
+ ax, & \text{ otherwise }
928
+ \end{cases}
929
+
930
+ Here :math:`a` is a learnable parameter. When called without arguments,
931
+ `nn.PReLU()` uses a single parameter :math:`a` across all input channels.
932
+ If called with `nn.PReLU(nChannels)`, a separate :math:`a` is used for
933
+ each input channel.
934
+
935
+ Parameters
936
+ ----------
937
+ num_parameters : int, optional
938
+         Number of :math:`a` to learn. Although it takes an int as input,
+         only two values are legitimate: 1, or the number of channels
+         of the input. Default: 1
941
+ init : float, optional
942
+ The initial value of :math:`a`. Default: 0.25
943
+ dtype : optional
944
+ The data type for the weight parameter.
945
+
946
+ Shape
947
+ -----
948
+     - Input: :math:`(*)`, where :math:`*` means any number of additional dimensions.
949
+ - Output: :math:`(*)`, same shape as the input.
950
+
951
+ Attributes
952
+ ----------
953
+     weight : ParamState
+         The learnable weights of shape (:attr:`num_parameters`,).
955
+
956
+ Notes
957
+ -----
958
+     - For good performance, weight decay should not be used when learning :math:`a`.
+     - The channel dimension is the second dimension of the input. When the input has
+         fewer than two dimensions, there is no channel dimension and the number of
+         channels is 1.
961
+
962
+ Examples
963
+ --------
964
+ .. code-block:: python
965
+
966
+ >>> import brainstate
967
+ >>> m = brainstate.nn.PReLU()
968
+ >>> x = brainstate.random.randn(2)
969
+ >>> output = m(x)
970
+ """
971
+ __module__ = 'brainstate.nn'
972
+ num_parameters: int
973
+
974
+ def __init__(self, num_parameters: int = 1, init: float = 0.25, dtype=None) -> None:
975
+ super().__init__()
976
+ self.num_parameters = num_parameters
977
+ self.weight = ParamState(jnp.ones(num_parameters, dtype=dtype) * init)
978
+
979
+ def __call__(self, x: ArrayLike) -> ArrayLike:
980
+ return F.prelu(x, self.weight.value)
981
+
982
+ def __repr__(self):
983
+ return f'{self.__class__.__name__}(num_parameters={self.num_parameters})'
984
+
985
+
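With ``num_parameters > 1`` a separate slope is learned per channel; the sketch below is
illustrative only:

.. code-block:: python

    >>> import brainstate
    >>> m = brainstate.nn.PReLU(num_parameters=3, init=0.1)
    >>> x = brainstate.random.randn(4, 3)       # for a 2-D input, the channel axis is the second one
    >>> y = m(x)
    >>> assert y.shape == x.shape
    >>> assert m.weight.value.shape == (3,)     # one learnable slope per channel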
986
+ class Softsign(ElementWiseBlock):
987
+ r"""Applies the element-wise function.
988
+
989
+ .. math::
990
+ \text{SoftSign}(x) = \frac{x}{ 1 + |x|}
991
+
992
+ Shape
993
+ -----
994
+ - Input: :math:`(*)`, where :math:`*` means any number of dimensions.
995
+ - Output: :math:`(*)`, same shape as the input.
996
+
997
+ Examples
998
+ --------
999
+ .. code-block:: python
1000
+
1001
+ >>> import brainstate.nn as nn
1002
+ >>> import brainstate
1003
+ >>> m = nn.Softsign()
1004
+ >>> x = brainstate.random.randn(2)
1005
+ >>> output = m(x)
1006
+ """
1007
+ __module__ = 'brainstate.nn'
1008
+
1009
+ def __call__(self, x: ArrayLike) -> ArrayLike:
1010
+ return F.soft_sign(x)
1011
+
1012
+
1013
+ class Tanhshrink(ElementWiseBlock):
1014
+ r"""Applies the element-wise function.
1015
+
1016
+ .. math::
1017
+ \text{Tanhshrink}(x) = x - \tanh(x)
1018
+
1019
+ Shape
1020
+ -----
1021
+ - Input: :math:`(*)`, where :math:`*` means any number of dimensions.
1022
+ - Output: :math:`(*)`, same shape as the input.
1023
+
1024
+ Examples
1025
+ --------
1026
+ .. code-block:: python
1027
+
1028
+ >>> import brainstate.nn as nn
1029
+ >>> import brainstate
1030
+ >>> m = nn.Tanhshrink()
1031
+ >>> x = brainstate.random.randn(2)
1032
+ >>> output = m(x)
1033
+ """
1034
+ __module__ = 'brainstate.nn'
1035
+
1036
+ def __call__(self, x: ArrayLike) -> ArrayLike:
1037
+ return F.tanh_shrink(x)
1038
+
1039
+
1040
+ class Softmin(ElementWiseBlock):
1041
+ r"""Applies the Softmin function to an n-dimensional input Tensor.
1042
+
1043
+ Rescales the input so that the elements of the n-dimensional output Tensor
1044
+ lie in the range `[0, 1]` and sum to 1.
1045
+
1046
+ Softmin is defined as:
1047
+
1048
+ .. math::
1049
+ \text{Softmin}(x_{i}) = \frac{\exp(-x_i)}{\sum_j \exp(-x_j)}
1050
+
1051
+ Parameters
1052
+ ----------
1053
+ dim : int, optional
1054
+ A dimension along which Softmin will be computed (so every slice
1055
+ along dim will sum to 1).
1056
+
1057
+ Shape
1058
+ -----
1059
+     - Input: :math:`(*)`, where :math:`*` means any number of additional dimensions
1060
+ - Output: :math:`(*)`, same shape as the input
1061
+
1062
+ Returns
1063
+ -------
1064
+ Tensor
1065
+ A Tensor of the same dimension and shape as the input, with
1066
+ values in the range [0, 1]
1067
+
1068
+ Examples
1069
+ --------
1070
+ .. code-block:: python
1071
+
1072
+ >>> import brainstate.nn as nn
1073
+ >>> import brainstate
1074
+ >>> m = nn.Softmin(dim=1)
1075
+ >>> x = brainstate.random.randn(2, 3)
1076
+ >>> output = m(x)
1077
+ """
1078
+ __module__ = 'brainstate.nn'
1079
+ dim: Optional[int]
1080
+
1081
+ def __init__(self, dim: Optional[int] = None) -> None:
1082
+ super().__init__()
1083
+ self.dim = dim
1084
+
1085
+ def __call__(self, x: ArrayLike) -> ArrayLike:
1086
+ return F.softmin(x, self.dim)
1087
+
1088
+ def __repr__(self):
1089
+ return f'{self.__class__.__name__}(dim={self.dim})'
1090
+
1091
+
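Softmin is equivalent to applying Softmax to the negated input; an illustrative sketch
assuming ``jax.numpy`` is available alongside ``brainstate``:

.. code-block:: python

    >>> import jax.numpy as jnp
    >>> import brainstate
    >>> x = brainstate.random.randn(2, 5)
    >>> softmin = brainstate.nn.Softmin(dim=-1)(x)
    >>> softmax_of_neg = brainstate.nn.Softmax(dim=-1)(-x)
    >>> assert jnp.allclose(softmin, softmax_of_neg, atol=1e-6)
    >>> assert jnp.allclose(softmin.sum(axis=-1), 1.0, atol=1e-6)   # each slice sums to 1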
1092
+ class Softmax(ElementWiseBlock):
1093
+ r"""Applies the Softmax function to an n-dimensional input Tensor.
1094
+
1095
+ Rescales the input so that the elements of the n-dimensional output Tensor
1096
+ lie in the range [0,1] and sum to 1.
1097
+
1098
+ Softmax is defined as:
1099
+
1100
+ .. math::
1101
+ \text{Softmax}(x_{i}) = \frac{\exp(x_i)}{\sum_j \exp(x_j)}
1102
+
1103
+     When the input Tensor is a sparse tensor, the unspecified
+     values are treated as ``-inf``.
1105
+
1106
+ Parameters
1107
+ ----------
1108
+ dim : int, optional
1109
+ A dimension along which Softmax will be computed (so every slice
1110
+ along dim will sum to 1).
1111
+
1112
+ Shape
1113
+ -----
1114
+     - Input: :math:`(*)`, where :math:`*` means any number of additional dimensions
1115
+ - Output: :math:`(*)`, same shape as the input
1116
+
1117
+ Returns
1118
+ -------
1119
+ Tensor
1120
+ A Tensor of the same dimension and shape as the input with
1121
+ values in the range [0, 1]
1122
+
1123
+ Notes
1124
+ -----
1125
+     This module does not work directly with a negative log-likelihood loss, which
+     expects log-probabilities as input. Use `LogSoftmax` instead (it is
+     faster and has better numerical properties).
1128
+
1129
+ Examples
1130
+ --------
1131
+ .. code-block:: python
1132
+
1133
+ >>> import brainstate.nn as nn
1134
+ >>> import brainstate
1135
+ >>> m = nn.Softmax(dim=1)
1136
+ >>> x = brainstate.random.randn(2, 3)
1137
+ >>> output = m(x)
1138
+ """
1139
+ __module__ = 'brainstate.nn'
1140
+ dim: Optional[int]
1141
+
1142
+ def __init__(self, dim: Optional[int] = None) -> None:
1143
+ super().__init__()
1144
+ self.dim = dim
1145
+
1146
+ def __call__(self, x: ArrayLike) -> ArrayLike:
1147
+ return F.softmax(x, self.dim)
1148
+
1149
+ def __repr__(self):
1150
+ return f'{self.__class__.__name__}(dim={self.dim})'
1151
+
1152
+
1153
+ class Softmax2d(ElementWiseBlock):
1154
+ r"""Applies SoftMax over features to each spatial location.
1155
+
1156
+ When given an image of ``Channels x Height x Width``, it will
1157
+ apply `Softmax` to each location :math:`(Channels, h_i, w_j)`
1158
+
1159
+ Shape
1160
+ -----
1161
+ - Input: :math:`(N, C, H, W)` or :math:`(C, H, W)`.
1162
+ - Output: :math:`(N, C, H, W)` or :math:`(C, H, W)` (same shape as input)
1163
+
1164
+ Returns
1165
+ -------
1166
+ Tensor
1167
+ A Tensor of the same dimension and shape as the input with
1168
+ values in the range [0, 1]
1169
+
1170
+ Examples
1171
+ --------
1172
+ .. code-block:: python
1173
+
1174
+ >>> import brainstate.nn as nn
1175
+ >>> import brainstate
1176
+ >>> m = nn.Softmax2d()
1177
+         >>> # softmax is applied over the channel dimension (axis -3)
1178
+ >>> x = brainstate.random.randn(2, 3, 12, 13)
1179
+ >>> output = m(x)
1180
+ """
1181
+ __module__ = 'brainstate.nn'
1182
+
1183
+ def __call__(self, x: ArrayLike) -> ArrayLike:
1184
+ assert x.ndim == 4 or x.ndim == 3, 'Softmax2d requires a 3D or 4D tensor as input'
1185
+ return F.softmax(x, -3)
1186
+
1187
+
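For an :math:`(N, C, H, W)` input, ``Softmax2d`` normalises over the channel axis, so the
values at every spatial location sum to 1; an illustrative sketch assuming ``jax.numpy``
is available alongside ``brainstate``:

.. code-block:: python

    >>> import jax.numpy as jnp
    >>> import brainstate
    >>> x = brainstate.random.randn(2, 3, 4, 5)      # (N, C, H, W)
    >>> y = brainstate.nn.Softmax2d()(x)
    >>> assert y.shape == x.shape
    >>> assert jnp.allclose(y.sum(axis=1), 1.0, atol=1e-5)   # sums over channels are 1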
1188
+ class LogSoftmax(ElementWiseBlock):
1189
+ r"""Applies the :math:`\log(\text{Softmax}(x))` function to an n-dimensional input Tensor.
1190
+
1191
+ The LogSoftmax formulation can be simplified as:
1192
+
1193
+ .. math::
1194
+ \text{LogSoftmax}(x_{i}) = \log\left(\frac{\exp(x_i) }{ \sum_j \exp(x_j)} \right)
1195
+
1196
+ Parameters
1197
+ ----------
1198
+ dim : int, optional
1199
+ A dimension along which LogSoftmax will be computed.
1200
+
1201
+ Shape
1202
+ -----
1203
+     - Input: :math:`(*)`, where :math:`*` means any number of additional dimensions
1204
+ - Output: :math:`(*)`, same shape as the input
1205
+
1206
+ Returns
1207
+ -------
1208
+ Tensor
1209
+ A Tensor of the same dimension and shape as the input with
1210
+         values in the range (-inf, 0]
1211
+
1212
+ Examples
1213
+ --------
1214
+ .. code-block:: python
1215
+
1216
+ >>> import brainstate.nn as nn
1217
+ >>> import brainstate
1218
+ >>> m = nn.LogSoftmax(dim=1)
1219
+ >>> x = brainstate.random.randn(2, 3)
1220
+ >>> output = m(x)
1221
+ """
1222
+ __module__ = 'brainstate.nn'
1223
+ dim: Optional[int]
1224
+
1225
+ def __init__(self, dim: Optional[int] = None) -> None:
1226
+ super().__init__()
1227
+ self.dim = dim
1228
+
1229
+ def __call__(self, x: ArrayLike) -> ArrayLike:
1230
+ return F.log_softmax(x, self.dim)
1231
+
1232
+ def __repr__(self):
1233
+ return f'{self.__class__.__name__}(dim={self.dim})'
1234
+
1235
+
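``LogSoftmax`` returns log-probabilities, so exponentiating its output recovers the
``Softmax`` result; an illustrative sketch assuming ``jax.numpy`` is available alongside
``brainstate``:

.. code-block:: python

    >>> import jax.numpy as jnp
    >>> import brainstate
    >>> x = brainstate.random.randn(2, 5)
    >>> log_p = brainstate.nn.LogSoftmax(dim=-1)(x)
    >>> p = brainstate.nn.Softmax(dim=-1)(x)
    >>> assert jnp.allclose(jnp.exp(log_p), p, atol=1e-6)
    >>> assert jnp.all(log_p <= 0)                   # log-probabilities are non-positive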
1236
+ class Identity(ElementWiseBlock):
1237
+ r"""A placeholder identity operator that is argument-insensitive.
1238
+
1239
+ Examples
1240
+ --------
1241
+ .. code-block:: python
1242
+
1243
+         >>> import brainstate.nn as nn
+         >>> import brainstate
+         >>> m = nn.Identity()
1245
+ >>> x = brainstate.random.randn(2, 3)
1246
+ >>> output = m(x)
1247
+ >>> assert (output == x).all()
1248
+ """
1249
+ __module__ = 'brainstate.nn'
1250
+
1251
+ def __call__(self, x):
1252
+ return x
1253
+
1254
+
1255
+ class SpikeBitwise(ElementWiseBlock):
1256
+ r"""Bitwise addition for the spiking inputs.
1257
+
1258
+ .. math::
1259
+
1260
+ \begin{array}{ccc}
1261
+ \hline \text { Mode } & \text { Expression for } \mathrm{g}(\mathrm{x}, \mathrm{y}) & \text { Code for } \mathrm{g}(\mathrm{x}, \mathrm{y}) \\
1262
+ \hline \text { ADD } & x+y & x+y \\
1263
+ \text { AND } & x \cap y & x \cdot y \\
1264
+ \text { IAND } & (\neg x) \cap y & (1-x) \cdot y \\
1265
+ \text { OR } & x \cup y & (x+y)-(x \cdot y) \\
1266
+ \hline
1267
+ \end{array}
1268
+
1269
+ Parameters
1270
+ ----------
1271
+ op : str, optional
1272
+ The bitwise operation. Default: 'add'
1273
+ name : str, optional
1274
+ The name of the dynamic system.
1275
+
1276
+ Examples
1277
+ --------
1278
+ .. code-block:: python
1279
+
1280
+         >>> import brainstate.nn as nn
+         >>> import brainstate
+         >>> m = nn.SpikeBitwise(op='and')
1282
+ >>> x = brainstate.random.randn(2, 3) > 0
1283
+ >>> y = brainstate.random.randn(2, 3) > 0
1284
+ >>> output = m(x, y)
1285
+ """
1286
+ __module__ = 'brainstate.nn'
1287
+
1288
+ def __init__(
1289
+ self,
1290
+ op: str = 'add',
1291
+ name: Optional[str] = None
1292
+ ) -> None:
1293
+ super().__init__(name=name)
1294
+ self.op = op
1295
+
1296
+ def __call__(self, x, y):
1297
+ import braintools
1298
+ return braintools.spike_bitwise(x, y, self.op)
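The table above can be checked on 0/1 spike vectors. Note that ``SpikeBitwise`` delegates
to the optional ``braintools`` package at call time, so the illustrative sketch below
assumes ``braintools`` (and ``jax.numpy``) is installed alongside ``brainstate``:

.. code-block:: python

    >>> import jax.numpy as jnp
    >>> import brainstate
    >>> x = jnp.array([0., 0., 1., 1.])
    >>> y = jnp.array([0., 1., 0., 1.])
    >>> add_out = brainstate.nn.SpikeBitwise(op='add')(x, y)   # x + y
    >>> and_out = brainstate.nn.SpikeBitwise(op='and')(x, y)   # x * y
    >>> assert jnp.allclose(add_out, jnp.array([0., 1., 1., 2.]))
    >>> assert jnp.allclose(and_out, jnp.array([0., 0., 0., 1.]))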