brainstate 0.0.2.post20241010__py2.py3-none-any.whl → 0.1.0__py2.py3-none-any.whl
This diff shows the changes between two publicly released versions of the package, as they appear in their respective public registries. It is provided for informational purposes only.
- brainstate/__init__.py +31 -11
- brainstate/_state.py +760 -316
- brainstate/_state_test.py +41 -12
- brainstate/_utils.py +31 -4
- brainstate/augment/__init__.py +40 -0
- brainstate/augment/_autograd.py +608 -0
- brainstate/augment/_autograd_test.py +1193 -0
- brainstate/augment/_eval_shape.py +102 -0
- brainstate/augment/_eval_shape_test.py +40 -0
- brainstate/augment/_mapping.py +525 -0
- brainstate/augment/_mapping_test.py +210 -0
- brainstate/augment/_random.py +99 -0
- brainstate/{transform → compile}/__init__.py +25 -13
- brainstate/compile/_ad_checkpoint.py +204 -0
- brainstate/compile/_ad_checkpoint_test.py +51 -0
- brainstate/compile/_conditions.py +259 -0
- brainstate/compile/_conditions_test.py +221 -0
- brainstate/compile/_error_if.py +94 -0
- brainstate/compile/_error_if_test.py +54 -0
- brainstate/compile/_jit.py +314 -0
- brainstate/compile/_jit_test.py +143 -0
- brainstate/compile/_loop_collect_return.py +516 -0
- brainstate/compile/_loop_collect_return_test.py +59 -0
- brainstate/compile/_loop_no_collection.py +185 -0
- brainstate/compile/_loop_no_collection_test.py +51 -0
- brainstate/compile/_make_jaxpr.py +756 -0
- brainstate/compile/_make_jaxpr_test.py +134 -0
- brainstate/compile/_progress_bar.py +111 -0
- brainstate/compile/_unvmap.py +159 -0
- brainstate/compile/_util.py +147 -0
- brainstate/environ.py +408 -381
- brainstate/environ_test.py +34 -32
- brainstate/{nn/event → event}/__init__.py +6 -6
- brainstate/event/_csr.py +308 -0
- brainstate/event/_csr_test.py +118 -0
- brainstate/event/_fixed_probability.py +271 -0
- brainstate/event/_fixed_probability_test.py +128 -0
- brainstate/event/_linear.py +219 -0
- brainstate/event/_linear_test.py +112 -0
- brainstate/{nn/event → event}/_misc.py +7 -7
- brainstate/functional/_activations.py +521 -511
- brainstate/functional/_activations_test.py +300 -300
- brainstate/functional/_normalization.py +43 -43
- brainstate/functional/_others.py +15 -15
- brainstate/functional/_spikes.py +49 -49
- brainstate/graph/__init__.py +33 -0
- brainstate/graph/_graph_context.py +443 -0
- brainstate/graph/_graph_context_test.py +65 -0
- brainstate/graph/_graph_convert.py +246 -0
- brainstate/graph/_graph_node.py +300 -0
- brainstate/graph/_graph_node_test.py +75 -0
- brainstate/graph/_graph_operation.py +1746 -0
- brainstate/graph/_graph_operation_test.py +724 -0
- brainstate/init/_base.py +28 -10
- brainstate/init/_generic.py +175 -172
- brainstate/init/_random_inits.py +470 -415
- brainstate/init/_random_inits_test.py +150 -0
- brainstate/init/_regular_inits.py +66 -69
- brainstate/init/_regular_inits_test.py +51 -0
- brainstate/mixin.py +236 -244
- brainstate/mixin_test.py +44 -46
- brainstate/nn/__init__.py +26 -51
- brainstate/nn/_collective_ops.py +199 -0
- brainstate/nn/_dyn_impl/__init__.py +46 -0
- brainstate/nn/_dyn_impl/_dynamics_neuron.py +290 -0
- brainstate/nn/_dyn_impl/_dynamics_neuron_test.py +162 -0
- brainstate/nn/_dyn_impl/_dynamics_synapse.py +320 -0
- brainstate/nn/_dyn_impl/_dynamics_synapse_test.py +132 -0
- brainstate/nn/_dyn_impl/_inputs.py +154 -0
- brainstate/nn/{_projection/__init__.py → _dyn_impl/_projection_alignpost.py} +6 -13
- brainstate/nn/_dyn_impl/_rate_rnns.py +400 -0
- brainstate/nn/_dyn_impl/_rate_rnns_test.py +64 -0
- brainstate/nn/_dyn_impl/_readout.py +128 -0
- brainstate/nn/_dyn_impl/_readout_test.py +54 -0
- brainstate/nn/_dynamics/__init__.py +37 -0
- brainstate/nn/_dynamics/_dynamics_base.py +631 -0
- brainstate/nn/_dynamics/_dynamics_base_test.py +79 -0
- brainstate/nn/_dynamics/_projection_base.py +346 -0
- brainstate/nn/_dynamics/_state_delay.py +453 -0
- brainstate/nn/_dynamics/_synouts.py +161 -0
- brainstate/nn/_dynamics/_synouts_test.py +58 -0
- brainstate/nn/_elementwise/__init__.py +22 -0
- brainstate/nn/_elementwise/_dropout.py +418 -0
- brainstate/nn/_elementwise/_dropout_test.py +100 -0
- brainstate/nn/_elementwise/_elementwise.py +1122 -0
- brainstate/nn/_elementwise/_elementwise_test.py +171 -0
- brainstate/nn/_exp_euler.py +97 -0
- brainstate/nn/_exp_euler_test.py +36 -0
- brainstate/nn/_interaction/__init__.py +32 -0
- brainstate/nn/_interaction/_connections.py +726 -0
- brainstate/nn/_interaction/_connections_test.py +254 -0
- brainstate/nn/_interaction/_embedding.py +59 -0
- brainstate/nn/_interaction/_normalizations.py +388 -0
- brainstate/nn/_interaction/_normalizations_test.py +75 -0
- brainstate/nn/_interaction/_poolings.py +1179 -0
- brainstate/nn/_interaction/_poolings_test.py +219 -0
- brainstate/nn/_module.py +328 -0
- brainstate/nn/_module_test.py +211 -0
- brainstate/nn/metrics.py +309 -309
- brainstate/optim/__init__.py +14 -2
- brainstate/optim/_base.py +66 -0
- brainstate/optim/_lr_scheduler.py +363 -400
- brainstate/optim/_lr_scheduler_test.py +25 -24
- brainstate/optim/_optax_optimizer.py +103 -176
- brainstate/optim/_optax_optimizer_test.py +41 -1
- brainstate/optim/_sgd_optimizer.py +950 -1025
- brainstate/random/_rand_funs.py +3269 -3268
- brainstate/random/_rand_funs_test.py +568 -0
- brainstate/random/_rand_seed.py +149 -117
- brainstate/random/_rand_seed_test.py +50 -0
- brainstate/random/_rand_state.py +1356 -1321
- brainstate/random/_random_for_unit.py +13 -13
- brainstate/surrogate.py +1262 -1243
- brainstate/{nn/_projection/_utils.py → transform.py} +1 -2
- brainstate/typing.py +157 -130
- brainstate/util/__init__.py +52 -0
- brainstate/util/_caller.py +100 -0
- brainstate/util/_dict.py +734 -0
- brainstate/util/_dict_test.py +160 -0
- brainstate/util/_error.py +28 -0
- brainstate/util/_filter.py +178 -0
- brainstate/util/_others.py +497 -0
- brainstate/util/_pretty_repr.py +208 -0
- brainstate/util/_scaling.py +260 -0
- brainstate/util/_struct.py +524 -0
- brainstate/util/_tracers.py +75 -0
- brainstate/{_visualization.py → util/_visualization.py} +16 -16
- {brainstate-0.0.2.post20241010.dist-info → brainstate-0.1.0.dist-info}/METADATA +11 -11
- brainstate-0.1.0.dist-info/RECORD +135 -0
- brainstate/_module.py +0 -1637
- brainstate/_module_test.py +0 -207
- brainstate/nn/_base.py +0 -251
- brainstate/nn/_connections.py +0 -686
- brainstate/nn/_dynamics.py +0 -426
- brainstate/nn/_elementwise.py +0 -1438
- brainstate/nn/_embedding.py +0 -66
- brainstate/nn/_misc.py +0 -133
- brainstate/nn/_normalizations.py +0 -389
- brainstate/nn/_others.py +0 -101
- brainstate/nn/_poolings.py +0 -1229
- brainstate/nn/_poolings_test.py +0 -231
- brainstate/nn/_projection/_align_post.py +0 -546
- brainstate/nn/_projection/_align_pre.py +0 -599
- brainstate/nn/_projection/_delta.py +0 -241
- brainstate/nn/_projection/_vanilla.py +0 -101
- brainstate/nn/_rate_rnns.py +0 -410
- brainstate/nn/_readout.py +0 -136
- brainstate/nn/_synouts.py +0 -166
- brainstate/nn/event/csr.py +0 -312
- brainstate/nn/event/csr_test.py +0 -118
- brainstate/nn/event/fixed_probability.py +0 -276
- brainstate/nn/event/fixed_probability_test.py +0 -127
- brainstate/nn/event/linear.py +0 -220
- brainstate/nn/event/linear_test.py +0 -111
- brainstate/random/random_test.py +0 -593
- brainstate/transform/_autograd.py +0 -585
- brainstate/transform/_autograd_test.py +0 -1181
- brainstate/transform/_conditions.py +0 -334
- brainstate/transform/_conditions_test.py +0 -220
- brainstate/transform/_error_if.py +0 -94
- brainstate/transform/_error_if_test.py +0 -55
- brainstate/transform/_jit.py +0 -265
- brainstate/transform/_jit_test.py +0 -118
- brainstate/transform/_loop_collect_return.py +0 -502
- brainstate/transform/_loop_no_collection.py +0 -170
- brainstate/transform/_make_jaxpr.py +0 -739
- brainstate/transform/_make_jaxpr_test.py +0 -131
- brainstate/transform/_mapping.py +0 -109
- brainstate/transform/_progress_bar.py +0 -111
- brainstate/transform/_unvmap.py +0 -143
- brainstate/util.py +0 -746
- brainstate-0.0.2.post20241010.dist-info/RECORD +0 -87
- {brainstate-0.0.2.post20241010.dist-info → brainstate-0.1.0.dist-info}/LICENSE +0 -0
- {brainstate-0.0.2.post20241010.dist-info → brainstate-0.1.0.dist-info}/WHEEL +0 -0
- {brainstate-0.0.2.post20241010.dist-info → brainstate-0.1.0.dist-info}/top_level.txt +0 -0
brainstate/surrogate.py
CHANGED
(Removed lines are collapsed in this view; each hunk below shows context and added lines.)

@@ -14,6 +14,7 @@
 # ==============================================================================

 # -*- coding: utf-8 -*-
+from __future__ import annotations

 import jax
 import jax.numpy as jnp
@@ -22,65 +23,65 @@ from jax.core import Primitive
 from jax.interpreters import batching, ad, mlir

 __all__ = [
+    'Surrogate',
+    'Sigmoid',
+    'sigmoid',
+    'PiecewiseQuadratic',
+    'piecewise_quadratic',
+    'PiecewiseExp',
+    'piecewise_exp',
+    'SoftSign',
+    'soft_sign',
+    'Arctan',
+    'arctan',
+    'NonzeroSignLog',
+    'nonzero_sign_log',
+    'ERF',
+    'erf',
+    'PiecewiseLeakyRelu',
+    'piecewise_leaky_relu',
+    'SquarewaveFourierSeries',
+    'squarewave_fourier_series',
+    'S2NN',
+    's2nn',
+    'QPseudoSpike',
+    'q_pseudo_spike',
+    'LeakyRelu',
+    'leaky_relu',
+    'LogTailedRelu',
+    'log_tailed_relu',
+    'ReluGrad',
+    'relu_grad',
+    'GaussianGrad',
+    'gaussian_grad',
+    'InvSquareGrad',
+    'inv_square_grad',
+    'MultiGaussianGrad',
+    'multi_gaussian_grad',
+    'SlayerGrad',
+    'slayer_grad',
 ]


 def _heaviside_abstract(x, dx):
+    return [x]


 def _heaviside_imp(x, dx):
+    z = jnp.asarray(x >= 0, dtype=x.dtype)
+    return [z]


 def _heaviside_batching(args, axes):
+    return heaviside_p.bind(*args), [axes[0]]


 def _heaviside_jvp(primals, tangents):
+    x, dx = primals
+    tx, tdx = tangents
+    primal_outs = heaviside_p.bind(x, dx)
+    tangent_outs = [dx * tx, ]
+    return primal_outs, tangent_outs


 heaviside_p = Primitive('heaviside_p')
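The rules above give `heaviside_p` a hard step in the forward pass while its JVP routes the
tangent through a caller-supplied surrogate derivative (`tangent_outs = [dx * tx]`). A minimal
self-contained sketch of the same contract, using `jax.custom_jvp` instead of a hand-registered
primitive (the primitive route additionally needs the abstract-eval, batching, and lowering
registrations shown above); the `spike` function here is illustrative, not part of brainstate:

    import jax
    import jax.numpy as jnp

    # Forward: hard Heaviside step. Backward: sigmoid-shaped surrogate.
    @jax.custom_jvp
    def spike(x, alpha=4.0):
        return jnp.asarray(x >= 0, dtype=x.dtype)

    @spike.defjvp
    def spike_jvp(primals, tangents):
        x, alpha = primals
        tx, _ = tangents
        sg = jax.nn.sigmoid(alpha * x)
        # The tangent flows through the smooth surrogate derivative,
        # not the (zero almost everywhere) derivative of the step.
        return spike(x, alpha), alpha * sg * (1.0 - sg) * tx

    print(jax.grad(spike)(0.1))  # ~0.96: nonzero despite the hard step forward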
@@ -93,260 +94,262 @@ mlir.register_lowering(heaviside_p, mlir.lower_fun(_heaviside_imp, multiple_resu


 class Surrogate(object):
+    """The base surrogate gradient function.
+
+    To customize a surrogate gradient function, you can inherit this class and
+    implement the `surrogate_fun` and `surrogate_grad` methods.
+
+    Examples
+    --------
+
+    >>> import brainstate as bst
+    >>> import brainstate.nn as nn
+    >>> import jax.numpy as jnp
+
+    >>> class MySurrogate(bst.surrogate.Surrogate):
+    ...   def __init__(self, alpha=1.):
+    ...     super().__init__()
+    ...     self.alpha = alpha
+    ...
+    ...   def surrogate_fun(self, x):
+    ...     return jnp.sin(x) * self.alpha
+    ...
+    ...   def surrogate_grad(self, x):
+    ...     return jnp.cos(x) * self.alpha
+
+    """
+
+    def __call__(self, x):
+        dx = self.surrogate_grad(x)
+        return heaviside_p.bind(x, dx)[0]
+
+    def __repr__(self):
+        return f'{self.__class__.__name__}()'
+
+    def surrogate_fun(self, x) -> jax.Array:
+        """The surrogate function."""
+        raise NotImplementedError
+
+    def surrogate_grad(self, x) -> jax.Array:
+        """The gradient function of the surrogate function."""
+        raise NotImplementedError


 class Sigmoid(Surrogate):
+    """Spike function with the sigmoid-shaped surrogate gradient.
+
+    See Also
+    --------
+    sigmoid
+    """
+
+    def __init__(self, alpha: float = 4.):
+        super().__init__()
+        self.alpha = alpha
+
+    def surrogate_fun(self, x):
+        return sci.special.expit(self.alpha * x)
+
+    def surrogate_grad(self, x):
+        sgax = sci.special.expit(x * self.alpha)
+        dx = (1. - sgax) * sgax * self.alpha
+        return dx
+
+    def __repr__(self):
+        return f'{self.__class__.__name__}(alpha={self.alpha})'
+
+    def __hash__(self):
+        return hash((self.__class__, self.alpha))


 def sigmoid(
     x: jax.Array,
     alpha: float = 4.,
 ):
+    r"""Spike function with the sigmoid-shaped surrogate gradient.
+
+    If `origin=False`, computes the forward function:
+
+    .. math::
+
+       g(x) = \begin{cases}
+          1, & x \geq 0 \\
+          0, & x < 0 \\
+          \end{cases}
+
+    If `origin=True`, computes the original function:
+
+    .. math::
+
+       g(x) = \mathrm{sigmoid}(\alpha x) = \frac{1}{1+e^{-\alpha x}}
+
+    Backward function:
+
+    .. math::
+
+       g'(x) = \alpha (1 - \mathrm{sigmoid}(\alpha x)) \, \mathrm{sigmoid}(\alpha x)
+
+    .. plot::
+       :include-source: True
+
+       >>> import jax
+       >>> import brainstate.nn as nn
+       >>> import brainstate as bst
+       >>> import matplotlib.pyplot as plt
+       >>> xs = jax.numpy.linspace(-2, 2, 1000)
+       >>> for alpha in [1., 2., 4.]:
+       >>>   grads = bst.augment.vector_grad(bst.surrogate.sigmoid)(xs, alpha)
+       >>>   plt.plot(xs, grads, label=r'$\alpha$=' + str(alpha))
+       >>> plt.legend()
+       >>> plt.show()
+
+    Parameters
+    ----------
+    x: jax.Array, Array
+        The input data.
+    alpha: float
+        Parameter to control smoothness of gradient.
+
+    Returns
+    -------
+    out: jax.Array
+        The spiking state.
+    """
+    return Sigmoid(alpha=alpha)(x)


 class PiecewiseQuadratic(Surrogate):
+    """Judge spiking state with a piecewise quadratic function.
+
+    See Also
+    --------
+    piecewise_quadratic
+    """
+
+    def __init__(self, alpha: float = 1.):
+        super().__init__()
+        self.alpha = alpha
+
+    def surrogate_fun(self, x):
+        z = jnp.where(x < -1 / self.alpha,
+                      0.,
+                      jnp.where(x > 1 / self.alpha,
+                                1.,
+                                (-self.alpha * jnp.abs(x) / 2 + 1) * self.alpha * x + 0.5))
+        return z
+
+    def surrogate_grad(self, x):
+        dx = jnp.where(jnp.abs(x) > 1 / self.alpha, 0., (-(self.alpha * x) ** 2 + self.alpha))
+        return dx
+
+    def __repr__(self):
+        return f'{self.__class__.__name__}(alpha={self.alpha})'
+
+    def __hash__(self):
+        return hash((self.__class__, self.alpha))


 def piecewise_quadratic(
     x: jax.Array,
     alpha: float = 1.,
 ):
+    r"""Judge spiking state with a piecewise quadratic function [1]_ [2]_ [3]_ [4]_ [5]_.
+
+    If `origin=False`, computes the forward function:
+
+    .. math::
+
+       g(x) = \begin{cases}
+          1, & x \geq 0 \\
+          0, & x < 0 \\
+          \end{cases}
+
+    If `origin=True`, computes the original function:
+
+    .. math::
+
+       g(x) =
+          \begin{cases}
+          0, & x < -\frac{1}{\alpha} \\
+          -\frac{1}{2}\alpha^2|x|x + \alpha x + \frac{1}{2}, & |x| \leq \frac{1}{\alpha} \\
+          1, & x > \frac{1}{\alpha} \\
+          \end{cases}
+
+    Backward function:
+
+    .. math::
+
+       g'(x) =
+          \begin{cases}
+          0, & |x| > \frac{1}{\alpha} \\
+          -\alpha^2|x| + \alpha, & |x| \leq \frac{1}{\alpha}
+          \end{cases}
+
+    .. plot::
+       :include-source: True
+
+       >>> import jax
+       >>> import brainstate.nn as nn
+       >>> import brainstate as bst
+       >>> import matplotlib.pyplot as plt
+       >>> xs = jax.numpy.linspace(-3, 3, 1000)
+       >>> for alpha in [0.5, 1., 2., 4.]:
+       >>>   grads = bst.augment.vector_grad(bst.surrogate.piecewise_quadratic)(xs, alpha)
+       >>>   plt.plot(xs, grads, label=r'$\alpha$=' + str(alpha))
+       >>> plt.legend()
+       >>> plt.show()
+
+    Parameters
+    ----------
+    x: jax.Array, Array
+        The input data.
+    alpha: float
+        Parameter to control smoothness of gradient.
+
+    Returns
+    -------
+    out: jax.Array
+        The spiking state.
+
+    References
+    ----------
+    .. [1] Esser S K, Merolla P A, Arthur J V, et al. Convolutional networks for fast, energy-efficient neuromorphic computing[J]. Proceedings of the National Academy of Sciences, 2016, 113(41): 11441-11446.
+    .. [2] Wu Y, Deng L, Li G, et al. Spatio-temporal backpropagation for training high-performance spiking neural networks[J]. Frontiers in Neuroscience, 2018, 12: 331.
+    .. [3] Bellec G, Salaj D, Subramoney A, et al. Long short-term memory and learning-to-learn in networks of spiking neurons[C]//Proceedings of the 32nd International Conference on Neural Information Processing Systems. 2018: 795-805.
+    .. [4] Neftci E O, Mostafa H, Zenke F. Surrogate gradient learning in spiking neural networks: Bringing the power of gradient-based optimization to spiking neural networks[J]. IEEE Signal Processing Magazine, 2019, 36(6): 51-63.
+    .. [5] Panda P, Aketi S A, Roy K. Toward scalable, efficient, and accurate deep spiking neural networks with backward residual connections, stochastic softmax, and hybridization[J]. Frontiers in Neuroscience, 2020, 14.
+    """
+    return PiecewiseQuadratic(alpha=alpha)(x)


 class PiecewiseExp(Surrogate):
+    """Judge spiking state with a piecewise exponential function.
+
+    See Also
+    --------
+    piecewise_exp
+    """
+
+    def __init__(self, alpha: float = 1.):
+        super().__init__()
+        self.alpha = alpha
+
+    def surrogate_grad(self, x):
+        dx = (self.alpha / 2) * jnp.exp(-self.alpha * jnp.abs(x))
+        return dx
+
+    def surrogate_fun(self, x):
+        return jnp.where(x < 0, jnp.exp(self.alpha * x) / 2, 1 - jnp.exp(-self.alpha * x) / 2)
+
+    def __repr__(self):
+        return f'{self.__class__.__name__}(alpha={self.alpha})'
+
+    def __hash__(self):
+        return hash((self.__class__, self.alpha))
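Every class in this file follows the same pairing: `surrogate_fun` is the smooth function whose
derivative the analytic `surrogate_grad` is meant to be, and `Surrogate.__call__` feeds that
derivative into `heaviside_p`. A quick hedged consistency check (assuming brainstate 0.1.0 is
installed, as in the docstring examples) that autodiff of `Sigmoid.surrogate_fun` reproduces
the hand-written `surrogate_grad`:

    import jax
    import jax.numpy as jnp
    import brainstate as bst

    s = bst.surrogate.Sigmoid(alpha=4.0)
    xs = jnp.linspace(-2.0, 2.0, 7)

    # Autodiff of the smooth surrogate function ...
    auto = jax.vmap(jax.grad(s.surrogate_fun))(xs)
    # ... should agree with the analytic gradient used in the backward pass.
    print(jnp.allclose(auto, s.surrogate_grad(xs), atol=1e-5))  # True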
@@ -354,89 +357,90 @@ def piecewise_exp(
     alpha: float = 1.,

 ):
+    r"""Judge spiking state with a piecewise exponential function [1]_.
+
+    If `origin=False`, computes the forward function:
+
+    .. math::
+
+       g(x) = \begin{cases}
+          1, & x \geq 0 \\
+          0, & x < 0 \\
+          \end{cases}
+
+    If `origin=True`, computes the original function:
+
+    .. math::
+
+       g(x) = \begin{cases}
+          \frac{1}{2}e^{\alpha x}, & x < 0 \\
+          1 - \frac{1}{2}e^{-\alpha x}, & x \geq 0
+          \end{cases}
+
+    Backward function:
+
+    .. math::
+
+       g'(x) = \frac{\alpha}{2}e^{-\alpha |x|}
+
+    .. plot::
+       :include-source: True
+
+       >>> import jax
+       >>> import brainstate.nn as nn
+       >>> import brainstate as bst
+       >>> import matplotlib.pyplot as plt
+       >>> xs = jax.numpy.linspace(-3, 3, 1000)
+       >>> for alpha in [0.5, 1., 2., 4.]:
+       >>>   grads = bst.augment.vector_grad(bst.surrogate.piecewise_exp)(xs, alpha)
+       >>>   plt.plot(xs, grads, label=r'$\alpha$=' + str(alpha))
+       >>> plt.legend()
+       >>> plt.show()
+
+    Parameters
+    ----------
+    x: jax.Array, Array
+        The input data.
+    alpha: float
+        Parameter to control smoothness of gradient.
+
+    Returns
+    -------
+    out: jax.Array
+        The spiking state.
+
+    References
+    ----------
+    .. [1] Neftci E O, Mostafa H, Zenke F. Surrogate gradient learning in spiking neural networks: Bringing the power of gradient-based optimization to spiking neural networks[J]. IEEE Signal Processing Magazine, 2019, 36(6): 51-63.
+    """
+    return PiecewiseExp(alpha=alpha)(x)


 class SoftSign(Surrogate):
+    """Judge spiking state with a soft sign function.
+
+    See Also
+    --------
+    soft_sign
+    """
+
+    def __init__(self, alpha=1.):
+        super().__init__()
+        self.alpha = alpha
+
+    def surrogate_grad(self, x):
+        dx = self.alpha * 0.5 / (1 + jnp.abs(self.alpha * x)) ** 2
+        return dx
+
+    def surrogate_fun(self, x):
+        return x / (2 / self.alpha + 2 * jnp.abs(x)) + 0.5
+
+    def __repr__(self):
+        return f'{self.__class__.__name__}(alpha={self.alpha})'
+
+    def __hash__(self):
+        return hash((self.__class__, self.alpha))
@@ -444,84 +448,85 @@ def soft_sign(
     alpha: float = 1.,

 ):
+    r"""Judge spiking state with a soft sign function.
+
+    If `origin=False`, computes the forward function:
+
+    .. math::
+
+       g(x) = \begin{cases}
+          1, & x \geq 0 \\
+          0, & x < 0 \\
+          \end{cases}
+
+    If `origin=True`, computes the original function:
+
+    .. math::
+
+       g(x) = \frac{1}{2} (\frac{\alpha x}{1 + |\alpha x|} + 1)
+            = \frac{1}{2} (\frac{x}{\frac{1}{\alpha} + |x|} + 1)
+
+    Backward function:
+
+    .. math::
+
+       g'(x) = \frac{\alpha}{2(1 + |\alpha x|)^{2}} = \frac{1}{2\alpha(\frac{1}{\alpha} + |x|)^{2}}
+
+    .. plot::
+       :include-source: True
+
+       >>> import jax
+       >>> import brainstate.nn as nn
+       >>> import brainstate as bst
+       >>> import matplotlib.pyplot as plt
+       >>> xs = jax.numpy.linspace(-3, 3, 1000)
+       >>> for alpha in [0.5, 1., 2., 4.]:
+       >>>   grads = bst.augment.vector_grad(bst.surrogate.soft_sign)(xs, alpha)
+       >>>   plt.plot(xs, grads, label=r'$\alpha$=' + str(alpha))
+       >>> plt.legend()
+       >>> plt.show()
+
+    Parameters
+    ----------
+    x: jax.Array, Array
+        The input data.
+    alpha: float
+        Parameter to control smoothness of gradient.
+
+    Returns
+    -------
+    out: jax.Array
+        The spiking state.
+    """
+    return SoftSign(alpha=alpha)(x)


 class Arctan(Surrogate):
+    """Judge spiking state with an arctan function.
+
+    See Also
+    --------
+    arctan
+    """
+
+    def __init__(self, alpha=1.):
+        super().__init__()
+        self.alpha = alpha
+
+    def surrogate_grad(self, x):
+        dx = self.alpha * 0.5 / (1 + (jnp.pi / 2 * self.alpha * x) ** 2)
+        return dx
+
+    def surrogate_fun(self, x):
+        return jnp.arctan(jnp.pi / 2 * self.alpha * x) / jnp.pi + 0.5
+
+    def __repr__(self):
+        return f'{self.__class__.__name__}(alpha={self.alpha})'
+
+    def __hash__(self):
+        return hash((self.__class__, self.alpha))
@@ -529,83 +534,84 @@ def arctan(
     alpha: float = 1.,

 ):
+    r"""Judge spiking state with an arctan function.
+
+    If `origin=False`, computes the forward function:
+
+    .. math::
+
+       g(x) = \begin{cases}
+          1, & x \geq 0 \\
+          0, & x < 0 \\
+          \end{cases}
+
+    If `origin=True`, computes the original function:
+
+    .. math::
+
+       g(x) = \frac{1}{\pi} \arctan(\frac{\pi}{2}\alpha x) + \frac{1}{2}
+
+    Backward function:
+
+    .. math::
+
+       g'(x) = \frac{\alpha}{2(1 + (\frac{\pi}{2}\alpha x)^2)}
+
+    .. plot::
+       :include-source: True
+
+       >>> import jax
+       >>> import brainstate.nn as nn
+       >>> import brainstate as bst
+       >>> import matplotlib.pyplot as plt
+       >>> xs = jax.numpy.linspace(-3, 3, 1000)
+       >>> for alpha in [0.5, 1., 2., 4.]:
+       >>>   grads = bst.augment.vector_grad(bst.surrogate.arctan)(xs, alpha)
+       >>>   plt.plot(xs, grads, label=r'$\alpha$=' + str(alpha))
+       >>> plt.legend()
+       >>> plt.show()
+
+    Parameters
+    ----------
+    x: jax.Array, Array
+        The input data.
+    alpha: float
+        Parameter to control smoothness of gradient.
+
+    Returns
+    -------
+    out: jax.Array
+        The spiking state.
+    """
+    return Arctan(alpha=alpha)(x)


 class NonzeroSignLog(Surrogate):
+    """Judge spiking state with a nonzero sign log function.
+
+    See Also
+    --------
+    nonzero_sign_log
+    """
+
+    def __init__(self, alpha=1.):
+        super().__init__()
+        self.alpha = alpha
+
+    def surrogate_grad(self, x):
+        dx = 1. / (1 / self.alpha + jnp.abs(x))
+        return dx
+
+    def surrogate_fun(self, x):
+        return jnp.where(x < 0, -1., 1.) * jnp.log(jnp.abs(self.alpha * x) + 1)
+
+    def __repr__(self):
+        return f'{self.__class__.__name__}(alpha={self.alpha})'
+
+    def __hash__(self):
+        return hash((self.__class__, self.alpha))
@@ -613,96 +619,97 @@ def nonzero_sign_log(
     alpha: float = 1.,

 ):
+    r"""Judge spiking state with a nonzero sign log function.
+
+    If `origin=False`, computes the forward function:
+
+    .. math::
+
+       g(x) = \begin{cases}
+          1, & x \geq 0 \\
+          0, & x < 0 \\
+          \end{cases}
+
+    If `origin=True`, computes the original function:
+
+    .. math::
+
+       g(x) = \mathrm{NonzeroSign}(x) \log (|\alpha x| + 1)
+
+    where
+
+    .. math::
+
+       \begin{split}\mathrm{NonzeroSign}(x) =
+       \begin{cases}
+       1, & x \geq 0 \\
+       -1, & x < 0 \\
+       \end{cases}\end{split}
+
+    Backward function:
+
+    .. math::
+
+       g'(x) = \frac{\alpha}{1 + |\alpha x|} = \frac{1}{\frac{1}{\alpha} + |x|}
+
+    This surrogate function has the advantage of low computational cost in the backward pass.
+
+    .. plot::
+       :include-source: True
+
+       >>> import jax
+       >>> import brainstate.nn as nn
+       >>> import brainstate as bst
+       >>> import matplotlib.pyplot as plt
+       >>> xs = jax.numpy.linspace(-3, 3, 1000)
+       >>> for alpha in [0.5, 1., 2., 4.]:
+       >>>   grads = bst.augment.vector_grad(bst.surrogate.nonzero_sign_log)(xs, alpha)
+       >>>   plt.plot(xs, grads, label=r'$\alpha$=' + str(alpha))
+       >>> plt.legend()
+       >>> plt.show()
+
+    Parameters
+    ----------
+    x: jax.Array, Array
+        The input data.
+    alpha: float
+        Parameter to control smoothness of gradient.
+
+    Returns
+    -------
+    out: jax.Array
+        The spiking state.
+    """
+    return NonzeroSignLog(alpha=alpha)(x)


 class ERF(Surrogate):
+    """Judge spiking state with an erf function.
+
+    See Also
+    --------
+    erf
+    """
+
+    def __init__(self, alpha=1.):
+        super().__init__()
+        self.alpha = alpha
+
+    def surrogate_grad(self, x):
+        dx = (self.alpha / jnp.sqrt(jnp.pi)) * jnp.exp(-jnp.power(self.alpha, 2) * x * x)
+        return dx
+
+    def surrogate_fun(self, x):
+        return sci.special.erf(-self.alpha * x) * 0.5
+
+    def __repr__(self):
+        return f'{self.__class__.__name__}(alpha={self.alpha})'
+
+    def __hash__(self):
+        return hash((self.__class__, self.alpha))
@@ -710,99 +717,100 @@ def erf(
     alpha: float = 1.,

 ):
+    r"""Judge spiking state with an erf function [1]_ [2]_ [3]_.
+
+    If `origin=False`, computes the forward function:
+
+    .. math::
+
+       g(x) = \begin{cases}
+          1, & x \geq 0 \\
+          0, & x < 0 \\
+          \end{cases}
+
+    If `origin=True`, computes the original function:
+
+    .. math::
+
+       \begin{split}
+       g(x) &= \frac{1}{2}(1-\text{erf}(-\alpha x)) \\
+            &= \frac{1}{2} \text{erfc}(-\alpha x) \\
+            &= \frac{1}{\sqrt{\pi}}\int_{-\infty}^{\alpha x}e^{-t^2}dt
+       \end{split}
+
+    Backward function:
+
+    .. math::
+
+       g'(x) = \frac{\alpha}{\sqrt{\pi}}e^{-\alpha^2x^2}
+
+    .. plot::
+       :include-source: True
+
+       >>> import jax
+       >>> import brainstate.nn as nn
+       >>> import brainstate as bst
+       >>> import matplotlib.pyplot as plt
+       >>> xs = jax.numpy.linspace(-3, 3, 1000)
+       >>> for alpha in [0.5, 1., 2., 4.]:
+       >>>   grads = bst.augment.vector_grad(bst.surrogate.erf)(xs, alpha)
+       >>>   plt.plot(xs, grads, label=r'$\alpha$=' + str(alpha))
+       >>> plt.legend()
+       >>> plt.show()
+
+    Parameters
+    ----------
+    x: jax.Array, Array
+        The input data.
+    alpha: float
+        Parameter to control smoothness of gradient.
+
+    Returns
+    -------
+    out: jax.Array
+        The spiking state.
+
+    References
+    ----------
+    .. [1] Esser S K, Appuswamy R, Merolla P, et al. Backpropagation for energy-efficient neuromorphic computing[J]. Advances in Neural Information Processing Systems, 2015, 28: 1117-1125.
+    .. [2] Wu Y, Deng L, Li G, et al. Spatio-temporal backpropagation for training high-performance spiking neural networks[J]. Frontiers in Neuroscience, 2018, 12: 331.
+    .. [3] Yin B, Corradi F, Bohté S M. Effective and efficient computation with multiple-timescale spiking recurrent neural networks[C]//International Conference on Neuromorphic Systems 2020. 2020: 1-8.
+    """
+    return ERF(alpha=alpha)(x)


 class PiecewiseLeakyRelu(Surrogate):
+    """Judge spiking state with a piecewise leaky relu function.
+
+    See Also
+    --------
+    piecewise_leaky_relu
+    """
+
+    def __init__(self, c=0.01, w=1.):
+        super().__init__()
+        self.c = c
+        self.w = w
+
+    def surrogate_fun(self, x):
+        z = jnp.where(x < -self.w,
+                      self.c * x + self.c * self.w,
+                      jnp.where(x > self.w,
+                                self.c * x - self.c * self.w + 1,
+                                0.5 * x / self.w + 0.5))
+        return z
+
+    def surrogate_grad(self, x):
+        dx = jnp.where(jnp.abs(x) > self.w, self.c, 1 / self.w)
+        return dx
+
+    def __repr__(self):
+        return f'{self.__class__.__name__}(c={self.c}, w={self.w})'
+
+    def __hash__(self):
+        return hash((self.__class__, self.c, self.w))
@@ -811,119 +819,120 @@ def piecewise_leaky_relu(
     w: float = 1.,

 ):
+    r"""Judge spiking state with a piecewise leaky relu function [1]_ [2]_ [3]_ [4]_ [5]_ [6]_ [7]_ [8]_.
+
+    If `origin=False`, computes the forward function:
+
+    .. math::
+
+       g(x) = \begin{cases}
+          1, & x \geq 0 \\
+          0, & x < 0 \\
+          \end{cases}
+
+    If `origin=True`, computes the original function:
+
+    .. math::
+
+       \begin{split}g(x) =
+       \begin{cases}
+       cx + cw, & x < -w \\
+       \frac{1}{2w}x + \frac{1}{2}, & -w \leq x \leq w \\
+       cx - cw + 1, & x > w \\
+       \end{cases}\end{split}
+
+    Backward function:
+
+    .. math::
+
+       \begin{split}g'(x) =
+       \begin{cases}
+       \frac{1}{w}, & |x| \leq w \\
+       c, & |x| > w
+       \end{cases}\end{split}
+
+    .. plot::
+       :include-source: True
+
+       >>> import jax
+       >>> import brainstate.nn as nn
+       >>> import brainstate as bst
+       >>> import matplotlib.pyplot as plt
+       >>> xs = jax.numpy.linspace(-3, 3, 1000)
+       >>> for c in [0.01, 0.05, 0.1]:
+       >>>   for w in [1., 2.]:
+       >>>     grads1 = bst.augment.vector_grad(bst.surrogate.piecewise_leaky_relu)(xs, c=c, w=w)
+       >>>     plt.plot(xs, grads1, label=f'c={c}, w={w}')
+       >>> plt.legend()
+       >>> plt.show()
+
+    Parameters
+    ----------
+    x: jax.Array, Array
+        The input data.
+    c: float
+        When :math:`|x| > w` the gradient is `c`.
+    w: float
+        When :math:`|x| <= w` the gradient is `1 / w`.
+
+    Returns
+    -------
+    out: jax.Array
+        The spiking state.
+
+    References
+    ----------
+    .. [1] Yin S, Venkataramanaiah S K, Chen G K, et al. Algorithm and hardware design of discrete-time spiking neural networks based on back propagation with binary activations[C]//2017 IEEE Biomedical Circuits and Systems Conference (BioCAS). IEEE, 2017: 1-5.
+    .. [2] Wu Y, Deng L, Li G, et al. Spatio-temporal backpropagation for training high-performance spiking neural networks[J]. Frontiers in Neuroscience, 2018, 12: 331.
+    .. [3] Huh D, Sejnowski T J. Gradient descent for spiking neural networks[C]//Proceedings of the 32nd International Conference on Neural Information Processing Systems. 2018: 1440-1450.
+    .. [4] Wu Y, Deng L, Li G, et al. Direct training for spiking neural networks: Faster, larger, better[C]//Proceedings of the AAAI Conference on Artificial Intelligence. 2019, 33(01): 1311-1318.
+    .. [5] Gu P, Xiao R, Pan G, et al. STCA: Spatio-Temporal Credit Assignment with Delayed Feedback in Deep Spiking Neural Networks[C]//IJCAI. 2019: 1366-1372.
+    .. [6] Roy D, Chakraborty I, Roy K. Scaling deep spiking neural networks with binary stochastic activations[C]//2019 IEEE International Conference on Cognitive Computing (ICCC). IEEE, 2019: 50-58.
+    .. [7] Cheng X, Hao Y, Xu J, et al. LISNN: Improving Spiking Neural Networks with Lateral Interactions for Robust Object Recognition[C]//IJCAI. 1519-1525.
+    .. [8] Kaiser J, Mostafa H, Neftci E. Synaptic plasticity dynamics for deep continuous local learning (DECOLLE)[J]. Frontiers in Neuroscience, 2020, 14: 424.
+    """
+    return PiecewiseLeakyRelu(c=c, w=w)(x)


 class SquarewaveFourierSeries(Surrogate):
+    """Judge spiking state with a squarewave Fourier series.
+
+    See Also
+    --------
+    squarewave_fourier_series
+    """
+
+    def __init__(self, n=2, t_period=8.):
+        super().__init__()
+        self.n = n
+        self.t_period = t_period
+
+    def surrogate_grad(self, x):
+        w = jnp.pi * 2. / self.t_period
+        dx = jnp.cos(w * x)
+        for i in range(2, self.n):
+            dx += jnp.cos((2 * i - 1.) * w * x)
+        dx *= 4. / self.t_period
+        return dx
+
+    def surrogate_fun(self, x):
+        w = jnp.pi * 2. / self.t_period
+        ret = jnp.sin(w * x)
+        for i in range(2, self.n):
+            c = (2 * i - 1.)
+            ret += jnp.sin(c * w * x) / c
+        z = 0.5 + 2. / jnp.pi * ret
+        return z
+
+    def __repr__(self):
+        return f'{self.__class__.__name__}(n={self.n}, t_period={self.t_period})'
+
+    def __hash__(self):
+        return hash((self.__class__, self.n, self.t_period))
@@ -932,91 +941,92 @@ def squarewave_fourier_series(
     t_period: float = 8.,

 ):
+    r"""Judge spiking state with a squarewave Fourier series.
+
+    If `origin=False`, computes the forward function:
+
+    .. math::
+
+       g(x) = \begin{cases}
+          1, & x \geq 0 \\
+          0, & x < 0 \\
+          \end{cases}
+
+    If `origin=True`, computes the original function:
+
+    .. math::
+
+       g(x) = 0.5 + \frac{1}{\pi}\sum_{i=1}^n \frac{\sin\left((2i-1) \, 2\pi x / T\right)}{2i-1}
+
+    Backward function:
+
+    .. math::
+
+       g'(x) = \sum_{i=1}^n \frac{4\cos\left((2i-1) \, 2\pi x / T\right)}{T}
+
+    .. plot::
+       :include-source: True
+
+       >>> import jax
+       >>> import brainstate.nn as nn
+       >>> import brainstate as bst
+       >>> import matplotlib.pyplot as plt
+       >>> xs = jax.numpy.linspace(-3, 3, 1000)
+       >>> for n in [2, 4, 8]:
+       >>>   f = bst.surrogate.SquarewaveFourierSeries(n=n)
+       >>>   grads1 = bst.augment.vector_grad(f)(xs)
+       >>>   plt.plot(xs, grads1, label=f'n={n}')
+       >>> plt.legend()
+       >>> plt.show()
+
+    Parameters
+    ----------
+    x: jax.Array, Array
+        The input data.
+    n: int
+    t_period: float
+
+    Returns
+    -------
+    out: jax.Array
+        The spiking state.
+    """
+    return SquarewaveFourierSeries(n=n, t_period=t_period)(x)


 class S2NN(Surrogate):
+    """Judge spiking state with the S2NN surrogate spiking function.
+
+    See Also
+    --------
+    s2nn
+    """
+
+    def __init__(self, alpha=4., beta=1., epsilon=1e-8):
+        super().__init__()
+        self.alpha = alpha
+        self.beta = beta
+        self.epsilon = epsilon
+
+    def surrogate_fun(self, x):
+        z = jnp.where(x < 0.,
+                      sci.special.expit(x * self.alpha),
+                      self.beta * jnp.log(jnp.abs(x + 1.) + self.epsilon) + 0.5)
+        return z
+
+    def surrogate_grad(self, x):
+        sg = sci.special.expit(self.alpha * x)
+        dx = jnp.where(x < 0., self.alpha * sg * (1. - sg), self.beta / (x + 1.))
+        return dx
+
+    def __repr__(self):
+        return f'{self.__class__.__name__}(alpha={self.alpha}, beta={self.beta}, epsilon={self.epsilon})'
+
+    def __hash__(self):
+        return hash((self.__class__, self.alpha, self.beta, self.epsilon))
@@ -1026,101 +1036,102 @@ def s2nn(
     epsilon: float = 1e-8,

 ):
+    r"""Judge spiking state with the S2NN surrogate spiking function [1]_.
+
+    If `origin=False`, computes the forward function:
+
+    .. math::
+
+       g(x) = \begin{cases}
+          1, & x \geq 0 \\
+          0, & x < 0 \\
+          \end{cases}
+
+    If `origin=True`, computes the original function:
+
+    .. math::
+
+       \begin{split}g(x) = \begin{cases}
+       \mathrm{sigmoid}(\alpha x), & x < 0 \\
+       \beta \ln(|x + 1|) + 0.5, & x \ge 0
+       \end{cases}\end{split}
+
+    Backward function:
+
+    .. math::
+
+       \begin{split}g'(x) = \begin{cases}
+       \alpha (1 - \mathrm{sigmoid}(\alpha x)) \mathrm{sigmoid}(\alpha x), & x < 0 \\
+       \frac{\beta}{(x + 1)}, & x \ge 0
+       \end{cases}\end{split}
+
+    .. plot::
+       :include-source: True
+
+       >>> import jax
+       >>> import brainstate.nn as nn
+       >>> import brainstate as bst
+       >>> import matplotlib.pyplot as plt
+       >>> xs = jax.numpy.linspace(-3, 3, 1000)
+       >>> grads = bst.augment.vector_grad(bst.surrogate.s2nn)(xs, 4., 1.)
+       >>> plt.plot(xs, grads, label=r'$\alpha=4, \beta=1$')
+       >>> grads = bst.augment.vector_grad(bst.surrogate.s2nn)(xs, 8., 2.)
+       >>> plt.plot(xs, grads, label=r'$\alpha=8, \beta=2$')
+       >>> plt.legend()
+       >>> plt.show()
+
+    Parameters
+    ----------
+    x: jax.Array, Array
+        The input data.
+    alpha: float
+        The param that controls the gradient when ``x < 0``.
+    beta: float
+        The param that controls the gradient when ``x >= 0``.
+    epsilon: float
+        Small constant added inside the logarithm to avoid ``nan``.
+
+    Returns
+    -------
+    out: jax.Array
+        The spiking state.
+
+    References
+    ----------
+    .. [1] Suetake, Kazuma et al. "S2NN: Time Step Reduction of Spiking Surrogate Gradients for Training Energy Efficient Single-Step Neural Networks." ArXiv abs/2201.10879 (2022): n. pag.
+    """
+    return S2NN(alpha=alpha, beta=beta, epsilon=epsilon)(x)


 class QPseudoSpike(Surrogate):
+    """Judge spiking state with the q-PseudoSpike surrogate function.
+
+    See Also
+    --------
+    q_pseudo_spike
+    """
+
+    def __init__(self, alpha=2.):
+        super().__init__()
+        self.alpha = alpha
+
+    def surrogate_grad(self, x):
+        dx = jnp.power(1 + 2 / (self.alpha + 1) * jnp.abs(x), -self.alpha)
+        return dx
+
+    def surrogate_fun(self, x):
+        z = jnp.where(x < 0.,
+                      0.5 * jnp.power(1 - 2 / (self.alpha - 1) * jnp.abs(x), 1 - self.alpha),
+                      1. - 0.5 * jnp.power(1 + 2 / (self.alpha - 1) * jnp.abs(x), 1 - self.alpha))
+        return z
+
+    def __repr__(self):
+        return f'{self.__class__.__name__}(alpha={self.alpha})'
+
+    def __hash__(self):
+        return hash((self.__class__, self.alpha))
@@ -1128,91 +1139,92 @@ def q_pseudo_spike(
     alpha: float = 2.,

 ):
+    r"""Judge spiking state with the q-PseudoSpike surrogate function [1]_.
+
+    If `origin=False`, computes the forward function:
+
+    .. math::
+
+       g(x) = \begin{cases}
+          1, & x \geq 0 \\
+          0, & x < 0 \\
+          \end{cases}
+
+    If `origin=True`, computes the original function:
+
+    .. math::
+
+       \begin{split}g(x) =
+       \begin{cases}
+       \frac{1}{2}(1-\frac{2x}{\alpha-1})^{1-\alpha}, & x < 0 \\
+       1 - \frac{1}{2}(1+\frac{2x}{\alpha-1})^{1-\alpha}, & x \geq 0.
+       \end{cases}\end{split}
+
+    Backward function:
+
+    .. math::
+
+       g'(x) = (1+\frac{2|x|}{\alpha-1})^{-\alpha}
+
+    .. plot::
+       :include-source: True
+
+       >>> import jax
+       >>> import brainstate.nn as nn
+       >>> import brainstate as bst
+       >>> import matplotlib.pyplot as plt
+       >>> xs = jax.numpy.linspace(-3, 3, 1000)
+       >>> for alpha in [0.5, 1., 2., 4.]:
+       >>>   grads = bst.augment.vector_grad(bst.surrogate.q_pseudo_spike)(xs, alpha)
+       >>>   plt.plot(xs, grads, label=r'$\alpha=$' + str(alpha))
+       >>> plt.legend()
+       >>> plt.show()
+
+    Parameters
+    ----------
+    x: jax.Array, Array
+        The input data.
+    alpha: float
+        The parameter to control tail fatness of gradient.
+
+    Returns
+    -------
+    out: jax.Array
+        The spiking state.
+
+    References
+    ----------
+    .. [1] Herranz-Celotti, Luca and Jean Rouat. "Surrogate Gradients Design." ArXiv abs/2202.00282 (2022): n. pag.
+    """
+    return QPseudoSpike(alpha=alpha)(x)


 class LeakyRelu(Surrogate):
+    """Judge spiking state with the Leaky ReLU function.
+
+    See Also
+    --------
+    leaky_relu
+    """
+
+    def __init__(self, alpha=0.1, beta=1.):
+        super().__init__()
+        self.alpha = alpha
+        self.beta = beta
+
+    def surrogate_fun(self, x):
+        return jnp.where(x < 0., self.alpha * x, self.beta * x)
+
+    def surrogate_grad(self, x):
+        dx = jnp.where(x < 0., self.alpha, self.beta)
+        return dx
+
+    def __repr__(self):
+        return f'{self.__class__.__name__}(alpha={self.alpha}, beta={self.beta})'
+
+    def __hash__(self):
+        return hash((self.__class__, self.alpha, self.beta))
@@ -1221,100 +1233,101 @@ def leaky_relu(
|
|
1221
1233
|
beta: float = 1.,
|
1222
1234
|
|
1223
1235
|
):
|
1224
|
-
|
1236
|
+
r"""Judge spiking state with the Leaky ReLU function.
|
1225
1237
|
|
1226
|
-
|
1227
|
-
|
1228
|
-
.. math::
|
1229
|
-
|
1230
|
-
g(x) = \begin{cases}
|
1231
|
-
1, & x \geq 0 \\
|
1232
|
-
0, & x < 0 \\
|
1233
|
-
\end{cases}
|
1238
|
+
If `origin=False`, computes the forward function:
|
1234
1239
|
|
1235
|
-
|
1240
|
+
.. math::
|
1236
1241
|
|
1237
|
-
|
1242
|
+
g(x) = \begin{cases}
|
1243
|
+
1, & x \geq 0 \\
|
1244
|
+
0, & x < 0 \\
|
1245
|
+
\end{cases}
|
1238
1246
|
|
1239
|
-
|
1240
|
-
\begin{cases}
|
1241
|
-
\beta \cdot x, & x \geq 0 \\
|
1242
|
-
\alpha \cdot x, & x < 0 \\
|
1243
|
-
\end{cases}\end{split}
|
1244
|
-
|
1245
|
-
Backward function:
|
1246
|
-
|
1247
|
-
.. math::
|
1248
|
-
|
1249
|
-
\begin{split}g'(x) =
|
1250
|
-
\begin{cases}
|
1251
|
-
\beta, & x \geq 0 \\
|
1252
|
-
\alpha, & x < 0 \\
|
1253
|
-
\end{cases}\end{split}
|
1247
|
+
If `origin=True`, computes the original function:
|
1254
1248
|
|
1255
|
-
|
1256
|
-
:include-source: True
|
1249
|
+
.. math::
|
1257
1250
|
|
1258
|
-
|
1259
|
-
|
1260
|
-
|
1261
|
-
|
1262
|
-
|
1263
|
-
>>> plt.plot(xs, grads, label=r'$\alpha=0., \beta=1.$')
|
1264
|
-
>>> plt.legend()
|
1265
|
-
>>> plt.show()
|
1251
|
+
\begin{split}g(x) =
|
1252
|
+
\begin{cases}
|
1253
|
+
\beta \cdot x, & x \geq 0 \\
|
1254
|
+
\alpha \cdot x, & x < 0 \\
|
1255
|
+
\end{cases}\end{split}
|
1266
1256
|
|
1267
|
-
|
1268
|
-
----------
|
1269
|
-
x: jax.Array, Array
|
1270
|
-
The input data.
|
1271
|
-
alpha: float
|
1272
|
-
The parameter to control the gradient when :math:`x < 0`.
|
1273
|
-
beta: float
|
1274
|
-
The parameter to control the gradient when :math:`x >= 0`.
|
1257
|
+
Backward function:
|
1275
1258
|
|
1259
|
+
.. math::
|
1276
1260
|
|
1277
|
-
|
1278
|
-
|
1279
|
-
|
1280
|
-
|
1281
|
-
|
1282
|
-
|
1261
|
+
\begin{split}g'(x) =
|
1262
|
+
\begin{cases}
|
1263
|
+
\beta, & x \geq 0 \\
|
1264
|
+
\alpha, & x < 0 \\
|
1265
|
+
\end{cases}\end{split}
|
1266
|
+
|
1267
|
+
.. plot::
|
1268
|
+
:include-source: True
|
1269
|
+
|
1270
|
+
>>> import jax
|
1271
|
+
>>> import brainstate.nn as nn
|
1272
|
+
>>> import brainstate as bst
|
1273
|
+
>>> import matplotlib.pyplot as plt
|
1274
|
+
>>> xs = jax.numpy.linspace(-3, 3, 1000)
|
1275
|
+
>>> grads = bst.augment.vector_grad(bst.surrogate.leaky_relu)(xs, 0., 1.)
|
1276
|
+
>>> plt.plot(xs, grads, label=r'$\alpha=0., \beta=1.$')
|
1277
|
+
>>> plt.legend()
|
1278
|
+
>>> plt.show()
|
1279
|
+
|
1280
|
+
Parameters
|
1281
|
+
----------
|
1282
|
+
x: jax.Array, Array
|
1283
|
+
The input data.
|
1284
|
+
alpha: float
|
1285
|
+
The parameter to control the gradient when :math:`x < 0`.
|
1286
|
+
beta: float
|
1287
|
+
The parameter to control the gradient when :math:`x >= 0`.
|
1288
|
+
|
1289
|
+
|
1290
|
+
Returns
|
1291
|
+
-------
|
1292
|
+
out: jax.Array
|
1293
|
+
The spiking state.
|
1294
|
+
"""
|
1295
|
+
return LeakyRelu(alpha=alpha, beta=beta)(x)
|
1283
1296
|
|
1284
1297
|
|
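To make the forward/backward split above concrete, here is a minimal sketch in plain JAX (using jax.custom_jvp rather than brainstate's Surrogate machinery; the function names are ours) of a step spike whose backward pass is the leaky-ReLU surrogate gradient:

    import jax
    import jax.numpy as jnp

    @jax.custom_jvp
    def spike(x):
        return (x >= 0.).astype(x.dtype)  # forward: Heaviside step

    @spike.defjvp
    def spike_jvp(primals, tangents):
        x, = primals
        x_dot, = tangents
        alpha, beta = 0.1, 1.0
        surrogate = jnp.where(x < 0., alpha, beta)  # the documented g'(x)
        return spike(x), surrogate * x_dot

    grads = jax.vmap(jax.grad(spike))(jnp.linspace(-1., 1., 5))
    print(grads)  # [0.1 0.1 1.  1.  1. ]
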
class LogTailedRelu(Surrogate):
    """Judge spiking state with the Log-tailed ReLU function.

    See Also
    --------
    log_tailed_relu
    """

    def __init__(self, alpha=0.):
        super().__init__()
        self.alpha = alpha

    def surrogate_fun(self, x):
        z = jnp.where(x > 1,
                      jnp.log(x),
                      jnp.where(x > 0,
                                x,
                                self.alpha * x))
        return z

    def surrogate_grad(self, x):
        dx = jnp.where(x > 1,
                       1 / x,
                       jnp.where(x > 0,
                                 1.,
                                 self.alpha))
        return dx

    def __repr__(self):
        return f'{self.__class__.__name__}(alpha={self.alpha})'

    def __hash__(self):
        return hash((self.__class__, self.alpha))


def log_tailed_relu(
@@ -1322,93 +1335,94 @@ def log_tailed_relu(
    alpha: float = 0.,

):
    r"""Judge spiking state with the Log-tailed ReLU function [1]_.

    If `origin=False`, computes the forward function:

    .. math::

       g(x) = \begin{cases}
          1, & x \geq 0 \\
          0, & x < 0 \\
       \end{cases}

    If `origin=True`, computes the original function:

    .. math::

       \begin{split}g(x) =
          \begin{cases}
          \alpha x, & x \leq 0 \\
          x, & 0 < x \leq 1 \\
          \log(x), & x > 1 \\
          \end{cases}\end{split}

    Backward function:

    .. math::

       \begin{split}g'(x) =
          \begin{cases}
          \alpha, & x \leq 0 \\
          1, & 0 < x \leq 1 \\
          \frac{1}{x}, & x > 1 \\
          \end{cases}\end{split}

    .. plot::
       :include-source: True

       >>> import jax
       >>> import brainstate.nn as nn
       >>> import brainstate as bst
       >>> import matplotlib.pyplot as plt
       >>> xs = jax.numpy.linspace(-3, 3, 1000)
       >>> grads = bst.augment.vector_grad(bst.surrogate.log_tailed_relu)(xs, 0.)
       >>> plt.plot(xs, grads, label=r'$\alpha=0.$')
       >>> plt.legend()
       >>> plt.show()

    Parameters
    ----------
    x: jax.Array, Array
        The input data.
    alpha: float
        The parameter to control the gradient.

    Returns
    -------
    out: jax.Array
        The spiking state.

    References
    ----------
    .. [1] Cai, Zhaowei et al. "Deep Learning with Low Precision by Half-Wave Gaussian Quantization." 2017 IEEE Conference on Computer Vision and Pattern Recognition (CVPR) (2017): 5406-5414.
    """
    return LogTailedRelu(alpha=alpha)(x)

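The piecewise definition above is easy to evaluate directly; a small sketch (plain jax.numpy only, helper name ours) showing the three pieces of the `origin=True` function:

    import jax.numpy as jnp

    def log_tailed_relu_original(x, alpha=0.):
        # alpha*x for x <= 0, identity on (0, 1], log(x) beyond 1.
        return jnp.where(x > 1, jnp.log(x), jnp.where(x > 0, x, alpha * x))

    print(log_tailed_relu_original(jnp.array([-2., 0.5, jnp.e])))
    # [-0.   0.5  1. ]  -- the tail grows logarithmically rather than linearly
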
class ReluGrad(Surrogate):
    """Judge spiking state with the ReLU gradient function.

    See Also
    --------
    relu_grad
    """

    def __init__(self, alpha=0.3, width=1.):
        super().__init__()
        self.alpha = alpha
        self.width = width

    def surrogate_grad(self, x):
        dx = jnp.maximum(self.alpha * self.width - jnp.abs(x) * self.alpha, 0)
        return dx

    def __repr__(self):
        return f'{self.__class__.__name__}(alpha={self.alpha}, width={self.width})'

    def __hash__(self):
        return hash((self.__class__, self.alpha, self.width))


def relu_grad(
@@ -1416,80 +1430,81 @@ def relu_grad(
    alpha: float = 0.3,
    width: float = 1.,
):
    r"""Spike function with the ReLU gradient function [1]_.

    The forward function:

    .. math::

       g(x) = \begin{cases}
          1, & x \geq 0 \\
          0, & x < 0 \\
       \end{cases}

    Backward function:

    .. math::

       g'(x) = \text{ReLU}(\alpha * (\mathrm{width}-|x|))

    .. plot::
       :include-source: True

       >>> import jax
       >>> import brainstate.nn as nn
       >>> import brainstate as bst
       >>> import matplotlib.pyplot as plt
       >>> xs = jax.numpy.linspace(-3, 3, 1000)
       >>> for s in [0.5, 1.]:
       >>>   for w in [1, 2.]:
       >>>     grads = bst.augment.vector_grad(bst.surrogate.relu_grad)(xs, s, w)
       >>>     plt.plot(xs, grads, label=r'$\alpha=$' + f'{s}, width={w}')
       >>> plt.legend()
       >>> plt.show()

    Parameters
    ----------
    x: jax.Array, Array
        The input data.
    alpha: float
        The parameter to control the gradient.
    width: float
        The parameter to control the width of the gradient.

    Returns
    -------
    out: jax.Array
        The spiking state.

    References
    ----------
    .. [1] Neftci, E. O., Mostafa, H. & Zenke, F. Surrogate gradient learning in spiking neural networks. IEEE Signal Process. Mag. 36, 61–63 (2019).
    """
    return ReluGrad(alpha=alpha, width=width)(x)

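As a quick numeric check of the backward rule above (a sketch assuming only jax.numpy; the helper name is ours): the gradient is a triangle of height alpha*width that reaches zero at |x| = width:

    import jax.numpy as jnp

    def relu_surrogate_grad(x, alpha=0.3, width=1.):
        # ReLU(alpha * (width - |x|)), written as the class above computes it.
        return jnp.maximum(alpha * width - jnp.abs(x) * alpha, 0.)

    xs = jnp.array([-2., -1., 0., 0.5, 1., 2.])
    print(relu_surrogate_grad(xs))  # [0.   0.   0.3  0.15 0.   0.  ]
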
class GaussianGrad(Surrogate):
    """Judge spiking state with the Gaussian gradient function.

    See Also
    --------
    gaussian_grad
    """

    def __init__(self, sigma=0.5, alpha=0.5):
        super().__init__()
        self.sigma = sigma
        self.alpha = alpha

    def surrogate_grad(self, x):
        dx = jnp.exp(-(x ** 2) / (2 * jnp.power(self.sigma, 2))) / (jnp.sqrt(2 * jnp.pi) * self.sigma)
        return self.alpha * dx

    def __repr__(self):
        return f'{self.__class__.__name__}(alpha={self.alpha}, sigma={self.sigma})'

    def __hash__(self):
        return hash((self.__class__, self.alpha, self.sigma))


def gaussian_grad(
@@ -1497,86 +1512,87 @@ def gaussian_grad(
    sigma: float = 0.5,
    alpha: float = 0.5,
):
    r"""Spike function with the Gaussian gradient function [1]_.

    The forward function:

    .. math::

       g(x) = \begin{cases}
          1, & x \geq 0 \\
          0, & x < 0 \\
       \end{cases}

    Backward function:

    .. math::

       g'(x) = \alpha * \text{gaussian}(x, 0., \sigma)

    .. plot::
       :include-source: True

       >>> import jax
       >>> import brainstate.nn as nn
       >>> import brainstate as bst
       >>> import matplotlib.pyplot as plt
       >>> xs = jax.numpy.linspace(-3, 3, 1000)
       >>> for s in [0.5, 1., 2.]:
       >>>   grads = bst.augment.vector_grad(bst.surrogate.gaussian_grad)(xs, s, 0.5)
       >>>   plt.plot(xs, grads, label=r'$\alpha=0.5, \sigma=$' + str(s))
       >>> plt.legend()
       >>> plt.show()

    Parameters
    ----------
    x: jax.Array, Array
        The input data.
    sigma: float
        The parameter to control the variance of the gaussian distribution.
    alpha: float
        The parameter to control the scale of the gradient.

    Returns
    -------
    out: jax.Array
        The spiking state.

    References
    ----------
    .. [1] Yin, B., Corradi, F. & Bohté, S.M. Accurate and efficient time-domain classification with adaptive spiking recurrent neural networks. Nat Mach Intell 3, 905–913 (2021).
    """
    return GaussianGrad(sigma=sigma, alpha=alpha)(x)

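The backward rule g'(x) = alpha * gaussian(x, 0, sigma) can be written with the normal density spelled out; a minimal sketch assuming only jax.numpy (helper name ours):

    import jax.numpy as jnp

    def gaussian_surrogate_grad(x, sigma=0.5, alpha=0.5):
        # alpha times the N(0, sigma^2) density evaluated at x.
        pdf = jnp.exp(-x ** 2 / (2 * sigma ** 2)) / (jnp.sqrt(2 * jnp.pi) * sigma)
        return alpha * pdf

    print(gaussian_surrogate_grad(jnp.array([0.])))  # ~0.3989 at the peak for the defaults
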
class MultiGaussianGrad(Surrogate):
    """Judge spiking state with the multi-Gaussian gradient function.

    See Also
    --------
    multi_gaussian_grad
    """

    def __init__(self, h=0.15, s=6.0, sigma=0.5, scale=0.5):
        super().__init__()
        self.h = h
        self.s = s
        self.sigma = sigma
        self.scale = scale

    def surrogate_grad(self, x):
        g1 = jnp.exp(-x ** 2 / (2 * jnp.power(self.sigma, 2))) / (jnp.sqrt(2 * jnp.pi) * self.sigma)
        g2 = jnp.exp(-(x - self.sigma) ** 2 / (2 * jnp.power(self.s * self.sigma, 2))
                     ) / (jnp.sqrt(2 * jnp.pi) * self.s * self.sigma)
        g3 = jnp.exp(-(x + self.sigma) ** 2 / (2 * jnp.power(self.s * self.sigma, 2))
                     ) / (jnp.sqrt(2 * jnp.pi) * self.s * self.sigma)
        dx = g1 * (1. + self.h) - g2 * self.h - g3 * self.h
        return self.scale * dx

    def __repr__(self):
        return f'{self.__class__.__name__}(h={self.h}, s={self.s}, sigma={self.sigma}, scale={self.scale})'

    def __hash__(self):
        return hash((self.__class__, self.h, self.s, self.sigma, self.scale))


def multi_gaussian_grad(
@@ -1586,209 +1602,212 @@ def multi_gaussian_grad(
    sigma: float = 0.5,
    scale: float = 0.5,
):
    r"""Spike function with the multi-Gaussian gradient function [1]_.

    The forward function:

    .. math::

       g(x) = \begin{cases}
          1, & x \geq 0 \\
          0, & x < 0 \\
       \end{cases}

    Backward function:

    .. math::

       g'(x) = (1+h)\,\mathcal{N}(x; 0, \sigma^{2})
               - h\,\mathcal{N}(x; \sigma, (s\sigma)^{2})
               - h\,\mathcal{N}(x; -\sigma, (s\sigma)^{2})

    .. plot::
       :include-source: True

       >>> import jax
       >>> import brainstate.nn as nn
       >>> import brainstate as bst
       >>> import matplotlib.pyplot as plt
       >>> xs = jax.numpy.linspace(-3, 3, 1000)
       >>> grads = bst.augment.vector_grad(bst.surrogate.multi_gaussian_grad)(xs)
       >>> plt.plot(xs, grads)
       >>> plt.show()

    Parameters
    ----------
    x: jax.Array, Array
        The input data.
    h: float
        The hyper-parameter of the approximate function.
    s: float
        The hyper-parameter of the approximate function.
    sigma: float
        The gaussian sigma.
    scale: float
        The gradient scale.

    Returns
    -------
    out: jax.Array
        The spiking state.

    References
    ----------
    .. [1] Yin, B., Corradi, F. & Bohté, S.M. Accurate and efficient time-domain classification with adaptive spiking recurrent neural networks. Nat Mach Intell 3, 905–913 (2021).
    """
    return MultiGaussianGrad(h=h, s=s, sigma=sigma, scale=scale)(x)

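The three-term combination above is a tall central Gaussian minus two wide side Gaussians, which produces small negative lobes away from the threshold; a sketch of the same formula in plain jax.numpy (helper names ours):

    import jax.numpy as jnp

    def normal_pdf(x, mu, sigma):
        return jnp.exp(-(x - mu) ** 2 / (2 * sigma ** 2)) / (jnp.sqrt(2 * jnp.pi) * sigma)

    def multi_gaussian_surrogate_grad(x, h=0.15, s=6.0, sigma=0.5, scale=0.5):
        dx = ((1. + h) * normal_pdf(x, 0., sigma)
              - h * normal_pdf(x, sigma, s * sigma)
              - h * normal_pdf(x, -sigma, s * sigma))
        return scale * dx

    # Positive peak at 0; slightly negative values further out.
    print(multi_gaussian_surrogate_grad(jnp.array([0., 1., 2.])))
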
class InvSquareGrad(Surrogate):
    """Judge spiking state with the inverse-square surrogate gradient function.

    See Also
    --------
    inv_square_grad
    """

    def __init__(self, alpha=100.):
        super().__init__()
        self.alpha = alpha

    def surrogate_grad(self, x):
        dx = 1. / (self.alpha * jnp.abs(x) + 1.0) ** 2
        return dx

    def __repr__(self):
        return f'{self.__class__.__name__}(alpha={self.alpha})'

    def __hash__(self):
        return hash((self.__class__, self.alpha))


def inv_square_grad(
    x: jax.Array,
    alpha: float = 100.
):
    r"""Spike function with the inverse-square surrogate gradient.

    Forward function:

    .. math::

       g(x) = \begin{cases}
          1, & x \geq 0 \\
          0, & x < 0 \\
       \end{cases}

    Backward function:

    .. math::

       g'(x) = \frac{1}{(\alpha |x| + 1)^{2}}

    .. plot::
       :include-source: True

       >>> import jax
       >>> import brainstate.nn as nn
       >>> import brainstate as bst
       >>> import matplotlib.pyplot as plt
       >>> xs = jax.numpy.linspace(-1, 1, 1000)
       >>> for alpha in [1., 10., 100.]:
       >>>   grads = bst.augment.vector_grad(bst.surrogate.inv_square_grad)(xs, alpha)
       >>>   plt.plot(xs, grads, label=r'$\alpha$=' + str(alpha))
       >>> plt.legend()
       >>> plt.show()

    Parameters
    ----------
    x: jax.Array, Array
        The input data.
    alpha: float
        The parameter to control the smoothness of the gradient.

    Returns
    -------
    out: jax.Array
        The spiking state.
    """
    return InvSquareGrad(alpha=alpha)(x)

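A quick numeric check of the inverse-square rule above (plain jax.numpy, helper name ours): the gradient peaks at 1 for x = 0 and decays quadratically, so the default alpha = 100 makes it very sharp:

    import jax.numpy as jnp

    def inv_square_surrogate_grad(x, alpha=100.):
        return 1. / (alpha * jnp.abs(x) + 1.) ** 2

    print(inv_square_surrogate_grad(jnp.array([0., 0.01, 0.1])))
    # [1.      0.25    0.00826]
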
class SlayerGrad(Surrogate):
    """Judge spiking state with the SLAYER surrogate gradient function.

    See Also
    --------
    slayer_grad
    """

    def __init__(self, alpha=1.):
        super().__init__()
        self.alpha = alpha

    def surrogate_grad(self, x):
        dx = jnp.exp(-self.alpha * jnp.abs(x))
        return dx

    def __repr__(self):
        return f'{self.__class__.__name__}(alpha={self.alpha})'

    def __hash__(self):
        return hash((self.__class__, self.alpha))


def slayer_grad(
    x: jax.Array,
    alpha: float = 1.
):
    r"""Spike function with the SLAYER surrogate gradient function [1]_.

    Forward function:

    .. math::

       g(x) = \begin{cases}
          1, & x \geq 0 \\
          0, & x < 0 \\
       \end{cases}

    Backward function:

    .. math::

       g'(x) = \exp(-\alpha |x|)

    .. plot::
       :include-source: True

       >>> import jax
       >>> import brainstate.nn as nn
       >>> import brainstate as bst
       >>> import matplotlib.pyplot as plt
       >>> xs = jax.numpy.linspace(-3, 3, 1000)
       >>> for alpha in [0.5, 1., 2., 4.]:
       >>>   grads = bst.augment.vector_grad(bst.surrogate.slayer_grad)(xs, alpha)
       >>>   plt.plot(xs, grads, label=r'$\alpha$=' + str(alpha))
       >>> plt.legend()
       >>> plt.show()

    Parameters
    ----------
    x: jax.Array, Array
        The input data.
    alpha: float
        The parameter to control the smoothness of the gradient.

    Returns
    -------
    out: jax.Array
        The spiking state.

    References
    ----------
    .. [1] Shrestha, S. B. & Orchard, G. SLAYER: spike layer error reassignment in time. In Advances in Neural Information Processing Systems Vol. 31, 1412–1421 (NeurIPS, 2018).
    """
    return SlayerGrad(alpha=alpha)(x)

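Finally, the SLAYER gradient can be wired into a custom derivative the same way as the other rules here; a minimal sketch in plain JAX (jax.custom_jvp, not brainstate's Surrogate class; the names are ours):

    import jax
    import jax.numpy as jnp

    @jax.custom_jvp
    def spike(x):
        return (x >= 0.).astype(x.dtype)  # forward: Heaviside step

    @spike.defjvp
    def spike_jvp(primals, tangents):
        x, = primals
        x_dot, = tangents
        alpha = 1.0
        return spike(x), jnp.exp(-alpha * jnp.abs(x)) * x_dot  # g'(x) = exp(-alpha*|x|)

    print(jax.grad(spike)(0.5))  # exp(-0.5) ~ 0.6065
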