brainstate 0.0.2.post20241010__py2.py3-none-any.whl → 0.1.0.post20241122__py2.py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (184)
  1. benchmark/COBA_2005.py +125 -0
  2. benchmark/CUBA_2005.py +149 -0
  3. brainstate/__init__.py +31 -11
  4. brainstate/_state.py +760 -316
  5. brainstate/_state_test.py +41 -12
  6. brainstate/_utils.py +31 -4
  7. brainstate/augment/__init__.py +40 -0
  8. brainstate/augment/_autograd.py +611 -0
  9. brainstate/augment/_autograd_test.py +1193 -0
  10. brainstate/augment/_eval_shape.py +102 -0
  11. brainstate/augment/_eval_shape_test.py +40 -0
  12. brainstate/augment/_mapping.py +525 -0
  13. brainstate/augment/_mapping_test.py +210 -0
  14. brainstate/augment/_random.py +99 -0
  15. brainstate/{transform → compile}/__init__.py +25 -13
  16. brainstate/compile/_ad_checkpoint.py +204 -0
  17. brainstate/compile/_ad_checkpoint_test.py +51 -0
  18. brainstate/compile/_conditions.py +259 -0
  19. brainstate/compile/_conditions_test.py +221 -0
  20. brainstate/compile/_error_if.py +94 -0
  21. brainstate/compile/_error_if_test.py +54 -0
  22. brainstate/compile/_jit.py +314 -0
  23. brainstate/compile/_jit_test.py +143 -0
  24. brainstate/compile/_loop_collect_return.py +516 -0
  25. brainstate/compile/_loop_collect_return_test.py +59 -0
  26. brainstate/compile/_loop_no_collection.py +185 -0
  27. brainstate/compile/_loop_no_collection_test.py +51 -0
  28. brainstate/compile/_make_jaxpr.py +756 -0
  29. brainstate/compile/_make_jaxpr_test.py +134 -0
  30. brainstate/compile/_progress_bar.py +111 -0
  31. brainstate/compile/_unvmap.py +159 -0
  32. brainstate/compile/_util.py +147 -0
  33. brainstate/environ.py +408 -381
  34. brainstate/environ_test.py +34 -32
  35. brainstate/event/__init__.py +27 -0
  36. brainstate/event/_csr.py +316 -0
  37. brainstate/event/_csr_benchmark.py +14 -0
  38. brainstate/event/_csr_test.py +118 -0
  39. brainstate/event/_fixed_probability.py +708 -0
  40. brainstate/event/_fixed_probability_benchmark.py +128 -0
  41. brainstate/event/_fixed_probability_test.py +131 -0
  42. brainstate/event/_linear.py +359 -0
  43. brainstate/event/_linear_benckmark.py +82 -0
  44. brainstate/event/_linear_test.py +117 -0
  45. brainstate/{nn/event → event}/_misc.py +7 -7
  46. brainstate/event/_xla_custom_op.py +312 -0
  47. brainstate/event/_xla_custom_op_test.py +55 -0
  48. brainstate/functional/_activations.py +521 -511
  49. brainstate/functional/_activations_test.py +300 -300
  50. brainstate/functional/_normalization.py +43 -43
  51. brainstate/functional/_others.py +15 -15
  52. brainstate/functional/_spikes.py +49 -49
  53. brainstate/graph/__init__.py +33 -0
  54. brainstate/graph/_graph_context.py +443 -0
  55. brainstate/graph/_graph_context_test.py +65 -0
  56. brainstate/graph/_graph_convert.py +246 -0
  57. brainstate/graph/_graph_node.py +300 -0
  58. brainstate/graph/_graph_node_test.py +75 -0
  59. brainstate/graph/_graph_operation.py +1746 -0
  60. brainstate/graph/_graph_operation_test.py +724 -0
  61. brainstate/init/_base.py +28 -10
  62. brainstate/init/_generic.py +175 -172
  63. brainstate/init/_random_inits.py +470 -415
  64. brainstate/init/_random_inits_test.py +150 -0
  65. brainstate/init/_regular_inits.py +66 -69
  66. brainstate/init/_regular_inits_test.py +51 -0
  67. brainstate/mixin.py +236 -244
  68. brainstate/mixin_test.py +44 -46
  69. brainstate/nn/__init__.py +26 -51
  70. brainstate/nn/_collective_ops.py +199 -0
  71. brainstate/nn/_dyn_impl/__init__.py +46 -0
  72. brainstate/nn/_dyn_impl/_dynamics_neuron.py +290 -0
  73. brainstate/nn/_dyn_impl/_dynamics_neuron_test.py +162 -0
  74. brainstate/nn/_dyn_impl/_dynamics_synapse.py +315 -0
  75. brainstate/nn/_dyn_impl/_dynamics_synapse_test.py +132 -0
  76. brainstate/nn/_dyn_impl/_inputs.py +154 -0
  77. brainstate/nn/{event/__init__.py → _dyn_impl/_projection_alignpost.py} +8 -8
  78. brainstate/nn/_dyn_impl/_rate_rnns.py +400 -0
  79. brainstate/nn/_dyn_impl/_rate_rnns_test.py +64 -0
  80. brainstate/nn/_dyn_impl/_readout.py +128 -0
  81. brainstate/nn/_dyn_impl/_readout_test.py +54 -0
  82. brainstate/nn/_dynamics/__init__.py +37 -0
  83. brainstate/nn/_dynamics/_dynamics_base.py +631 -0
  84. brainstate/nn/_dynamics/_dynamics_base_test.py +79 -0
  85. brainstate/nn/_dynamics/_projection_base.py +346 -0
  86. brainstate/nn/_dynamics/_state_delay.py +453 -0
  87. brainstate/nn/_dynamics/_synouts.py +161 -0
  88. brainstate/nn/_dynamics/_synouts_test.py +58 -0
  89. brainstate/nn/_elementwise/__init__.py +22 -0
  90. brainstate/nn/_elementwise/_dropout.py +418 -0
  91. brainstate/nn/_elementwise/_dropout_test.py +100 -0
  92. brainstate/nn/_elementwise/_elementwise.py +1122 -0
  93. brainstate/nn/_elementwise/_elementwise_test.py +171 -0
  94. brainstate/nn/_exp_euler.py +97 -0
  95. brainstate/nn/_exp_euler_test.py +36 -0
  96. brainstate/nn/_interaction/__init__.py +41 -0
  97. brainstate/nn/_interaction/_conv.py +499 -0
  98. brainstate/nn/_interaction/_conv_test.py +239 -0
  99. brainstate/nn/_interaction/_embedding.py +59 -0
  100. brainstate/nn/_interaction/_linear.py +582 -0
  101. brainstate/nn/_interaction/_linear_test.py +42 -0
  102. brainstate/nn/_interaction/_normalizations.py +388 -0
  103. brainstate/nn/_interaction/_normalizations_test.py +75 -0
  104. brainstate/nn/_interaction/_poolings.py +1179 -0
  105. brainstate/nn/_interaction/_poolings_test.py +219 -0
  106. brainstate/nn/_module.py +328 -0
  107. brainstate/nn/_module_test.py +211 -0
  108. brainstate/nn/metrics.py +309 -309
  109. brainstate/optim/__init__.py +14 -2
  110. brainstate/optim/_base.py +66 -0
  111. brainstate/optim/_lr_scheduler.py +363 -400
  112. brainstate/optim/_lr_scheduler_test.py +25 -24
  113. brainstate/optim/_optax_optimizer.py +121 -176
  114. brainstate/optim/_optax_optimizer_test.py +41 -1
  115. brainstate/optim/_sgd_optimizer.py +950 -1025
  116. brainstate/random/_rand_funs.py +3269 -3268
  117. brainstate/random/_rand_funs_test.py +568 -0
  118. brainstate/random/_rand_seed.py +149 -117
  119. brainstate/random/_rand_seed_test.py +50 -0
  120. brainstate/random/_rand_state.py +1356 -1321
  121. brainstate/random/_random_for_unit.py +13 -13
  122. brainstate/surrogate.py +1262 -1243
  123. brainstate/{nn/_projection/_utils.py → transform.py} +1 -2
  124. brainstate/typing.py +157 -130
  125. brainstate/util/__init__.py +52 -0
  126. brainstate/util/_caller.py +100 -0
  127. brainstate/util/_dict.py +734 -0
  128. brainstate/util/_dict_test.py +160 -0
  129. brainstate/{nn/_projection/__init__.py → util/_error.py} +9 -13
  130. brainstate/util/_filter.py +178 -0
  131. brainstate/util/_others.py +497 -0
  132. brainstate/util/_pretty_repr.py +208 -0
  133. brainstate/util/_scaling.py +260 -0
  134. brainstate/util/_struct.py +524 -0
  135. brainstate/util/_tracers.py +75 -0
  136. brainstate/{_visualization.py → util/_visualization.py} +16 -16
  137. {brainstate-0.0.2.post20241010.dist-info → brainstate-0.1.0.post20241122.dist-info}/METADATA +11 -11
  138. brainstate-0.1.0.post20241122.dist-info/RECORD +144 -0
  139. {brainstate-0.0.2.post20241010.dist-info → brainstate-0.1.0.post20241122.dist-info}/top_level.txt +1 -0
  140. brainstate/_module.py +0 -1637
  141. brainstate/_module_test.py +0 -207
  142. brainstate/nn/_base.py +0 -251
  143. brainstate/nn/_connections.py +0 -686
  144. brainstate/nn/_dynamics.py +0 -426
  145. brainstate/nn/_elementwise.py +0 -1438
  146. brainstate/nn/_embedding.py +0 -66
  147. brainstate/nn/_misc.py +0 -133
  148. brainstate/nn/_normalizations.py +0 -389
  149. brainstate/nn/_others.py +0 -101
  150. brainstate/nn/_poolings.py +0 -1229
  151. brainstate/nn/_poolings_test.py +0 -231
  152. brainstate/nn/_projection/_align_post.py +0 -546
  153. brainstate/nn/_projection/_align_pre.py +0 -599
  154. brainstate/nn/_projection/_delta.py +0 -241
  155. brainstate/nn/_projection/_vanilla.py +0 -101
  156. brainstate/nn/_rate_rnns.py +0 -410
  157. brainstate/nn/_readout.py +0 -136
  158. brainstate/nn/_synouts.py +0 -166
  159. brainstate/nn/event/csr.py +0 -312
  160. brainstate/nn/event/csr_test.py +0 -118
  161. brainstate/nn/event/fixed_probability.py +0 -276
  162. brainstate/nn/event/fixed_probability_test.py +0 -127
  163. brainstate/nn/event/linear.py +0 -220
  164. brainstate/nn/event/linear_test.py +0 -111
  165. brainstate/random/random_test.py +0 -593
  166. brainstate/transform/_autograd.py +0 -585
  167. brainstate/transform/_autograd_test.py +0 -1181
  168. brainstate/transform/_conditions.py +0 -334
  169. brainstate/transform/_conditions_test.py +0 -220
  170. brainstate/transform/_error_if.py +0 -94
  171. brainstate/transform/_error_if_test.py +0 -55
  172. brainstate/transform/_jit.py +0 -265
  173. brainstate/transform/_jit_test.py +0 -118
  174. brainstate/transform/_loop_collect_return.py +0 -502
  175. brainstate/transform/_loop_no_collection.py +0 -170
  176. brainstate/transform/_make_jaxpr.py +0 -739
  177. brainstate/transform/_make_jaxpr_test.py +0 -131
  178. brainstate/transform/_mapping.py +0 -109
  179. brainstate/transform/_progress_bar.py +0 -111
  180. brainstate/transform/_unvmap.py +0 -143
  181. brainstate/util.py +0 -746
  182. brainstate-0.0.2.post20241010.dist-info/RECORD +0 -87
  183. {brainstate-0.0.2.post20241010.dist-info → brainstate-0.1.0.post20241122.dist-info}/LICENSE +0 -0
  184. {brainstate-0.0.2.post20241010.dist-info → brainstate-0.1.0.post20241122.dist-info}/WHEEL +0 -0
brainstate/augment/_autograd.py (new file)
@@ -0,0 +1,611 @@
+ # Copyright 2024 BDP Ecosystem Limited. All Rights Reserved.
+ #
+ # Licensed under the Apache License, Version 2.0 (the "License");
+ # you may not use this file except in compliance with the License.
+ # You may obtain a copy of the License at
+ #
+ #     http://www.apache.org/licenses/LICENSE-2.0
+ #
+ # Unless required by applicable law or agreed to in writing, software
+ # distributed under the License is distributed on an "AS IS" BASIS,
+ # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ # See the License for the specific language governing permissions and
+ # limitations under the License.
+ # ==============================================================================
+
+ """
+ Gradient transformations are relatively simple compared to ``vmap`` or ``pmap`` augmentations,
+ because most of them are computed at the Python level rather than through the Jaxpr. The one
+ exception is the ``checkpoint`` transformation, which has been moved into the ``compile`` module.
+
+ The wrapped gradient transformations here are made possible by two ideas:
+
+ 1. All states used to compute the gradients must be known before the transformation.
+    They must be provided through the ``grad_states`` argument of any gradient transformation.
+ 2. The states written inside the function must be collected and updated after the function call.
+    We record these states during the function call and update them afterwards.
+ """
+
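A minimal usage sketch of the two ideas above, assuming the top-level re-exports ``brainstate.State`` and ``brainstate.augment.grad`` that this module's imports and ``__all__`` suggest:

    import jax.numpy as jnp
    import brainstate

    w = brainstate.State(jnp.ones(3))        # state whose gradient is requested

    def loss(x):
        # reads ``w`` inside the function; any states written here are
        # recorded and written back by the transformation machinery
        return jnp.sum((w.value * x) ** 2)

    f_grad = brainstate.augment.grad(loss, grad_states=w)
    grads = f_grad(jnp.arange(3.0))          # gradients w.r.t. ``w.value``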
+ from __future__ import annotations
+
+ import inspect
+ from functools import partial, wraps
+ from typing import Union, Callable, Dict, Sequence, Optional, Any, Tuple, TypeVar, Iterator
+
+ import jax
+ from jax import numpy as jnp
+ from jax._src.api import _vjp
+ from jax.api_util import argnums_partial
+ from jax.extend import linear_util
+
+ from brainstate._state import State, StateTraceStack
+ from brainstate._utils import set_module_as
+ from brainstate.typing import PyTree, Missing
+ from brainstate.util import PrettyType, PrettyAttr, PrettyRepr
+
+ __all__ = [
+     'GradientTransform', 'vector_grad', 'grad', 'jacrev', 'jacfwd', 'jacobian', 'hessian',
+ ]
+
+ A = TypeVar('A')
+ Gradient = PyTree
+ LossValue = PyTree
+ AuxData = PyTree
+
+
+ def _isgeneratorfunction(fun):
+     # re-implemented here because of https://bugs.python.org/issue33261
+     while inspect.ismethod(fun):
+         fun = fun.__func__
+     while isinstance(fun, partial):
+         fun = fun.func
+     return inspect.isfunction(fun) and bool(fun.__code__.co_flags & inspect.CO_GENERATOR)
+
+
+ def _check_callable(fun):
+     # In Python 3.10+, the only thing stopping us from supporting staticmethods
+     # is that we can't take weak references to them, which the C++ JIT requires.
+     if isinstance(fun, staticmethod):
+         raise TypeError(f"staticmethod arguments are not supported, got {fun}")
+     if not callable(fun):
+         raise TypeError(f"Expected a callable value, got {fun}")
+     if _isgeneratorfunction(fun):
+         raise TypeError(f"Expected a function, got a generator function: {fun}")
+
+
+ def functional_vector_grad(func, argnums=0, return_value: bool = False, has_aux: bool = False):
+     """
+     Compute the gradient of a vector-valued function with respect to its input.
+     """
+     _check_callable(func)
+
+     @wraps(func)
+     def grad_fun(*args, **kwargs):
+         f = linear_util.wrap_init(func, kwargs)
+         f_partial, dyn_args = argnums_partial(f, argnums, args, require_static_args_hashable=False)
+         if has_aux:
+             y, vjp_fn, aux = _vjp(f_partial, *dyn_args, has_aux=True)
+         else:
+             y, vjp_fn = _vjp(f_partial, *dyn_args, has_aux=False)
+         leaves, tree = jax.tree.flatten(y)
+         tangents = jax.tree.unflatten(tree, [jnp.ones(l.shape, dtype=l.dtype) for l in leaves])
+         grads = vjp_fn(tangents)
+         if isinstance(argnums, int):
+             grads = grads[0]
+         if has_aux:
+             return (grads, y, aux) if return_value else (grads, aux)
+         else:
+             return (grads, y) if return_value else grads
+
+     return grad_fun
+
+
+ def _jacrev(fun, argnums=0, holomorphic=False, allow_int=False, has_aux=False, return_value=False):
+     @wraps(fun)
+     def fun_wrapped(*args, **kwargs):
+         if has_aux:
+             y, aux = fun(*args, **kwargs)
+             if return_value:
+                 return y, (y, aux)
+             else:
+                 return y, aux
+         else:
+             y = fun(*args, **kwargs)
+             if return_value:
+                 return y, y
+             else:
+                 return y, None
+
+     transform = jax.jacrev(fun_wrapped, argnums=argnums, holomorphic=holomorphic, allow_int=allow_int, has_aux=True)
+
+     @wraps(fun)
+     def jacfun(*args, **kwargs):
+         jac, aux = transform(*args, **kwargs)
+         if return_value:
+             return (jac, aux[0], aux[1]) if has_aux else (jac, aux)
+         else:
+             return (jac, aux) if has_aux else jac
+
+     return jacfun
+
+
+ def _jacfwd(fun, argnums=0, holomorphic=False, has_aux=False, return_value=False):
+     @wraps(fun)
+     def fun_wrapped(*args, **kwargs):
+         if has_aux:
+             y, aux = fun(*args, **kwargs)
+             if return_value:
+                 return y, (y, aux)
+             else:
+                 return y, aux
+         else:
+             y = fun(*args, **kwargs)
+             if return_value:
+                 return y, y
+             else:
+                 return y, None
+
+     transform = jax.jacfwd(fun_wrapped, argnums=argnums, holomorphic=holomorphic, has_aux=True)
+
+     @wraps(fun)
+     def jacfun(*args, **kwargs):
+         jac, aux = transform(*args, **kwargs)
+         if return_value:
+             return (jac, aux[0], aux[1]) if has_aux else (jac, aux)
+         else:
+             return (jac, aux) if has_aux else jac
+
+     return jacfun
+
+
+ TransformFn = Callable
+
+
+ class GradientTransform(PrettyRepr):
+     """
+     Automatic Differentiation Transformations for the ``State`` system.
+     """
+     __module__ = "brainstate.augment"
+
+     def __init__(
+         self,
+         target: Callable,
+         transform: TransformFn,
+         grad_states: Optional[Union[State, Sequence[State], Dict[str, State]]] = None,
+         argnums: Optional[Union[int, Sequence[int]]] = None,
+         return_value: bool = False,
+         has_aux: bool = False,
+         transform_params: Optional[Dict[str, Any]] = None,
+     ):
+         # gradient variables
+         if isinstance(grad_states, dict):
+             grad_states = {k: v for k, v in grad_states.items()}
+         self._grad_states, self._grad_tree = jax.tree.flatten(grad_states)
+         if any(not isinstance(v, State) for v in self._grad_states):
+             raise TypeError("All grad_states must be State instances.")
+
+         # parameters
+         if argnums is None and len(self._grad_states) == 0:
+             argnums = 0
+         if argnums is None:
+             assert len(self._grad_states) > 0
+             _argnums = 0
+         elif isinstance(argnums, int):
+             _argnums = (0, argnums + 1) if len(self._grad_states) > 0 else (argnums + 1)
+         else:
+             assert isinstance(argnums, (tuple, list))
+             _argnums = tuple(a + 1 for a in argnums)
+             if len(self._grad_states) > 0:
+                 _argnums = (0,) + _argnums
+         self._nonvar_argnums = argnums
+         self._argnums = _argnums
+         self._return_value = return_value
+         self._has_aux = has_aux
+
+         # target
+         self.target = target
+
+         # transform
+         self._states_to_be_written: Tuple[State, ...] = None
+         _grad_setting = dict() if transform_params is None else transform_params
+         if self._has_aux:
+             self._transform = transform(self._fun_with_aux, argnums=self._argnums, has_aux=True, **_grad_setting)
+         else:
+             self._transform = transform(self._fun_without_aux, argnums=self._argnums, has_aux=True, **_grad_setting)
+
+     def __pretty_repr__(self) -> Iterator[Union[PrettyType, PrettyAttr]]:
+         yield PrettyType(self.__class__.__name__)
+         yield PrettyAttr("target", self.target)
+         yield PrettyAttr("grad_states", self._grad_states)
+         yield PrettyAttr("grad_tree", self._grad_tree)
+         yield PrettyAttr("argnums", self._nonvar_argnums)
+         yield PrettyAttr("return_value", self._return_value)
+         yield PrettyAttr("has_aux", self._has_aux)
+         yield PrettyAttr("transform", self._transform)
+
+     def _call_target(self, *args, **kwargs):
+         if self._states_to_be_written is None:
+             with StateTraceStack() as stack:
+                 output = self.target(*args, **kwargs)
+                 # grad_ids = set([id(v) for v in self._grad_states])
+                 # self._states_to_be_written = [st for st in stack.get_write_states() if id(st) not in grad_ids]
+                 self._states_to_be_written = [st for st in stack.get_write_states()]
+         else:
+             output = self.target(*args, **kwargs)
+         return output
+
+     def _fun_with_aux(self, grad_values: tuple, *args, **kwargs):
+         for v, d in zip(self._grad_states, grad_values):
+             v.restore_value(d)
+         # Users should return the auxiliary data like::
+         # >>> # 1. example of return one data
+         # >>> return scalar_loss, data
+         # >>> # 2. example of return multiple data
+         # >>> return scalar_loss, (data1, data2, ...)
+         outs = self._call_target(*args, **kwargs)
+         # outputs: [0] is the value for gradient,
+         #          [1] is other values for return
+         assert self._states_to_be_written is not None, "The states to be written should be collected."
+         return outs[0], (outs, [v.value for v in self._grad_states], [v.value for v in self._states_to_be_written])
+
+     def _fun_without_aux(self, grad_values: tuple, *args, **kwargs):
+         for v, d in zip(self._grad_states, grad_values):
+             v.restore_value(d)
+         # Users should return the scalar value like this::
+         # >>> return scalar_loss
+         out = self._call_target(*args, **kwargs)
+         assert self._states_to_be_written is not None, "The states to be written should be collected."
+         return out, (out, [v.value for v in self._grad_states], [v.value for v in self._states_to_be_written])
+
+     def _return(self, rets):
+         grads, (outputs, new_grad_vals, new_dyn_vals) = rets
+         for i, val in enumerate(new_grad_vals):
+             self._grad_states[i].restore_value(val)
+         for i, val in enumerate(new_dyn_vals):
+             self._states_to_be_written[i].value = val
+
+         # check returned grads
+         if len(self._grad_states) > 0:
+             if self._nonvar_argnums is None:
+                 grads = self._grad_tree.unflatten(grads)
+             else:
+                 var_grads = self._grad_tree.unflatten(grads[0])
+                 arg_grads = grads[1] if isinstance(self._nonvar_argnums, int) else grads[1:]
+                 grads = (var_grads, arg_grads)
+
+         # check returned value
+         if self._return_value:
+             # check aux
+             if self._has_aux:
+                 return grads, outputs[0], outputs[1]
+             else:
+                 return grads, outputs
+         else:
+             # check aux
+             if self._has_aux:
+                 return grads, outputs[1]
+             else:
+                 return grads
+
+     def __call__(
+         self, *args, **kwargs
+     ) -> Gradient | Tuple[Gradient, LossValue] | Tuple[Gradient, AuxData] | Tuple[Gradient, LossValue, AuxData]:
+         rets = self._transform([v.value for v in self._grad_states], *args, **kwargs)
+         return self._return(rets)
+
+
+ _doc_of_return = '''
+
+     1. When ``grad_states`` is None
+         - ``has_aux=False`` + ``return_value=False`` => ``arg_grads``.
+         - ``has_aux=True`` + ``return_value=False`` => ``(arg_grads, aux_data)``.
+         - ``has_aux=False`` + ``return_value=True`` => ``(arg_grads, loss_value)``.
+         - ``has_aux=True`` + ``return_value=True`` => ``(arg_grads, loss_value, aux_data)``.
+     2. When ``grad_states`` is not None and ``argnums`` is None
+         - ``has_aux=False`` + ``return_value=False`` => ``var_grads``.
+         - ``has_aux=True`` + ``return_value=False`` => ``(var_grads, aux_data)``.
+         - ``has_aux=False`` + ``return_value=True`` => ``(var_grads, loss_value)``.
+         - ``has_aux=True`` + ``return_value=True`` => ``(var_grads, loss_value, aux_data)``.
+     3. When ``grad_states`` is not None and ``argnums`` is not None
+         - ``has_aux=False`` + ``return_value=False`` => ``(var_grads, arg_grads)``.
+         - ``has_aux=True`` + ``return_value=False`` => ``((var_grads, arg_grads), aux_data)``.
+         - ``has_aux=False`` + ``return_value=True`` => ``((var_grads, arg_grads), loss_value)``.
+         - ``has_aux=True`` + ``return_value=True`` => ``((var_grads, arg_grads), loss_value, aux_data)``.
+
+ '''
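For instance, case 3 above unpacks as follows (a sketch reusing the hypothetical ``w``, ``loss``, and imports from the earlier example, with ``has_aux=False``):

    f_grad = brainstate.augment.grad(loss, grad_states={'w': w}, argnums=0, return_value=True)
    (var_grads, arg_grads), loss_value = f_grad(jnp.arange(3.0))
    # ``var_grads`` mirrors the structure of ``grad_states``, i.e. {'w': ...};
    # ``arg_grads`` is the gradient w.r.t. positional argument 0.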
+
+
+ @set_module_as("brainstate.augment")
+ def grad(
+     fun: Callable = Missing(),
+     grad_states: Optional[Union[State, Sequence[State], Dict[str, State]]] = None,
+     argnums: Optional[Union[int, Sequence[int]]] = None,
+     holomorphic: Optional[bool] = False,
+     allow_int: Optional[bool] = False,
+     reduce_axes: Optional[Sequence[str]] = (),
+     has_aux: Optional[bool] = None,
+     return_value: Optional[bool] = False,
+ ) -> GradientTransform | Callable[[Callable], GradientTransform]:
+     """
+     Compute the gradient of a scalar-valued function with respect to its arguments.
+
+     %s
+
+     Args:
+         fun: callable. The scalar-valued function to be differentiated.
+         grad_states: (State, Sequence[State], Dict[str, State]) optional. The variables
+             in ``fun`` to take their gradients.
+         argnums: (int or tuple of ints) optional. Specifies which positional
+             argument(s) to differentiate with respect to.
+         holomorphic: (bool) optional. Whether ``fun`` is promised to be holomorphic.
+             Default False.
+         allow_int: (bool) optional. Whether to allow differentiating with respect to
+             integer valued inputs. The gradient of an integer input will have a trivial
+             vector-space dtype (float0). Default False.
+         reduce_axes: (Sequence[str]) optional. Named axes to reduce gradients over.
+             If an axis listed here is mapped and ``fun`` implicitly broadcasts a value
+             over it, the backward pass sums the corresponding gradient across that axis.
+             The default, (), performs no reduction.
+         has_aux: (bool) optional. Indicates whether ``fun`` returns a pair where the
+             first element is considered the output of the mathematical function to be
+             differentiated and the second element is auxiliary data. Default False.
+         return_value: (bool) optional. Indicates whether to return the value of the
+             function along with the gradient. Default False.
+
+     Returns:
+         A function which computes the gradient of ``fun``. The function takes the same
+         arguments as ``fun``, but returns the gradient instead. If ``has_aux`` is True,
+         the function returns a pair where the first element is the gradient and the
+         second element is the auxiliary data. If ``return_value`` is True, the function
+         returns a pair where the first element is the gradient and the second element
+         is the value of the function.
+     """
+     if isinstance(fun, Missing):
+         def transform(fun) -> GradientTransform:
+             return GradientTransform(target=fun,
+                                      transform=jax.grad,
+                                      grad_states=grad_states,
+                                      argnums=argnums,
+                                      return_value=return_value,
+                                      has_aux=False if has_aux is None else has_aux,
+                                      transform_params=dict(holomorphic=holomorphic,
+                                                            allow_int=allow_int,
+                                                            reduce_axes=reduce_axes))
+
+         return transform
+
+     return GradientTransform(target=fun,
+                              transform=jax.grad,
+                              grad_states=grad_states,
+                              argnums=argnums,
+                              return_value=return_value,
+                              has_aux=False if has_aux is None else has_aux,
+                              transform_params=dict(holomorphic=holomorphic,
+                                                    allow_int=allow_int,
+                                                    reduce_axes=reduce_axes))
+
+
+ grad.__doc__ = grad.__doc__ % _doc_of_return
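Because ``fun`` defaults to ``Missing()``, ``grad`` can also be applied as a decorator; a short sketch with the same hypothetical ``w`` as above:

    @brainstate.augment.grad(grad_states=w, return_value=True)
    def loss(x):
        return jnp.sum((w.value * x) ** 2)

    grads, loss_value = loss(jnp.arange(3.0))   # case 2 above with return_value=True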
+
+
+ @set_module_as("brainstate.augment")
+ def vector_grad(
+     func: Callable = Missing(),
+     grad_states: Optional[Union[State, Sequence[State], Dict[str, State]]] = None,
+     argnums: Optional[Union[int, Sequence[int]]] = None,
+     return_value: bool = False,
+     has_aux: Optional[bool] = None,
+ ) -> GradientTransform | Callable[[Callable], GradientTransform]:
+     """Take vector-valued gradients for function ``func``.
+
+     As with :py:func:`grad`, :py:func:`jacrev`, and :py:func:`jacfwd`, the returned
+     values differ depending on the argument settings.
+
+     %s
+
+     Parameters
+     ----------
+     func: Callable
+         Function whose gradient is to be computed.
+     grad_states : optional, State, sequence of State, dict
+         The variables in ``func`` to take their gradients.
+     has_aux: optional, bool
+         Indicates whether ``func`` returns a pair where the
+         first element is considered the output of the mathematical function to be
+         differentiated and the second element is auxiliary data. Default False.
+     return_value : bool
+         Whether to return the loss value.
+     argnums: optional, integer or sequence of integers
+         Specifies which positional argument(s) to differentiate with respect to
+         (default ``0``).
+
+     Returns
+     -------
+     func : GradientTransform
+         The vector gradient function.
+     """
+
+     if isinstance(func, Missing):
+         def transform(fun) -> GradientTransform:
+             return GradientTransform(target=fun,
+                                      transform=functional_vector_grad,
+                                      grad_states=grad_states,
+                                      argnums=argnums,
+                                      return_value=return_value,
+                                      has_aux=False if has_aux is None else has_aux)
+
+         return transform
+
+     else:
+         return GradientTransform(target=func,
+                                  transform=functional_vector_grad,
+                                  grad_states=grad_states,
+                                  argnums=argnums,
+                                  return_value=return_value,
+                                  has_aux=False if has_aux is None else has_aux)
+
+
+ vector_grad.__doc__ = vector_grad.__doc__ % _doc_of_return
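A small sketch of ``vector_grad`` on a vector-valued function (hypothetical names; the result equals the gradient of the summed outputs, i.e. the elementwise derivative here):

    def f(x):
        return x ** 3 + 2.0 * x

    df = brainstate.augment.vector_grad(f)
    df(jnp.array([1.0, 2.0]))    # expected: 3 * x**2 + 2, evaluated elementwise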
+
+
+ @set_module_as("brainstate.augment")
+ def jacrev(
+     fun: Callable,
+     grad_states: Optional[Union[State, Sequence[State], Dict[str, State]]] = None,
+     argnums: Optional[Union[int, Sequence[int]]] = None,
+     has_aux: Optional[bool] = None,
+     return_value: bool = False,
+     holomorphic: bool = False,
+     allow_int: bool = False,
+ ) -> GradientTransform:
+     """
+     Extend the automatic reverse-mode Jacobian of ``fun`` to classes.
+
+     This function extends the official JAX ``jacrev`` to enable automatic Jacobian
+     computation for both plain functions and class methods. Moreover, it supports
+     returning the function value (``return_value``) and auxiliary data (``has_aux``).
+
+     %s
+
+     Parameters
+     ----------
+     fun: Callable
+         Function whose Jacobian is to be computed.
+     grad_states : optional, State, sequence of State, dict
+         The variables in ``fun`` to take their gradients.
+     has_aux: optional, bool
+         Indicates whether ``fun`` returns a pair where the
+         first element is considered the output of the mathematical function to be
+         differentiated and the second element is auxiliary data. Default False.
+     return_value : bool
+         Whether to return the loss value.
+     argnums: optional, integer or sequence of integers
+         Specifies which positional argument(s) to differentiate with respect to
+         (default ``0``).
+     holomorphic: optional, bool
+         Indicates whether ``fun`` is promised to be holomorphic. Default False.
+     allow_int: optional, bool
+         Whether to allow differentiating with respect to integer valued inputs.
+         The gradient of an integer input will have a trivial vector-space dtype
+         (float0). Default False.
+
+     Returns
+     -------
+     fun: GradientTransform
+         The transformed object.
+     """
+     return GradientTransform(target=fun,
+                              transform=_jacrev,
+                              grad_states=grad_states,
+                              argnums=argnums,
+                              return_value=return_value,
+                              has_aux=False if has_aux is None else has_aux,
+                              transform_params=dict(holomorphic=holomorphic,
+                                                    allow_int=allow_int))
+
+
+ jacrev.__doc__ = jacrev.__doc__ % _doc_of_return
+
+ jacobian = jacrev
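A sketch of the Jacobian wrappers on a hypothetical function; ``jacfwd`` below accepts the same arguments except ``allow_int``:

    def f(x):
        return jnp.stack([x[0] ** 2, x[0] * x[1]])

    x = jnp.array([1.0, 2.0])
    J_rev = brainstate.augment.jacrev(f)(x)   # 2x2 Jacobian via reverse mode
    J_fwd = brainstate.augment.jacfwd(f)(x)   # same Jacobian via forward mode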
+
+
+ @set_module_as("brainstate.augment")
+ def jacfwd(
+     func: Callable,
+     grad_states: Optional[Union[State, Sequence[State], Dict[str, State]]] = None,
+     argnums: Optional[Union[int, Sequence[int]]] = None,
+     has_aux: Optional[bool] = None,
+     return_value: bool = False,
+     holomorphic: bool = False,
+ ) -> GradientTransform:
+     """Extend the automatic forward-mode Jacobian of ``func`` to classes.
+
+     This function extends the official JAX ``jacfwd`` to enable automatic Jacobian
+     computation for both plain functions and class methods. Moreover, it supports
+     returning the function value (``return_value``) and auxiliary data (``has_aux``).
+
+     %s
+
+     Parameters
+     ----------
+     func: Callable
+         Function whose Jacobian is to be computed.
+     grad_states : optional, State, sequence of State, dict
+         The variables in ``func`` to take their gradients.
+     has_aux: optional, bool
+         Indicates whether ``func`` returns a pair where the
+         first element is considered the output of the mathematical function to be
+         differentiated and the second element is auxiliary data. Default False.
+     return_value : bool
+         Whether to return the loss value.
+     argnums: optional, integer or sequence of integers
+         Specifies which positional argument(s) to differentiate with respect to
+         (default ``0``).
+     holomorphic: optional, bool
+         Indicates whether ``func`` is promised to be holomorphic. Default False.
+
+     Returns
+     -------
+     obj: GradientTransform
+         The transformed object.
+     """
+
+     return GradientTransform(target=func,
+                              transform=_jacfwd,
+                              grad_states=grad_states,
+                              argnums=argnums,
+                              return_value=return_value,
+                              has_aux=False if has_aux is None else has_aux,
+                              transform_params=dict(holomorphic=holomorphic))
+
+
+ jacfwd.__doc__ = jacfwd.__doc__ % _doc_of_return
+
+
+ @set_module_as("brainstate.augment")
+ def hessian(
+     func: Callable,
+     grad_states: Optional[Union[State, Sequence[State], Dict[str, State]]] = None,
+     argnums: Optional[Union[int, Sequence[int]]] = None,
+     has_aux: bool = False,
+     return_value: bool = False,
+     holomorphic: bool = False,
+ ) -> GradientTransform:
+     """
+     Hessian of ``func`` as a dense array.
+
+     %s
+
+     Parameters
+     ----------
+     func : callable
+         Function whose Hessian is to be computed. Its arguments at positions
+         specified by ``argnums`` should be arrays, scalars, or standard Python
+         containers thereof. It should return arrays, scalars, or standard Python
+         containers thereof.
+     grad_states : optional, State, sequence of State, dict
+         The variables in ``func`` to take their gradients.
+     argnums: optional, integer or sequence of integers
+         Specifies which positional argument(s) to differentiate with respect to (default ``0``).
+     holomorphic : bool
+         Indicates whether ``func`` is promised to be holomorphic. Default False.
+     return_value : bool
+         Whether to return the value of ``func`` along with the Hessian.
+
+     Returns
+     -------
+     obj: GradientTransform
+         The transformed object.
+     """
+     return GradientTransform(target=func,
+                              transform=jax.hessian,
+                              grad_states=grad_states,
+                              argnums=argnums,
+                              return_value=return_value,
+                              has_aux=False if has_aux is None else has_aux,
+                              transform_params=dict(holomorphic=holomorphic))
+
+
+ hessian.__doc__ = hessian.__doc__ % _doc_of_return
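Finally, a sketch of ``hessian`` on a hypothetical scalar-valued function:

    def quadratic(x):
        return jnp.sum(x ** 2) + x[0] * x[1]

    H = brainstate.augment.hessian(quadratic)(jnp.array([1.0, 2.0]))
    # dense 2x2 matrix: [[2., 1.], [1., 2.]]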