PyPI - brainstate - Versions diffs - 0.1.0.post20250212__py2.py3-none-any.whl → 0.1.0.post20250217__py2.py3-none-any.whl - Mend

brainstate 0.1.0.post20250212-py2.py3-none-any.whl → 0.1.0.post20250217-py2.py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (97)

brainstate/_state.py +853 -90
brainstate/_state_test.py +1 -3
brainstate/augment/__init__.py +2 -2
brainstate/augment/_autograd.py +257 -115
brainstate/augment/_autograd_test.py +2 -3
brainstate/augment/_eval_shape.py +3 -4
brainstate/augment/_mapping.py +582 -62
brainstate/augment/_mapping_test.py +114 -30
brainstate/augment/_random.py +61 -7
brainstate/compile/_ad_checkpoint.py +2 -3
brainstate/compile/_conditions.py +4 -5
brainstate/compile/_conditions_test.py +1 -2
brainstate/compile/_error_if.py +1 -2
brainstate/compile/_error_if_test.py +1 -2
brainstate/compile/_jit.py +23 -16
brainstate/compile/_jit_test.py +1 -2
brainstate/compile/_loop_collect_return.py +18 -10
brainstate/compile/_loop_collect_return_test.py +1 -1
brainstate/compile/_loop_no_collection.py +5 -5
brainstate/compile/_make_jaxpr.py +23 -21
brainstate/compile/_make_jaxpr_test.py +1 -2
brainstate/compile/_progress_bar.py +1 -2
brainstate/compile/_unvmap.py +1 -0
brainstate/compile/_util.py +4 -2
brainstate/environ.py +4 -4
brainstate/environ_test.py +1 -2
brainstate/functional/_activations.py +1 -2
brainstate/functional/_activations_test.py +1 -1
brainstate/functional/_normalization.py +1 -2
brainstate/functional/_others.py +1 -2
brainstate/functional/_spikes.py +136 -20
brainstate/graph/_graph_node.py +2 -43
brainstate/graph/_graph_operation.py +4 -20
brainstate/graph/_graph_operation_test.py +3 -4
brainstate/init/_base.py +1 -2
brainstate/init/_generic.py +1 -2
brainstate/nn/__init__.py +8 -0
brainstate/nn/_collective_ops.py +351 -48
brainstate/nn/_collective_ops_test.py +36 -0
brainstate/nn/_common.py +193 -0
brainstate/nn/_dyn_impl/_dynamics_neuron.py +1 -2
brainstate/nn/_dyn_impl/_dynamics_neuron_test.py +1 -2
brainstate/nn/_dyn_impl/_dynamics_synapse.py +1 -2
brainstate/nn/_dyn_impl/_dynamics_synapse_test.py +1 -2
brainstate/nn/_dyn_impl/_inputs.py +1 -2
brainstate/nn/_dyn_impl/_rate_rnns.py +1 -2
brainstate/nn/_dyn_impl/_rate_rnns_test.py +1 -2
brainstate/nn/_dyn_impl/_readout.py +2 -3
brainstate/nn/_dyn_impl/_readout_test.py +1 -2
brainstate/nn/_dynamics/_dynamics_base.py +6 -1
brainstate/nn/_dynamics/_dynamics_base_test.py +1 -2
brainstate/nn/_dynamics/_state_delay.py +3 -3
brainstate/nn/_dynamics/_synouts_test.py +1 -2
brainstate/nn/_elementwise/_dropout.py +6 -7
brainstate/nn/_elementwise/_dropout_test.py +1 -2
brainstate/nn/_elementwise/_elementwise.py +1 -2
brainstate/nn/_exp_euler.py +1 -2
brainstate/nn/_exp_euler_test.py +1 -2
brainstate/nn/_interaction/_conv.py +1 -2
brainstate/nn/_interaction/_conv_test.py +1 -0
brainstate/nn/_interaction/_linear.py +1 -2
brainstate/nn/_interaction/_linear_test.py +1 -2
brainstate/nn/_interaction/_normalizations.py +1 -2
brainstate/nn/_interaction/_poolings.py +3 -4
brainstate/nn/_module.py +68 -19
brainstate/nn/_module_test.py +1 -2
brainstate/nn/_utils.py +89 -0
brainstate/nn/metrics.py +3 -4
brainstate/optim/_lr_scheduler.py +1 -2
brainstate/optim/_lr_scheduler_test.py +2 -3
brainstate/optim/_optax_optimizer_test.py +1 -2
brainstate/optim/_sgd_optimizer.py +2 -3
brainstate/random/_rand_funs.py +1 -2
brainstate/random/_rand_funs_test.py +2 -3
brainstate/random/_rand_seed.py +2 -3
brainstate/random/_rand_seed_test.py +1 -2
brainstate/random/_rand_state.py +3 -4
brainstate/surrogate.py +5 -5
brainstate/transform.py +0 -3
brainstate/typing.py +28 -25
brainstate/util/__init__.py +9 -7
brainstate/util/_caller.py +1 -2
brainstate/util/_error.py +27 -0
brainstate/util/_others.py +60 -15
brainstate/util/{_dict.py → _pretty_pytree.py} +2 -2
brainstate/util/{_dict_test.py → _pretty_pytree_test.py} +1 -2
brainstate/util/_pretty_repr.py +1 -2
brainstate/util/_pretty_table.py +2900 -0
brainstate/util/_struct.py +11 -11
brainstate/util/filter.py +472 -0
{brainstate-0.1.0.post20250212.dist-info → brainstate-0.1.0.post20250217.dist-info}/METADATA +2 -2
brainstate-0.1.0.post20250217.dist-info/RECORD +128 -0
brainstate/util/_filter.py +0 -178
brainstate-0.1.0.post20250212.dist-info/RECORD +0 -124
{brainstate-0.1.0.post20250212.dist-info → brainstate-0.1.0.post20250217.dist-info}/LICENSE +0 -0
{brainstate-0.1.0.post20250212.dist-info → brainstate-0.1.0.post20250217.dist-info}/WHEEL +0 -0
{brainstate-0.1.0.post20250212.dist-info → brainstate-0.1.0.post20250217.dist-info}/top_level.txt +0 -0

brainstate/augment/_mapping.py CHANGED

@@ -16,15 +16,26 @@
 from __future__ import annotations
 import functools
-from typing import Any, TypeVar, Callable, Hashable, Sequence, Iterable, Tuple, Union, Optional, Dict, List
 import jax
 from jax.interpreters.batching import BatchTracer
-from brainstate._state import State, StateTraceStack
-from brainstate.compile._loop_collect_return import scan
-from brainstate.random import DEFAULT, RandomState
-from brainstate.typing import Missing
+from typing import (
+    Any,
+    TypeVar,
+    Callable,
+    Hashable,
+    Sequence,
+    Iterable,
+    Tuple,
+    Union,
+    Optional,
+    Dict,
+    List
+)
+from brainstate._state import State, catch_new_states
+from brainstate.compile import scan, StatefulFunction
+from brainstate.random import RandomState, DEFAULT
+from brainstate.typing import Missing, Filter
 from brainstate.util import NestedDict, BrainStateError
 from ._random import restore_rngs
@@ -32,21 +43,56 @@ __all__ = [
     'vmap',
     'pmap',
     'map',
+    'vmap_new_states',
 ]
-AxisName = Hashable
 F = TypeVar("F", bound=Callable)
+AxisName = Hashable
 AxisToState = Dict[int, List[State]]
 StateToAxis = Dict[State, int]
 class BatchAxisError(BrainStateError):
+    """
+    Exception raised for errors related to batch axis operations.
+    This custom exception is used to indicate errors that occur during
+    batch processing or vectorization operations, particularly in the
+    context of state management in the BrainState framework.
+    Inherits from:
+        BrainStateError: The base error class for BrainState-related exceptions.
+    """
     pass
 def _flatten_in_out_states(
     in_states: Dict[int, Dict] | Any = None,
 ) -> Tuple[AxisToState, StateToAxis]:
+    """
+    Flattens and organizes input or output states into axis-based mappings.
+    This function processes the input or output states, converting them into two
+    dictionary representations: one mapping axes to states, and another mapping
+    states to axes. It handles both structured (Dict[int, Dict]) and unstructured
+    input formats.
+    Args:
+        in_states (Dict[int, Dict] | Any, optional): The input or output states to be
+            flattened. Can be a nested dictionary structure where the outer keys are
+            axes and inner dictionaries contain states, or any other structure
+            containing states. Defaults to None.
+    Returns:
+        Tuple[AxisToState, StateToAxis]: A tuple containing two dictionaries:
+            - AxisToState: Maps axes (int) to lists of states.
+            - StateToAxis: Maps individual states to their corresponding axes (int).
+    Note:
+        If in_states is None, empty dictionaries are returned for both mappings.
+        If in_states is not in the expected Dict[int, Dict] format, all states are
+        assigned to axis 0.
+    """
     if in_states is None:
         return dict(), dict()
     if isinstance(in_states, dict):
@@ -72,16 +118,165 @@ def _flatten_in_out_states(
         return axis_to_states, state_to_axis
-def _vmap_transform(
-    f: F,
-    *,
-    in_axes: int | None | Sequence[Any] = 0,
-    out_axes: Any = 0,
-    in_states: Dict[int, Dict] | Any | None = None,
-    out_states: Dict[int, Dict] | Any | None = None,
-    rngs: Union[RandomState, Sequence[RandomState]] = DEFAULT,
-    **transform_kwargs,
+def _remove_axis(x, axis: int):
+    """
+    Remove a specified axis from an array or nested structure.
+    This function removes a specified axis from an array or nested structure,
+    adjusting the shape and structure of the output accordingly.
+    Args:
+        x (Any): The input array or nested structure to remove the axis from.
+        axis (int): The axis to remove from the input.
+    Returns:
+        Any: The output array or nested structure with the specified axis removed.
+    """
+    assert isinstance(axis, int), f"Expected axis to be an integer, but got {type(axis)}"
+    if axis < 0:
+        axis += x.ndim
+    if axis < 0 or axis >= x.ndim:
+        raise IndexError(f"Axis {axis} is out of bounds for array of shape {x.shape}")
+    return x[tuple(slice(None, None, None) if i != axis else 0 for i in range(x.ndim))]
+def _compile_stateful_function(
+    stateful_fn: StatefulFunction,
+    in_axes: int | Tuple[int, ...],
+    args: Tuple
+):
+    """
+    Compile a stateful function with specified input axes and arguments.
+    This function prepares and compiles a stateful function for vectorized mapping (vmap)
+    by adjusting the input arguments based on the specified axes and then generating
+    the function's JAX program representation (jaxpr).
+    Args:
+        stateful_fn (StatefulFunction): The stateful function to be compiled.
+        in_axes (int | Tuple[int, ...]): Specifies which axes of the input arguments
+            to map over. Can be a single integer (same for all args) or a tuple of integers.
+        args (Tuple): The input arguments to the function.
+    Raises:
+        ValueError: If the length of in_axes tuple doesn't match the number of arguments.
+    Returns:
+        None. The function modifies the stateful_fn in-place by calling make_jaxpr.
+    """
+    in_axes_st, in_axes = in_axes
+    state_vals, args = args
+    # check in_axes
+    if isinstance(in_axes, tuple) and len(in_axes) != len(args):
+        raise ValueError(
+            "vmap in_axes must be an int, None, or a tuple of entries corresponding "
+            "to the positional arguments passed to the function, "
+            f"but got {len(in_axes)=}, {len(args)=}"
+        )
+    # check state_vals
+    if len(state_vals) > 0:
+        state_vals = [jax.tree.map(lambda x: _remove_axis(x, axis), vals)
+                      for vals, axis in zip(state_vals, in_axes_st)]
+    else:
+        state_vals = []
+    if isinstance(in_axes, int):
+        args = jax.tree.map(lambda x: _remove_axis(x, in_axes), args)
+    elif isinstance(in_axes, tuple):
+        args = tuple(
+            [arg if in_axis is None else _remove_axis(arg, in_axis)
+             for arg, in_axis in zip(args, in_axes)]
+        )
+    stateful_fn.make_jaxpr(state_vals, args)
+    return stateful_fn.get_arg_cache_key(state_vals, args)
+def _get_batch_size(
+    args: Tuple,
+    in_axes: int | Tuple[int, ...],
+    in_states: AxisToState,
+    axis_size: Optional[int] = None,
+) -> int:
+    """
+    Determine the batch size from input arguments, axes, and states.
+    This function calculates the batch size by examining the shapes of input arguments
+    and states along specified axes. It ensures consistency across all inputs.
+    Args:
+        args (Tuple): The input arguments to the function being vectorized.
+        in_axes (int | Tuple[int, ...]): The axes along which to vectorize for each argument.
+            Can be a single integer (same for all args) or a tuple of integers.
+        in_states (AxisToState): A dictionary mapping axes to lists of states.
+    Returns:
+        int: The determined batch size.
+    Raises:
+        ValueError: If unable to determine batch size or if inconsistent batch sizes are found.
+    """
+    batch_sizes = []
+    # Check batch size from args and in_axes
+    if isinstance(in_axes, int):
+        in_axes = (in_axes,) * len(args)
+    for arg, in_axis in zip(args, in_axes):
+        if in_axis is not None:
+            arg_leaves = jax.tree.leaves(arg)
+            if arg_leaves:
+                batch_sizes.append(arg_leaves[0].shape[in_axis])
+    # Check batch size from in_states
+    if in_states is not None:
+        for axis, states in in_states.items():
+            for state in states:
+                state_leaves = jax.tree.leaves(state.value)
+                if len(state_leaves):
+                    batch_sizes.append(state_leaves[0].shape[axis])
+    if len(batch_sizes) == 0:
+        assert axis_size is not None, (
+            "Unable to determine batch size. Please provide the 'axis_size' argument."
+        )
+        return axis_size
+    else:
+        # Ensure all batch sizes are consistent
+        if len(set(batch_sizes)) > 1:
+            raise ValueError(f"Inconsistent batch sizes found: {set(batch_sizes)}")
+        return batch_sizes[0]
+def _format_state_axes(
+    in_states,
+    out_states,
 ):
+    """
+    Format and validate the axes of input and output states.
+    This function processes the input and output states, ensuring consistency
+    between their axis mappings. It also handles cases where a state appears
+    in the input but not in the output.
+    Args:
+        in_states: The input states to be formatted. Can be a dictionary mapping
+                   axes to states, or any other structure containing states.
+        out_states: The output states to be formatted. Can be a dictionary mapping
+                    axes to states, or any other structure containing states.
+    Returns:
+        A tuple containing four elements:
+        - axis_to_in_states (dict): Mapping of axes to input states.
+        - in_state_to_axis (dict): Mapping of input states to their axes.
+        - axis_to_out_states (dict): Mapping of axes to output states.
+        - out_state_to_axis (dict): Mapping of output states to their axes.
+    Raises:
+        BatchAxisError: If there's an inconsistency between the axis mappings
+                        of input and output states.
+    """
     axis_to_in_states, in_state_to_axis = _flatten_in_out_states(in_states)
     axis_to_out_states, out_state_to_axis = _flatten_in_out_states(out_states)
     for _in_state, _axis in in_state_to_axis.items():
@@ -90,8 +285,8 @@ def _vmap_transform(
             if _out_axis != _axis:
                 _in_state.raise_error_with_source_info(
                     BatchAxisError(
-                        f"State {_in_state} has been mapped to axis {_axis} in in_states, "
-                        f"However, it is mapped to axis {_out_axis} in out_states."
+                        f"State {_in_state} has been mapped to axis {_axis} in 'in_states', "
+                        f"However, it is mapped to axis {_out_axis} in 'out_states'."
                     )
                 )
         else:
@@ -99,65 +294,286 @@ def _vmap_transform(
             if _axis not in axis_to_out_states:
                 axis_to_out_states[_axis] = []
             axis_to_out_states[_axis].append(_in_state)
-    if isinstance(rngs, RandomState):
-        rngs = (rngs,)
-    rng_ids = set([id(rng) for rng in rngs])
-    @functools.wraps(f)
-    def new_fn(in_states_, args):
+    return axis_to_in_states, in_state_to_axis, axis_to_out_states, out_state_to_axis
+def _vmap_transform(
+    f: F,
+    *,
+    in_axes: int | None | Sequence[Any] = 0,
+    out_axes: Any = 0,
+    in_states: Dict[int, Dict] | Any | None = None,
+    out_states: Dict[int, Dict] | Any | None = None,
+    axis_size: Optional[int] = None,
+    axis_name: AxisName | None = None,
+    spmd_axis_name: AxisName | tuple[AxisName, ...] | None = None,
+):
+    """
+    Transforms a function for vectorized mapping (vmap) with state management.
+    This internal function applies vectorized mapping to the input function while
+    handling state management for input and output states. It supports custom
+    axis specifications for both inputs and outputs.
+    Args:
+        f (F): The function to be transformed for vectorized mapping.
+        in_axes (int | None | Sequence[Any]): Specifies which axes of the input
+            arguments to map over. Default is 0.
+        out_axes (Any): Specifies where the mapped axis should appear in the output.
+            Default is 0.
+        in_states (Dict[int, Dict] | Any | None): Specifies the input states and
+            their corresponding axes for mapping. Default is None.
+        out_states (Dict[int, Dict] | Any | None): Specifies the output states and
+            their corresponding axes for mapping. Default is None.
+        **transform_kwargs: Additional keyword arguments for the transformation.
+    Returns:
+        Callable: A new function that applies vectorized mapping to the input
+        function while managing states.
+    """
+    # TODO: support jax.disable_jit()
+    # format state axes
+    (
+        axis_to_in_states,
+        in_state_to_axis,
+        axis_to_out_states,
+        out_state_to_axis
+    ) = _format_state_axes(in_states, out_states)
+    # check in_axes
+    if isinstance(in_axes, list):
+        # To be a tree prefix of the positional args tuple, in_axes can never be a
+        # list: if in_axes is not a leaf, it must be a tuple of trees. However,
+        # in cases like these users expect tuples and lists to be treated
+        # essentially interchangeably, so we canonicalize lists to tuples here
+        # rather than raising an error. https://github.com/jax-ml/jax/issues/2367
+        in_axes = tuple(in_axes)
+    def _vmap_fn_for_compilation(in_vmap_state_vals, args):
+        """
+        Compile a function for vectorized mapping (vmap) with state restoration.
+        This internal function is used to prepare a function for vectorized mapping
+        by restoring state values before calling the original function.
+        Args:
+            in_vmap_state_vals (List[List]): A nested list containing the state values
+                to be restored. The outer list corresponds to different axes, while
+                the inner lists contain the state values for each axis.
+            args (Tuple): The arguments to be passed to the original function after
+                state restoration.
+        Returns:
+            Any: The result of calling the original function 'f' with the restored
+            state and provided arguments.
+        """
         # restore state values
         for i, states in enumerate(axis_to_in_states.values()):
-            for state, state_val in zip(states, in_states_[i]):
+            for state, state_val in zip(states, in_vmap_state_vals[i]):
                 state.restore_value(state_val)
         # call the function
-        with StateTraceStack() as stack:
-            outs = f(*args)
+        return f(*args)
+    # stateful function
+    stateful_fn = StatefulFunction(_vmap_fn_for_compilation, name='vmap')
-        # analyze
-        for state in stack.get_write_states():
+    @functools.wraps(f)
+    def new_fn_for_vmap(
+        rng_keys,
+        in_state_vmap_vals,
+        in_state_oth_vals,
+        args,
+    ):
+        """
+        Wrapper function for vectorized mapping (vmap) that handles state restoration and function execution.
+        This function restores state values, random number generators (RNGs), and other state values
+        before calling the original function. It then processes the outputs and prepares them for
+        vectorized mapping.
+        Args:
+            rng_keys (Sequence): Random number generator keys for each mapped instance.
+            in_state_vmap_vals (Sequence[Sequence]): Input state values for vectorized mapping,
+                organized by axis.
+            in_state_oth_vals (Sequence): Other input state values not involved in vectorized mapping.
+            args (Tuple): Arguments to be passed to the original function.
+        Returns:
+            Tuple: A tuple containing four elements:
+                - out_rng_keys (List): Updated RNG keys after function execution.
+                - out_state_vmap_vals (List[List]): Output state values for vectorized mapping,
+                  organized by axis.
+                - out_state_oth_vals (List): Other output state values not involved in vectorized mapping.
+                - outs: The output of the original function call.
+        Raises:
+            AssertionError: If there's a mismatch in the number of states, state values, or RNG keys.
+            BatchAxisError: If a state value is batched but not included in out_states.
+        """
+        # restore vmapping state values
+        for i, states in enumerate(axis_to_in_states.values()):
+            assert len(states) == len(in_state_vmap_vals[i]), (
+                f"The number of states in axis {i} should be equal to the number "
+                f"of state values, but got {len(states)} and {len(in_state_vmap_vals[i])}."
+            )
+            for state, state_val in zip(states, in_state_vmap_vals[i]):
+                state.restore_value(state_val)
+        # restore rngs
+        cache_key = stateful_fn.get_arg_cache_key(in_state_vmap_vals, args)
+        state_trace = stateful_fn.get_state_trace(cache_key)
+        rngs = state_trace.state_subset(RandomState)
+        rng_sets = set(rngs)
+        assert len(rngs) == len(rng_keys), (
+            f"The number of random states in the function should be equal to the number "
+            f"of random keys, but got {len(rngs)} and {len(rng_keys)}."
+        )
+        for rng, key in zip(rngs, rng_keys):
+            rng.restore_value(key)
+        # restore other state values
+        oth_in_state = [
+            st for st in state_trace.states
+            if st not in in_state_to_axis and st not in rng_sets
+        ]
+        assert len(oth_in_state) == len(in_state_oth_vals), (
+            f"The number of states in 'in_states' should be equal to the number "
+            f"of state values, but got {len(oth_in_state)} and {len(in_state_oth_vals)}."
+        )
+        for state, state_val in zip(oth_in_state, in_state_oth_vals):
+            state.restore_value(state_val)
+        # call the function
+        outs = stateful_fn.jaxpr_call_auto(in_state_vmap_vals, args)
+        # analyze vmapping axis error
+        for state in state_trace.get_write_states():
             leaves = jax.tree.leaves(state.value)
-            if isinstance(leaves[0], BatchTracer) and state not in out_state_to_axis:
-                if isinstance(state, RandomState) and id(state) in rng_ids:
+            if any([isinstance(leaf, BatchTracer) for leaf in leaves]) and state not in out_state_to_axis:
+                if isinstance(state, RandomState) and state in rng_sets:
                     continue
                 state.raise_error_with_source_info(
-                    BatchAxisError(
-                        f"The value of State {state} is batched, but it is not in the out_states."
-                    )
+                    BatchAxisError(f"The value of State {state} is batched, "
+                                   f"but it is not in the out_states.")
                 )
-        out_states_ = [
+        # out state values for vmapping
+        out_state_vmap_vals = [
             [state.value for state in states]
             for axis, states in axis_to_out_states.items()
         ]
-        return out_states_, outs
+        out_state_oth_vals = [
+            st.value for st in state_trace.states
+            if st not in out_state_to_axis and st not in rng_sets
+        ]
+        out_rng_keys = [rng.value for rng in rngs]
+        return out_rng_keys, out_state_vmap_vals, out_state_oth_vals, outs
+    @functools.wraps(f)
     def vmapped_fn(*args):
-        # vmapping
-        in_state_vals = [
+        """
+        Applies vectorized mapping (vmap) to the input function while managing state.
+        This function handles the vectorization process, including state management,
+        random number generation, and function compilation. It prepares the input
+        states, compiles the stateful function, manages random number generators,
+        applies the vmap transformation, and restores the output states.
+        Args:
+            *args: Variable length argument list containing the input arguments
+                   to be passed to the vectorized function.
+        Returns:
+            Any: The output of the vectorized function after applying vmap and
+                 managing states.
+        Note:
+            This function assumes the existence of several helper functions and
+            data structures (e.g., axis_to_in_states, in_state_to_axis) which
+            should be defined in the broader context.
+        """
+        # in states values
+        in_state_map_vals = [
             [st.value for st in states]
             for axis, states in axis_to_in_states.items()
         ]
-        in_axes_st = list(axis_to_in_states.keys())
-        out_axes_st = list(axis_to_out_states.keys())
-        if len(in_axes_st) == 0:
-            in_axes_st = 0
-        if len(out_axes_st) == 0:
-            out_axes_st = 0
-        out_state_vals, outs = restore_rngs(
-            jax.vmap(
-                new_fn,
-                in_axes=(in_axes_st, in_axes),
-                out_axes=(out_axes_st, out_axes),
-                **transform_kwargs
-            ),
-            rngs=rngs
-        )(in_state_vals, args)
+        st_in_axes = list(axis_to_in_states.keys())
+        if len(st_in_axes) == 0:
+            st_in_axes = 0
+        # compile stateful function
+        cache_key = _compile_stateful_function(
+            stateful_fn,
+            (st_in_axes, in_axes),
+            (in_state_map_vals, args)
+        )
+        # random keys
+        state_trace = stateful_fn.get_state_trace(cache_key)
+        rngs = state_trace.state_subset(RandomState)
+        rng_sets = set(rngs)
+        if len(rngs):
+            # batch size
+            batch_size = _get_batch_size(args, in_axes, axis_to_in_states, axis_size)
+            rng_keys = tuple(rng.split_key(batch_size) for rng in rngs)
+            rng_backup = tuple(rng.split_key() for rng in rngs)
+        else:
+            rng_keys = tuple()
+            rng_backup = tuple()
+        # in states other values
+        in_state_oth_vals = [
+            st.value
+            for st in state_trace.states
+            if st not in in_state_to_axis and st not in rng_sets
+        ]
+        # out state axis
+        st_out_axes = list(axis_to_out_states.keys())
+        if len(st_out_axes) == 0:
+            st_out_axes = 0
+        # --- vmapping --- #
+        fn = jax.vmap(
+            new_fn_for_vmap,
+            in_axes=(0, st_in_axes, None, in_axes),
+            out_axes=(0, st_out_axes, None, out_axes),
+            axis_size=axis_size,
+            axis_name=axis_name,
+            spmd_axis_name=spmd_axis_name,
+        )
+        _, out_state_map_vals, out_state_oth_vals, outs = fn(
+            rng_keys, in_state_map_vals, in_state_oth_vals, args
+        )
         # restore mapped state values
         for i, states in enumerate(axis_to_out_states.values()):
-            for state, st_val in zip(states, out_state_vals[i]):
+            assert len(states) == len(out_state_map_vals[i]), (
+                f"The number of states in axis {i} should be equal to the number "
+                f"of state values, but got {len(states)} and {len(out_state_map_vals[i])}."
+            )
+            for state, st_val in zip(states, out_state_map_vals[i]):
                 state.restore_value(st_val)
+        # restore other state values
+        out_oth_states = [
+            st for st in state_trace.states
+            if st not in out_state_to_axis and st not in rng_sets
+        ]
+        assert len(out_oth_states) == len(out_state_oth_vals), (
+            f"The number of states in 'out_states' should be equal to the number "
+            f"of state values, but got {len(out_oth_states)} and {len(out_state_oth_vals)}."
+        )
+        for state, st_val in zip(out_oth_states, out_state_oth_vals):
+            state.restore_value(st_val)
+        # restore random keys
+        for rng, key in zip(rngs, rng_backup):
+            rng.restore_value(key)
         return outs
     return vmapped_fn
@@ -166,15 +582,15 @@ def _vmap_transform(
 def vmap(
     fn: F | Missing = Missing(),
     *,
+    # --- normal jax.vmap arguments --- #
     in_axes: int | None | Sequence[Any] = 0,
     out_axes: Any = 0,
     axis_name: AxisName | None = None,
     axis_size: int | None = None,
     spmd_axis_name: AxisName | tuple[AxisName, ...] | None = None,
-    # brainstate specific arguments
+    # --- brainstate specific arguments --- #
     in_states: Dict[int, Dict] | Any | None = None,
     out_states: Dict[int, Dict] | Any | None = None,
-    rngs: Union[RandomState, Sequence[RandomState]] = DEFAULT,
 ) -> F | Callable[[F], F]:
     """
     Vectorizing map. Creates a function which maps ``fun`` over argument axes.
@@ -229,10 +645,6 @@ def vmap(
             corresponds to the outermost :func:`vmap` call, the second element to
             the next outermost, and so on. If the tuple is not provided, the
             ``axis_name`` is used for all nested :func:`vmap` calls.
-        rngs: Optional, a random number generator or sequence of random number
-            generators to be used in the mapped function. These random number
-            generators are restored their random key after the mapped function is
-            executed.
         in_states: Optional, the :class:`State` objects to be mapped over in the inputs.
         out_states: Optional, the :class:`State` objects to be mapped over in the outputs.
@@ -254,7 +666,6 @@ def vmap(
             axis_name=axis_name,
             axis_size=axis_size,
             spmd_axis_name=spmd_axis_name,
-            rngs=rngs,
         )  # type: ignore[return-value]
     return _vmap_transform(
@@ -266,7 +677,6 @@ def vmap(
         axis_name=axis_name,
         axis_size=axis_size,
         spmd_axis_name=spmd_axis_name,
-        rngs=rngs
     )
@@ -511,3 +921,113 @@ def map(
 def flatten_(x):
     return x.reshape(-1, *x.shape[2:])
+def _vmap_new_states_transform(
+    fun: Callable[..., Any],
+    *,
+    # -- normal jax.vmap arguments -- #
+    in_axes: int | None | Sequence[Any] = 0,
+    out_axes: Any = 0,
+    axis_name: AxisName | None = None,
+    axis_size: int | None = None,
+    spmd_axis_name: AxisName | tuple[AxisName, ...] | None = None,
+    # -- brainstate specific arguments -- #
+    state_tag: str | None = None,
+    state_to_exclude: Filter | None = None,
+):
+    # TODO: How about nested call ``vmap_new_states``?
+    @vmap(
+        in_axes=in_axes,
+        out_axes=out_axes,
+        axis_name=axis_name,
+        axis_size=axis_size,
+        spmd_axis_name=spmd_axis_name,
+    )
+    def new_fun(args):
+        # call the function
+        with catch_new_states(state_tag=state_tag, state_to_exclude=state_to_exclude) as catcher:
+            out = fun(*args)
+        # get vmap state values
+        vmap_state_vals = catcher.get_state_values()
+        return out, vmap_state_vals
+    @functools.wraps(fun)
+    def vmapped_fn(*args):
+        # vmapping
+        with catch_new_states(state_to_exclude=state_to_exclude) as catcher:
+            outs, vmap_state_vals = new_fun(args)
+            vmap_states = catcher.get_states()
+        # restore vmapped state values
+        for st_val, st in zip(vmap_state_vals, vmap_states):
+            st.restore_value(st_val)
+            # ------------------------------------------------
+            # --- this is CRUCIAL to avoid jax tracing leakage
+            # ------------------------------------------------
+            st.decrease_stack_level()
+        return outs
+    return vmapped_fn
+def vmap_new_states(
+    fun: Callable = Missing(),
+    *,
+    # -- normal jax.vmap arguments -- #
+    in_axes: int | None | Sequence[Any] = 0,
+    out_axes: Any = 0,
+    axis_name: AxisName | None = None,
+    axis_size: int | None = None,
+    spmd_axis_name: AxisName | tuple[AxisName, ...] | None = None,
+    # -- brainstate specific arguments -- #
+    state_tag: str | None = None,
+    state_to_exclude: Filter = None,
+):
+    """
+    Vectorize a function over new states created within it.
+    This function applies JAX's vmap transformation to newly created states
+    during the function's execution. It allows for more
+    flexible vectorization in the context of stateful computations.
+    Args:
+        fun (Callable, optional): The function to be vectorized. Defaults to Missing().
+        in_axes (int | None | Sequence[Any], optional): Specification of input axes for vectorization. Defaults to 0.
+        out_axes (Any, optional): Specification of output axes after vectorization. Defaults to 0.
+        axis_name (AxisName, optional): Name of the axis being vectorized over. Defaults to None.
+        axis_size (int, optional): Size of the axis being vectorized over. Defaults to None.
+        spmd_axis_name (AxisName | tuple[AxisName, ...], optional): Name(s) of SPMD axis/axes. Defaults to None.
+        state_tag (str, optional): A tag to identify specific states. Defaults to None.
+        state_to_exclude (Sequence[int], optional): Indices of states to exclude from vectorization. Defaults to ().
+    Returns:
+        Callable: A vectorized version of the input function that handles new state creation.
+    """
+    if isinstance(fun, Missing):
+        return functools.partial(
+            _vmap_new_states_transform,
+            in_axes=in_axes,
+            out_axes=out_axes,
+            axis_name=axis_name,
+            axis_size=axis_size,
+            spmd_axis_name=spmd_axis_name,
+            state_tag=state_tag,
+            state_to_exclude=state_to_exclude,
+        )
+    else:
+        return _vmap_new_states_transform(
+            fun,
+            in_axes=in_axes,
+            out_axes=out_axes,
+            axis_name=axis_name,
+            axis_size=axis_size,
+            spmd_axis_name=spmd_axis_name,
+            state_tag=state_tag,
+            state_to_exclude=state_to_exclude,
+        )

brainstate 0.1.0.post20250212__py2.py3-none-any.whl → 0.1.0.post20250217__py2.py3-none-any.whl

brainstate 0.1.0.post20250212-py2.py3-none-any.whl → 0.1.0.post20250217-py2.py3-none-any.whl