brainstate 0.1.9__py2.py3-none-any.whl → 0.2.0__py2.py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (163) hide show
  1. brainstate/__init__.py +130 -19
  2. brainstate/_compatible_import.py +201 -9
  3. brainstate/_compatible_import_test.py +681 -0
  4. brainstate/_deprecation.py +210 -0
  5. brainstate/_deprecation_test.py +2319 -0
  6. brainstate/{util/error.py → _error.py} +10 -20
  7. brainstate/_state.py +94 -47
  8. brainstate/_state_test.py +1 -1
  9. brainstate/_utils.py +1 -1
  10. brainstate/environ.py +1279 -347
  11. brainstate/environ_test.py +1187 -26
  12. brainstate/graph/__init__.py +6 -13
  13. brainstate/graph/_node.py +240 -0
  14. brainstate/graph/_node_test.py +589 -0
  15. brainstate/graph/{_graph_operation.py → _operation.py} +632 -746
  16. brainstate/graph/_operation_test.py +1147 -0
  17. brainstate/mixin.py +1209 -141
  18. brainstate/mixin_test.py +991 -51
  19. brainstate/nn/__init__.py +74 -72
  20. brainstate/nn/_activations.py +587 -295
  21. brainstate/nn/_activations_test.py +109 -86
  22. brainstate/nn/_collective_ops.py +393 -274
  23. brainstate/nn/_collective_ops_test.py +746 -15
  24. brainstate/nn/_common.py +114 -66
  25. brainstate/nn/_common_test.py +154 -0
  26. brainstate/nn/_conv.py +1652 -143
  27. brainstate/nn/_conv_test.py +838 -227
  28. brainstate/nn/_delay.py +95 -29
  29. brainstate/nn/_delay_test.py +25 -20
  30. brainstate/nn/_dropout.py +359 -167
  31. brainstate/nn/_dropout_test.py +429 -52
  32. brainstate/nn/_dynamics.py +14 -90
  33. brainstate/nn/_dynamics_test.py +1 -12
  34. brainstate/nn/_elementwise.py +492 -313
  35. brainstate/nn/_elementwise_test.py +806 -145
  36. brainstate/nn/_embedding.py +369 -19
  37. brainstate/nn/_embedding_test.py +156 -0
  38. brainstate/nn/{_fixedprob.py → _event_fixedprob.py} +10 -16
  39. brainstate/nn/{_fixedprob_test.py → _event_fixedprob_test.py} +6 -5
  40. brainstate/nn/{_linear_mv.py → _event_linear.py} +2 -2
  41. brainstate/nn/{_linear_mv_test.py → _event_linear_test.py} +6 -5
  42. brainstate/nn/_exp_euler.py +200 -38
  43. brainstate/nn/_exp_euler_test.py +350 -8
  44. brainstate/nn/_linear.py +391 -71
  45. brainstate/nn/_linear_test.py +427 -59
  46. brainstate/nn/_metrics.py +1070 -0
  47. brainstate/nn/_metrics_test.py +611 -0
  48. brainstate/nn/_module.py +10 -3
  49. brainstate/nn/_module_test.py +1 -1
  50. brainstate/nn/_normalizations.py +688 -329
  51. brainstate/nn/_normalizations_test.py +663 -37
  52. brainstate/nn/_paddings.py +1020 -0
  53. brainstate/nn/_paddings_test.py +723 -0
  54. brainstate/nn/_poolings.py +1404 -342
  55. brainstate/nn/_poolings_test.py +828 -92
  56. brainstate/nn/{_rate_rnns.py → _rnns.py} +446 -54
  57. brainstate/nn/_rnns_test.py +593 -0
  58. brainstate/nn/_utils.py +132 -5
  59. brainstate/nn/_utils_test.py +402 -0
  60. brainstate/{init/_random_inits.py → nn/init.py} +301 -45
  61. brainstate/{init/_random_inits_test.py → nn/init_test.py} +51 -20
  62. brainstate/random/__init__.py +247 -1
  63. brainstate/random/_rand_funs.py +668 -346
  64. brainstate/random/_rand_funs_test.py +74 -1
  65. brainstate/random/_rand_seed.py +541 -76
  66. brainstate/random/_rand_seed_test.py +1 -1
  67. brainstate/random/_rand_state.py +601 -393
  68. brainstate/random/_rand_state_test.py +551 -0
  69. brainstate/transform/__init__.py +59 -0
  70. brainstate/transform/_ad_checkpoint.py +176 -0
  71. brainstate/{compile → transform}/_ad_checkpoint_test.py +1 -1
  72. brainstate/{augment → transform}/_autograd.py +360 -113
  73. brainstate/{augment → transform}/_autograd_test.py +2 -2
  74. brainstate/transform/_conditions.py +316 -0
  75. brainstate/{compile → transform}/_conditions_test.py +11 -11
  76. brainstate/{compile → transform}/_error_if.py +22 -20
  77. brainstate/{compile → transform}/_error_if_test.py +1 -1
  78. brainstate/transform/_eval_shape.py +145 -0
  79. brainstate/{augment → transform}/_eval_shape_test.py +1 -1
  80. brainstate/{compile → transform}/_jit.py +99 -46
  81. brainstate/{compile → transform}/_jit_test.py +3 -3
  82. brainstate/{compile → transform}/_loop_collect_return.py +219 -80
  83. brainstate/{compile → transform}/_loop_collect_return_test.py +1 -1
  84. brainstate/{compile → transform}/_loop_no_collection.py +133 -34
  85. brainstate/{compile → transform}/_loop_no_collection_test.py +2 -2
  86. brainstate/transform/_make_jaxpr.py +2016 -0
  87. brainstate/transform/_make_jaxpr_test.py +1510 -0
  88. brainstate/transform/_mapping.py +529 -0
  89. brainstate/transform/_mapping_test.py +194 -0
  90. brainstate/{compile → transform}/_progress_bar.py +78 -25
  91. brainstate/{augment → transform}/_random.py +65 -45
  92. brainstate/{compile → transform}/_unvmap.py +102 -5
  93. brainstate/transform/_util.py +286 -0
  94. brainstate/typing.py +594 -61
  95. brainstate/typing_test.py +780 -0
  96. brainstate/util/__init__.py +9 -32
  97. brainstate/util/_others.py +1025 -0
  98. brainstate/util/_others_test.py +962 -0
  99. brainstate/util/_pretty_pytree.py +1301 -0
  100. brainstate/util/_pretty_pytree_test.py +675 -0
  101. brainstate/util/{pretty_repr.py → _pretty_repr.py} +161 -27
  102. brainstate/util/_pretty_repr_test.py +696 -0
  103. brainstate/util/filter.py +557 -81
  104. brainstate/util/filter_test.py +912 -0
  105. brainstate/util/struct.py +769 -382
  106. brainstate/util/struct_test.py +602 -0
  107. {brainstate-0.1.9.dist-info → brainstate-0.2.0.dist-info}/METADATA +34 -17
  108. brainstate-0.2.0.dist-info/RECORD +111 -0
  109. brainstate/augment/__init__.py +0 -30
  110. brainstate/augment/_eval_shape.py +0 -99
  111. brainstate/augment/_mapping.py +0 -1060
  112. brainstate/augment/_mapping_test.py +0 -597
  113. brainstate/compile/__init__.py +0 -38
  114. brainstate/compile/_ad_checkpoint.py +0 -204
  115. brainstate/compile/_conditions.py +0 -256
  116. brainstate/compile/_make_jaxpr.py +0 -888
  117. brainstate/compile/_make_jaxpr_test.py +0 -156
  118. brainstate/compile/_util.py +0 -147
  119. brainstate/functional/__init__.py +0 -27
  120. brainstate/graph/_graph_node.py +0 -244
  121. brainstate/graph/_graph_node_test.py +0 -73
  122. brainstate/graph/_graph_operation_test.py +0 -563
  123. brainstate/init/__init__.py +0 -26
  124. brainstate/init/_base.py +0 -52
  125. brainstate/init/_generic.py +0 -244
  126. brainstate/init/_regular_inits.py +0 -105
  127. brainstate/init/_regular_inits_test.py +0 -50
  128. brainstate/nn/_inputs.py +0 -608
  129. brainstate/nn/_ltp.py +0 -28
  130. brainstate/nn/_neuron.py +0 -705
  131. brainstate/nn/_neuron_test.py +0 -161
  132. brainstate/nn/_others.py +0 -46
  133. brainstate/nn/_projection.py +0 -486
  134. brainstate/nn/_rate_rnns_test.py +0 -63
  135. brainstate/nn/_readout.py +0 -209
  136. brainstate/nn/_readout_test.py +0 -53
  137. brainstate/nn/_stp.py +0 -236
  138. brainstate/nn/_synapse.py +0 -505
  139. brainstate/nn/_synapse_test.py +0 -131
  140. brainstate/nn/_synaptic_projection.py +0 -423
  141. brainstate/nn/_synouts.py +0 -162
  142. brainstate/nn/_synouts_test.py +0 -57
  143. brainstate/nn/metrics.py +0 -388
  144. brainstate/optim/__init__.py +0 -38
  145. brainstate/optim/_base.py +0 -64
  146. brainstate/optim/_lr_scheduler.py +0 -448
  147. brainstate/optim/_lr_scheduler_test.py +0 -50
  148. brainstate/optim/_optax_optimizer.py +0 -152
  149. brainstate/optim/_optax_optimizer_test.py +0 -53
  150. brainstate/optim/_sgd_optimizer.py +0 -1104
  151. brainstate/random/_random_for_unit.py +0 -52
  152. brainstate/surrogate.py +0 -1957
  153. brainstate/transform.py +0 -23
  154. brainstate/util/caller.py +0 -98
  155. brainstate/util/others.py +0 -540
  156. brainstate/util/pretty_pytree.py +0 -945
  157. brainstate/util/pretty_pytree_test.py +0 -159
  158. brainstate/util/pretty_table.py +0 -2954
  159. brainstate/util/scaling.py +0 -258
  160. brainstate-0.1.9.dist-info/RECORD +0 -130
  161. {brainstate-0.1.9.dist-info → brainstate-0.2.0.dist-info}/WHEEL +0 -0
  162. {brainstate-0.1.9.dist-info → brainstate-0.2.0.dist-info}/licenses/LICENSE +0 -0
  163. {brainstate-0.1.9.dist-info → brainstate-0.2.0.dist-info}/top_level.txt +0 -0
@@ -20,7 +20,7 @@ from __future__ import annotations
20
20
  import dataclasses
21
21
  from typing import (
22
22
  Any, Callable, Generic, Iterable, Iterator, Mapping, MutableMapping,
23
- Sequence, Type, TypeVar, Union, Hashable, Tuple, Dict, Optional, overload
23
+ Sequence, Type, TypeVar, Union, Hashable, Tuple, Dict, Optional
24
24
  )
25
25
 
26
26
  import jax
@@ -30,25 +30,40 @@ from typing_extensions import TypeGuard, Unpack
30
30
  from brainstate._state import State, TreefyState
31
31
  from brainstate._utils import set_module_as
32
32
  from brainstate.typing import PathParts, Filter, Predicate, Key
33
- from brainstate.util.caller import ApplyCaller, CallableProxy, DelayedAccessor
34
- from brainstate.util.pretty_pytree import NestedDict, FlattedDict, PrettyDict
35
- from brainstate.util.pretty_repr import PrettyRepr, PrettyType, PrettyAttr, PrettyMapping, MappingReprMixin
36
- from brainstate.util.struct import FrozenDict
33
+ from brainstate.util._pretty_pytree import NestedDict, FlattedDict, PrettyDict
34
+ from brainstate.util._pretty_repr import PrettyRepr, PrettyType, PrettyAttr, PrettyMapping, MappingReprMixin
37
35
  from brainstate.util.filter import to_predicate
38
-
39
- _max_int = np.iinfo(np.int32).max
36
+ from brainstate.util.struct import FrozenDict
40
37
 
41
38
  __all__ = [
39
+ 'register_graph_node_type',
40
+
42
41
  # state management in the given graph or node
43
- 'pop_states', 'nodes', 'states', 'treefy_states', 'update_states',
42
+ 'pop_states',
43
+ 'nodes',
44
+ 'states',
45
+ 'treefy_states',
46
+ 'update_states',
44
47
 
45
48
  # graph node operations
46
- 'flatten', 'unflatten', 'treefy_split', 'treefy_merge', 'iter_leaf', 'iter_node', 'clone', 'graphdef', 'call',
49
+ 'flatten',
50
+ 'unflatten',
51
+ 'treefy_split',
52
+ 'treefy_merge',
53
+ 'iter_leaf',
54
+ 'iter_node',
55
+ 'clone',
56
+ 'graphdef',
47
57
 
48
58
  # others
49
- 'RefMap', 'GraphDef', 'NodeRef', 'NodeDef'
59
+ 'RefMap',
60
+ 'GraphDef',
61
+ 'NodeDef',
62
+ 'NodeRef',
50
63
  ]
51
64
 
65
+ MAX_INT = np.iinfo(np.int32).max
66
+
52
67
  A = TypeVar('A')
53
68
  B = TypeVar('B')
54
69
  C = TypeVar('C')
@@ -65,12 +80,11 @@ AuxData = TypeVar('AuxData')
65
80
 
66
81
  StateLeaf = TreefyState[Any]
67
82
  NodeLeaf = State[Any]
68
- GraphStateMapping = NestedDict[Key, StateLeaf]
83
+ GraphStateMapping = NestedDict
69
84
 
70
85
 
71
86
  # --------------------------------------------------------
72
87
 
73
-
74
88
  def _is_state_leaf(x: Any) -> TypeGuard[StateLeaf]:
75
89
  return isinstance(x, TreefyState)
76
90
 
@@ -86,13 +100,30 @@ class RefMap(MutableMapping[A, B], MappingReprMixin[A, B]):
86
100
  This mapping is useful when we want to keep track of objects
87
101
  that are being referenced by other objects.
88
102
 
89
- Args:
90
- mapping: A mapping or iterable of key-value pairs.
103
+ Parameters
104
+ ----------
105
+ mapping : Mapping[A, B] or Iterable[Tuple[A, B]], optional
106
+ A mapping or iterable of key-value pairs.
107
+
108
+ Examples
109
+ --------
110
+ .. code-block:: python
111
+
112
+ >>> import brainstate
113
+ >>> obj1 = object()
114
+ >>> obj2 = object()
115
+ >>> ref_map = brainstate.graph.RefMap()
116
+ >>> ref_map[obj1] = 'value1'
117
+ >>> ref_map[obj2] = 'value2'
118
+ >>> print(obj1 in ref_map)
119
+ True
120
+ >>> print(ref_map[obj1])
121
+ value1
91
122
 
92
123
  """
93
124
  __module__ = 'brainstate.graph'
94
125
 
95
- def __init__(self, mapping: Mapping[A, B] | Iterable[Tuple[A, B]] = ()):
126
+ def __init__(self, mapping: Union[Mapping[A, B], Iterable[Tuple[A, B]]] = ()) -> None:
96
127
  self._mapping: Dict[int, Tuple[A, B]] = {}
97
128
  self.update(mapping)
98
129
 
@@ -102,10 +133,10 @@ class RefMap(MutableMapping[A, B], MappingReprMixin[A, B]):
102
133
  def __contains__(self, key: Any) -> bool:
103
134
  return id(key) in self._mapping
104
135
 
105
- def __setitem__(self, key: A, value: B):
136
+ def __setitem__(self, key: A, value: B) -> None:
106
137
  self._mapping[id(key)] = (key, value)
107
138
 
108
- def __delitem__(self, key: A):
139
+ def __delitem__(self, key: A) -> None:
109
140
  del self._mapping[id(key)]
110
141
 
111
142
  def __iter__(self) -> Iterator[A]:
@@ -135,7 +166,7 @@ class GraphNodeImpl(NodeImplBase[Node, Leaf, AuxData]):
135
166
  create_empty: Callable[[AuxData], Node]
136
167
  clear: Callable[[Node], None]
137
168
 
138
- def init(self, node: Node, items: Tuple[Tuple[Key, Leaf], ...]):
169
+ def init(self, node: Node, items: Tuple[Tuple[Key, Leaf], ...]) -> None:
139
170
  for key, value in items:
140
171
  self.set_key(node, key, value)
141
172
 
@@ -151,7 +182,7 @@ NodeImpl = Union[GraphNodeImpl[Node, Leaf, AuxData], PyTreeNodeImpl[Node, Leaf,
151
182
  # Graph Node implementation: start
152
183
  # --------------------------------------------------------
153
184
 
154
- _node_impl_for_type: dict[type, NodeImpl[Any, Any, Any]] = {}
185
+ _node_impl_for_type: dict[type, NodeImpl] = {}
155
186
 
156
187
 
157
188
  def register_graph_node_type(
@@ -165,13 +196,56 @@ def register_graph_node_type(
165
196
  """
166
197
  Register a graph node type.
167
198
 
168
- Args:
169
- type: The type of the node.
170
- flatten: A function that flattens the node into a sequence of key-value pairs.
171
- set_key: A function that sets a key in the node.
172
- pop_key: A function that pops a key from the node.
173
- create_empty: A function that creates an empty node.
174
- clear: A function that clears the node
199
+ Parameters
200
+ ----------
201
+ type : type
202
+ The type of the node.
203
+ flatten : Callable[[Node], tuple[Sequence[tuple[Key, Leaf]], AuxData]]
204
+ A function that flattens the node into a sequence of key-value pairs.
205
+ set_key : Callable[[Node, Key, Leaf], None]
206
+ A function that sets a key in the node.
207
+ pop_key : Callable[[Node, Key], Leaf]
208
+ A function that pops a key from the node.
209
+ create_empty : Callable[[AuxData], Node]
210
+ A function that creates an empty node.
211
+ clear : Callable[[Node], None]
212
+ A function that clears the node.
213
+
214
+ Examples
215
+ --------
216
+ .. code-block:: python
217
+
218
+ >>> import brainstate
219
+ >>> # Custom node type implementation
220
+ >>> class CustomNode:
221
+ ... def __init__(self):
222
+ ... self.data = {}
223
+ ...
224
+ >>> def flatten_custom(node):
225
+ ... return list(node.data.items()), None
226
+ ...
227
+ >>> def set_key_custom(node, key, value):
228
+ ... node.data[key] = value
229
+ ...
230
+ >>> def pop_key_custom(node, key):
231
+ ... return node.data.pop(key)
232
+ ...
233
+ >>> def create_empty_custom(metadata):
234
+ ... return CustomNode()
235
+ ...
236
+ >>> def clear_custom(node):
237
+ ... node.data.clear()
238
+ ...
239
+ >>> # Register the custom node type
240
+ >>> brainstate.graph.register_graph_node_type(
241
+ ... CustomNode,
242
+ ... flatten_custom,
243
+ ... set_key_custom,
244
+ ... pop_key_custom,
245
+ ... create_empty_custom,
246
+ ... clear_custom
247
+ ... )
248
+
175
249
  """
176
250
  _node_impl_for_type[type] = GraphNodeImpl(
177
251
  type=type,
@@ -200,11 +274,11 @@ def _is_graph_node(x: Any) -> bool:
200
274
  return type(x) in _node_impl_for_type
201
275
 
202
276
 
203
- def _is_node_type(x: type[Any]) -> bool:
277
+ def _is_node_type(x: Type[Any]) -> bool:
204
278
  return x in _node_impl_for_type or x is PytreeType
205
279
 
206
280
 
207
- def _get_node_impl(x: Node) -> NodeImpl[Node, Any, Any]:
281
+ def _get_node_impl(x: Any) -> NodeImpl:
208
282
  if isinstance(x, State):
209
283
  raise ValueError(f'State is not a node: {x}')
210
284
 
@@ -218,14 +292,14 @@ def _get_node_impl(x: Node) -> NodeImpl[Node, Any, Any]:
218
292
  return _node_impl_for_type[node_type]
219
293
 
220
294
 
221
- def get_node_impl_for_type(x: type[Node]) -> NodeImpl[Node, Any, Any]:
295
+ def get_node_impl_for_type(x: Type[Any]) -> NodeImpl:
222
296
  if x is PytreeType:
223
297
  return PYTREE_NODE_IMPL
224
298
  return _node_impl_for_type[x]
225
299
 
226
300
 
227
301
  class HashableMapping(Mapping[HA, HB], Hashable):
228
- def __init__(self, mapping: Mapping[HA, HB] | Iterable[tuple[HA, HB]]):
302
+ def __init__(self, mapping: Union[Mapping[HA, HB], Iterable[tuple[HA, HB]]]) -> None:
229
303
  self._mapping = dict(mapping)
230
304
 
231
305
  def __contains__(self, key: object) -> bool:
@@ -259,57 +333,53 @@ class GraphDef(Generic[Node]):
259
333
  - index: The index of the node in the graph.
260
334
 
261
335
  It has two concrete subclasses:
336
+
262
337
  - :class:`NodeRef`: A reference to a node in the graph.
263
338
  - :class:`NodeDef`: A dataclass that denotes the graph structure of a :class:`Node` or a :class:`State`.
264
339
 
265
- """
266
- type: type[Node]
267
- index: int
268
-
269
-
270
- @dataclasses.dataclass(frozen=True, repr=False)
271
- class NodeRef(GraphDef[Node], PrettyRepr):
272
- """
273
- A reference to a node in the graph.
340
+ Attributes
341
+ ----------
342
+ type : Type[Node]
343
+ The type of the node.
344
+ index : int
345
+ The index of the node in the graph.
274
346
 
275
- The node can be instances of :class:`Node` or :class:`State`.
276
347
  """
277
- type: type[Node]
348
+ type: Type[Node]
278
349
  index: int
279
350
 
280
- def __pretty_repr__(self):
281
- yield PrettyType(type=type(self))
282
- yield PrettyAttr('type', self.type.__name__)
283
- yield PrettyAttr('index', self.index)
284
-
285
- def __treescope_repr__(self, path, subtree_renderer):
286
- """
287
- Treescope repr for the object.
288
- """
289
- import treescope # type: ignore[import-not-found,import-untyped]
290
- return treescope.repr_lib.render_object_constructor(
291
- object_type=type(self),
292
- attributes={'type': self.type, 'index': self.index},
293
- path=path,
294
- subtree_renderer=subtree_renderer,
295
- )
296
-
297
-
298
- jax.tree_util.register_static(NodeRef)
299
-
300
351
 
301
352
  @dataclasses.dataclass(frozen=True, repr=False)
302
353
  class NodeDef(GraphDef[Node], PrettyRepr):
303
354
  """
304
355
  A dataclass that denotes the tree structure of a node, either :class:`Node` or :class:`State`.
305
356
 
357
+ Attributes
358
+ ----------
359
+ type : Type[Node]
360
+ Type of the node.
361
+ index : int
362
+ Index of the node in the graph.
363
+ attributes : Tuple[Key, ...]
364
+ Attributes for the node.
365
+ subgraphs : HashableMapping[Key, NodeDef[Any] | NodeRef[Any]]
366
+ Mapping of subgraph definitions.
367
+ static_fields : HashableMapping
368
+ Mapping of static fields.
369
+ leaves : HashableMapping[Key, NodeRef[Any] | None]
370
+ Mapping of leaf nodes.
371
+ metadata : Hashable
372
+ Metadata associated with the node.
373
+ index_mapping : FrozenDict[Index, Index] | None
374
+ Index mapping for node references.
375
+
306
376
  """
307
377
 
308
378
  type: Type[Node] # type of the node
309
379
  index: int # index of the node in the graph
310
380
  attributes: Tuple[Key, ...] # attributes for the node
311
381
  subgraphs: HashableMapping[Key, NodeDef[Any] | NodeRef[Any]]
312
- static_fields: HashableMapping[Key, Any]
382
+ static_fields: HashableMapping
313
383
  leaves: HashableMapping[Key, NodeRef[Any] | None]
314
384
  metadata: Hashable
315
385
  index_mapping: FrozenDict[Index, Index] | None
@@ -321,7 +391,7 @@ class NodeDef(GraphDef[Node], PrettyRepr):
321
391
  index: int,
322
392
  attributes: tuple[Key, ...],
323
393
  subgraphs: Iterable[tuple[Key, NodeDef[Any] | NodeRef[Any]]],
324
- static_fields: Iterable[tuple[Key, Any]],
394
+ static_fields: Iterable[tuple],
325
395
  leaves: Iterable[tuple[Key, NodeRef[Any] | None]],
326
396
  metadata: Hashable,
327
397
  index_mapping: Mapping[Index, Index] | None,
@@ -349,24 +419,35 @@ class NodeDef(GraphDef[Node], PrettyRepr):
349
419
  yield PrettyAttr('metadata', self.metadata)
350
420
  yield PrettyAttr('index_mapping', PrettyMapping(self.index_mapping) if self.index_mapping is not None else None)
351
421
 
352
- def apply(
353
- self,
354
- state_map: GraphStateMapping,
355
- *state_maps: GraphStateMapping
356
- ) -> ApplyCaller[tuple[GraphDef[Node], GraphStateMapping]]:
357
- accessor = DelayedAccessor()
358
422
 
359
- def _apply(accessor: DelayedAccessor, *args, **kwargs) -> tuple[
360
- Any, tuple[GraphDef[Node], GraphStateMapping]]:
361
- module = treefy_merge(self, state_map, *state_maps)
362
- fn = accessor(module)
363
- out = fn(*args, **kwargs)
364
- return out, flatten(module)
423
+ jax.tree_util.register_static(NodeDef)
424
+
425
+
426
+ @dataclasses.dataclass(frozen=True, repr=False)
427
+ class NodeRef(GraphDef[Node], PrettyRepr):
428
+ """
429
+ A reference to a node in the graph.
430
+
431
+ The node can be instances of :class:`Node` or :class:`State`.
365
432
 
366
- return CallableProxy(_apply, accessor) # type: ignore
433
+ Attributes
434
+ ----------
435
+ type : Type[Node]
436
+ The type of the node being referenced.
437
+ index : int
438
+ The index of the node in the graph.
367
439
 
440
+ """
441
+ type: Type[Node]
442
+ index: int
368
443
 
369
- jax.tree_util.register_static(NodeDef)
444
+ def __pretty_repr__(self):
445
+ yield PrettyType(type=type(self))
446
+ yield PrettyAttr('type', self.type.__name__)
447
+ yield PrettyAttr('index', self.index)
448
+
449
+
450
+ jax.tree_util.register_static(NodeRef)
370
451
 
371
452
 
372
453
  # --------------------------------------------------------
@@ -378,20 +459,30 @@ def _graph_flatten(
378
459
  path: PathParts,
379
460
  ref_index: RefMap[Any, Index],
380
461
  flatted_state_mapping: Dict[PathParts, StateLeaf],
381
- node: Node,
462
+ node: Any,
382
463
  treefy_state: bool = False,
383
- ):
464
+ ) -> Union[NodeDef[Any], NodeRef[Any]]:
384
465
  """
385
466
  Recursive helper for graph flatten.
386
467
 
387
- Args:
388
- path: The path to the node.
389
- ref_index: A mapping from nodes to indexes.
390
- flatted_state_mapping: A mapping from paths to state leaves.
391
- node: The node to flatten.
468
+ Parameters
469
+ ----------
470
+ path : PathParts
471
+ The path to the node.
472
+ ref_index : RefMap[Any, Index]
473
+ A mapping from nodes to indexes.
474
+ flatted_state_mapping : Dict[PathParts, StateLeaf]
475
+ A mapping from paths to state leaves.
476
+ node : Node
477
+ The node to flatten.
478
+ treefy_state : bool, optional
479
+ Whether to convert states to TreefyState, by default False.
480
+
481
+ Returns
482
+ -------
483
+ NodeDef or NodeRef
484
+ A NodeDef or a NodeRef.
392
485
 
393
- Returns:
394
- A NodeDef or a NodeRef.
395
486
  """
396
487
  if not _is_node(node):
397
488
  raise RuntimeError(f'Unsupported type: {type(node)}, this is a bug.')
@@ -417,9 +508,9 @@ def _graph_flatten(
417
508
  else:
418
509
  index = -1
419
510
 
420
- subgraphs: list[tuple[Key, NodeDef[Node] | NodeRef]] = []
421
- static_fields: list[tuple[Key, Any]] = []
422
- leaves: list[tuple[Key, NodeRef | None]] = []
511
+ subgraphs: list[tuple[Key, Union[NodeDef[Any], NodeRef[Any]]]] = []
512
+ static_fields: list[tuple] = []
513
+ leaves: list[tuple[Key, Union[NodeRef[Any], None]]] = []
423
514
 
424
515
  # Flatten the node into a sequence of key-value pairs.
425
516
  values, metadata = node_impl.flatten(node)
@@ -450,41 +541,56 @@ def _graph_flatten(
450
541
  # The value is a static field.
451
542
  static_fields.append((key, value))
452
543
 
453
- nodedef = NodeDef.create(type=node_impl.type,
454
- index=index,
455
- attributes=tuple(key for key, _ in values),
456
- subgraphs=subgraphs,
457
- static_fields=static_fields,
458
- leaves=leaves,
459
- metadata=metadata,
460
- index_mapping=None, )
544
+ nodedef = NodeDef.create(
545
+ type=node_impl.type,
546
+ index=index,
547
+ attributes=tuple(key for key, _ in values),
548
+ subgraphs=subgraphs,
549
+ static_fields=static_fields,
550
+ leaves=leaves,
551
+ metadata=metadata,
552
+ index_mapping=None,
553
+ )
461
554
  return nodedef
462
555
 
463
556
 
464
557
  @set_module_as('brainstate.graph')
465
558
  def flatten(
466
- node: Node,
559
+ node: Any,
467
560
  /,
468
561
  ref_index: Optional[RefMap[Any, Index]] = None,
469
562
  treefy_state: bool = True,
470
- ) -> Tuple[GraphDef, NestedDict]:
563
+ ) -> Tuple[GraphDef[Any], NestedDict]:
471
564
  """
472
565
  Flattens a graph node into a (graph_def, state_mapping) pair.
473
566
 
474
- Example::
475
-
476
- >>> import brainstate as brainstate
567
+ Parameters
568
+ ----------
569
+ node : Node
570
+ A graph node.
571
+ ref_index : RefMap[Any, Index], optional
572
+ A mapping from nodes to indexes, defaults to None. If not provided, a new
573
+ empty dictionary is created. This argument can be used to flatten a sequence of graph
574
+ nodes that share references.
575
+ treefy_state : bool, optional
576
+ If True, the state mapping will be a NestedDict instead of a flat dictionary.
577
+ Default is True.
578
+
579
+ Returns
580
+ -------
581
+ tuple[GraphDef, NestedDict]
582
+ A tuple containing the graph definition and state mapping.
583
+
584
+ Examples
585
+ --------
586
+ .. code-block:: python
587
+
588
+ >>> import brainstate
477
589
  >>> node = brainstate.graph.Node()
478
- >>> graph_def, state_mapping = flatten(node)
590
+ >>> graph_def, state_mapping = brainstate.graph.flatten(node)
479
591
  >>> print(graph_def)
480
592
  >>> print(state_mapping)
481
593
 
482
- Args:
483
- node: A graph node.
484
- ref_index: A mapping from nodes to indexes, defaults to None. If not provided, a new
485
- empty dictionary is created. This argument can be used to flatten a sequence of graph
486
- nodes that share references.
487
- treefy_state: If True, the state mapping will be a NestedDict instead of a flat dictionary.
488
594
  """
489
595
  ref_index = RefMap() if ref_index is None else ref_index
490
596
  assert isinstance(ref_index, RefMap), f"ref_index must be a RefMap. But we got: {ref_index}"
@@ -493,8 +599,13 @@ def flatten(
493
599
  return graph_def, NestedDict.from_flat(flatted_state_mapping)
494
600
 
495
601
 
496
- def _get_children(graph_def, state_mapping, index_ref, index_ref_cache):
497
- children: dict[Key, StateLeaf | Node] = {}
602
+ def _get_children(
603
+ graph_def: NodeDef[Any],
604
+ state_mapping: Mapping,
605
+ index_ref: dict[Index, Any],
606
+ index_ref_cache: Optional[dict[Index, Any]],
607
+ ) -> dict[Key, Union[StateLeaf, Any]]:
608
+ children: dict[Key, Union[StateLeaf, Any]] = {}
498
609
 
499
610
  # NOTE: we could allow adding new StateLeafs here
500
611
  # All state keys must be present in the graph definition (the object attributes)
@@ -506,8 +617,8 @@ def _get_children(graph_def, state_mapping, index_ref, index_ref_cache):
506
617
  # - (3) the key can be a subgraph, a leaf, or a static attribute
507
618
  for key in graph_def.attributes:
508
619
  if key not in state_mapping: # static field
509
- # TODO(cgarcia): maybe we shouldn't support unflattening with missing keys?
510
- # if key is not present, create an empty types
620
+ # Support unflattening with missing keys for static fields and subgraphs
621
+ # This allows partial state restoration and flexible graph reconstruction
511
622
  if key in graph_def.static_fields:
512
623
  children[key] = graph_def.static_fields[key]
513
624
 
@@ -534,8 +645,10 @@ def _get_children(graph_def, state_mapping, index_ref, index_ref_cache):
534
645
 
535
646
  else:
536
647
  # key for a variable is missing, raise an error
537
- raise ValueError(f'Expected key {key!r} in state while building node of type '
538
- f'{graph_def.type.__name__}.')
648
+ raise ValueError(
649
+ f'Expected key {key!r} in state while building node of type '
650
+ f'{graph_def.type.__name__}.'
651
+ )
539
652
 
540
653
  else:
541
654
  raise RuntimeError(f'Unknown static field: {key!r}')
@@ -551,8 +664,11 @@ def _get_children(graph_def, state_mapping, index_ref, index_ref_cache):
551
664
  if key in graph_def.subgraphs:
552
665
  # if _is_state_leaf(value):
553
666
  if isinstance(value, (TreefyState, State)):
554
- raise ValueError(f'Expected value of type {graph_def.subgraphs[key]} '
555
- f'for {key!r}, but got {value!r}')
667
+ raise ValueError(
668
+ f'Expected value of type {graph_def.subgraphs[key]} '
669
+ f'for {key!r}, but got {value!r}'
670
+ )
671
+
556
672
  if not isinstance(value, dict):
557
673
  raise TypeError(f'Expected a dict for {key!r}, but got {type(value)}.')
558
674
 
@@ -574,8 +690,8 @@ def _get_children(graph_def, state_mapping, index_ref, index_ref_cache):
574
690
  # TreefyState presumbly created by modifying the NestedDict
575
691
  if isinstance(value, TreefyState):
576
692
  value = value.to_state()
577
- # elif isinstance(value, State):
578
- # value = value
693
+ elif isinstance(value, State):
694
+ value = value
579
695
  children[key] = value
580
696
 
581
697
  elif noderef.index in index_ref:
@@ -585,7 +701,10 @@ def _get_children(graph_def, state_mapping, index_ref, index_ref_cache):
585
701
  else:
586
702
  # it is an unseen variable, create a new one
587
703
  if not isinstance(value, (TreefyState, State)):
588
- raise ValueError(f'Expected a State type for {key!r}, but got {type(value)}.')
704
+ raise ValueError(
705
+ f'Expected a State type for {key!r}, but got {type(value)}.'
706
+ )
707
+
589
708
  # when idxmap is present, check if the Varable exists there
590
709
  # and update existing variables if it does
591
710
  if index_ref_cache is not None and noderef.index in index_ref_cache:
@@ -618,11 +737,11 @@ def _get_children(graph_def, state_mapping, index_ref, index_ref_cache):
618
737
 
619
738
 
620
739
  def _graph_unflatten(
621
- graph_def: NodeDef[Node] | NodeRef[Node],
622
- state_mapping: Mapping[Key, StateLeaf | Mapping[Key, Any]],
740
+ graph_def: Union[NodeDef[Any], NodeRef[Any]],
741
+ state_mapping: Mapping[Key, Union[StateLeaf, Mapping]],
623
742
  index_ref: dict[Index, Any],
624
- index_ref_cache: dict[Index, Any] | None,
625
- ) -> Node:
743
+ index_ref_cache: Optional[dict[Index, Any]],
744
+ ) -> Any:
626
745
  """
627
746
  Recursive helper for graph unflatten.
628
747
 
@@ -697,175 +816,57 @@ def _graph_unflatten(
697
816
 
698
817
  @set_module_as('brainstate.graph')
699
818
  def unflatten(
700
- graph_def: GraphDef,
701
- state_mapping: NestedDict[Key, StateLeaf],
819
+ graph_def: GraphDef[Any],
820
+ state_mapping: NestedDict,
702
821
  /,
703
822
  *,
704
- index_ref: dict[Index, Any] | None = None,
705
- index_ref_cache: dict[Index, Any] | None = None,
706
- ) -> Node:
823
+ index_ref: Optional[dict[Index, Any]] = None,
824
+ index_ref_cache: Optional[dict[Index, Any]] = None,
825
+ ) -> Any:
707
826
  """
708
827
  Unflattens a graphdef into a node with the given state tree mapping.
709
828
 
710
- Example::
711
-
712
- >>> import brainstate as brainstate
713
- >>> class MyNode(brainstate.graph.Node):
714
- ... def __init__(self):
715
- ... self.a = brainstate.nn.Linear(2, 3)
716
- ... self.b = brainstate.nn.Linear(3, 4)
717
- ... self.c = [brainstate.nn.Linear(4, 5), brainstate.nn.Linear(5, 6)]
718
- ... self.d = {'x': brainstate.nn.Linear(6, 7), 'y': brainstate.nn.Linear(7, 8)}
719
- ...
720
- >>> graphdef, statetree = brainstate.graph.flatten(MyNode())
721
- >>> statetree
722
- NestedDict({
723
- 'a': {
724
- 'weight': TreefyState(
725
- type=ParamState,
726
- value={'weight': Array([[-0.8466386 , -2.0294454 , -0.6911647 ],
727
- [ 0.60034966, -1.1869028 , 0.84003365]], dtype=float32), 'bias': Array([0., 0., 0.], dtype=float32)}
728
- )
729
- },
730
- 'b': {
731
- 'weight': TreefyState(
732
- type=ParamState,
733
- value={'weight': Array([[ 0.8565106 , -0.10337489],
734
- [ 1.7449658 , 0.29128835],
735
- [ 0.11441387, 1.0012752 ]], dtype=float32), 'bias': Array([0., 0.], dtype=float32)}
736
- )
737
- },
738
- 'c': {
739
- 0: {
740
- 'weight': TreefyState(
741
- type=ParamState,
742
- value={'weight': Array([[ 2.4465137, -0.5711426]], dtype=float32), 'bias': Array([0., 0.], dtype=float32)}
743
- )
744
- },
745
- 1: {
746
- 'weight': TreefyState(
747
- type=ParamState,
748
- value={'weight': Array([[ 0.14321847, -2.4154725 , -0.6322363 ]], dtype=float32), 'bias': Array([0., 0., 0.], dtype=float32)}
749
- )
750
- }
751
- },
752
- 'd': {
753
- 'x': {
754
- 'weight': TreefyState(
755
- type=ParamState,
756
- value={'weight': Array([[ 0.9647322, -0.8958757, 1.585352 ]], dtype=float32), 'bias': Array([0., 0., 0.], dtype=float32)}
757
- )
758
- },
759
- 'y': {
760
- 'weight': TreefyState(
761
- type=ParamState,
762
- value={'weight': Array([[-1.2904786 , 0.5695903 , 0.40079263, 0.8769669 ]], dtype=float32), 'bias': Array([0., 0., 0., 0.], dtype=float32)}
763
- )
764
- }
765
- }
766
- })
767
- >>> node = brainstate.graph.unflatten(graphdef, statetree)
768
- >>> node
769
- MyNode(
770
- a=Linear(
771
- in_size=(2,),
772
- out_size=(3,),
773
- w_mask=None,
774
- weight=ParamState(
775
- value={'weight': Array([[ 0.55600464, -1.6276929 , 0.26805446],
776
- [ 1.175099 , 1.0077754 , 0.37592274]], dtype=float32), 'bias': Array([0., 0., 0.], dtype=float32)},
777
- )
778
- ),
779
- b=Linear(
780
- in_size=(3,),
781
- out_size=(4,),
782
- w_mask=None,
783
- weight=ParamState(
784
- value={'weight': Array([[-0.24753566, 0.18456966, -0.29438975, 0.16891003],
785
- [-0.803741 , -0.46037054, -0.21617596, 0.1260884 ],
786
- [-0.43074366, -0.24757433, 1.2237076 , -0.07842704]], dtype=float32), 'bias': Array([0., 0., 0., 0.], dtype=float32)},
787
- )
788
- ),
789
- c=[Linear(
790
- in_size=(4,),
791
- out_size=(5,),
792
- w_mask=None,
793
- weight=ParamState(
794
- value={'weight': Array([[-0.22384474, 0.79441446, -0.658726 , 0.05991402, 0.3014344 ],
795
- [-1.4755846 , -0.42272082, -0.07692316, 0.03077666, 0.34513143],
796
- [-0.69395834, 0.48617035, 1.1042316 , 0.13105175, -0.25620162],
797
- [ 0.50389856, 0.6998943 , 0.43716812, 1.2168779 , -0.47325954]], dtype=float32), 'bias': Array([0., 0., 0., 0., 0.], dtype=float32)},
798
- )
799
- ), Linear(
800
- in_size=(5,),
801
- out_size=(6,),
802
- w_mask=None,
803
- weight=ParamState(
804
- value={'weight': Array([[ 0.07714394, 0.78213537, 0.6745718 , -0.22881542, 0.5523547 ,
805
- -0.6399196 ],
806
- [-0.22626828, -0.54522336, 0.07448788, -0.00464636, 1.1483842 ,
807
- -0.57049096],
808
- [-0.86659616, 0.5683135 , -0.7449975 , 1.1862832 , 0.15047254,
809
- 0.68890226],
810
- [-1.0325443 , 0.2658072 , -0.10083053, -0.66915905, 0.11258496,
811
- 0.5440655 ],
812
- [ 0.27917263, 0.05717273, -0.5682605 , -0.88345915, 0.01314917,
813
- 0.780759 ]], dtype=float32), 'bias': Array([0., 0., 0., 0., 0., 0.], dtype=float32)},
814
- )
815
- )],
816
- d={'x': Linear(
817
- in_size=(6,),
818
- out_size=(7,),
819
- w_mask=None,
820
- weight=ParamState(
821
- value={'weight': Array([[-0.24238771, -0.23202638, 0.13663477, -0.48858666, 0.80871904,
822
- 0.00593298, 0.7595096 ],
823
- [ 0.50457454, 0.24180941, 0.25048748, 0.8937061 , 0.25398138,
824
- -1.2400566 , 0.00151599],
825
- [-0.19136038, 0.34470603, -0.11892717, -0.12514868, -0.5871703 ,
826
- 0.13572927, -1.1859009 ],
827
- [-0.01580911, 0.9301295 , -1.1246226 , -0.137708 , -0.4952151 ,
828
- 0.17537868, 0.98440856],
829
- [ 0.6399284 , 0.01739843, 0.61856824, 0.93258303, 0.64012206,
830
- 0.22780116, -0.5763679 ],
831
- [ 0.14077143, -1.0359222 , 0.28072503, 0.2557584 , -0.50622064,
832
- 0.4388198 , -0.26106128]], dtype=float32), 'bias': Array([0., 0., 0., 0., 0., 0., 0.], dtype=float32)},
833
- )
834
- ), 'y': Linear(
835
- in_size=(7,),
836
- out_size=(8,),
837
- w_mask=None,
838
- weight=ParamState(
839
- value={'weight': Array([[-0.23334591, -0.2893582 , 0.8071877 , -0.49038902, -0.29646504,
840
- 0.13624157, 0.22763114, 0.01906361],
841
- [-0.26742765, 0.20136863, 0.35148615, 0.42135832, 0.06401154,
842
- -0.78036404, 0.6616062 , 0.19437549],
843
- [ 0.9229799 , -0.1205209 , 0.69602865, 0.9685676 , -0.99886954,
844
- -0.12649904, -0.15393028, 0.65067965],
845
- [ 0.7020109 , -0.5452006 , 0.3649151 , -0.42368713, 0.24738027,
846
- 0.29290223, -0.63721114, 0.6007214 ],
847
- [-0.45045808, -0.08538888, -0.01338054, -0.39983988, 0.4028439 ,
848
- 1.0498686 , -0.24730456, 0.37612835],
849
- [ 0.16273966, 0.9001257 , 0.15190877, -1.1129239 , -0.29441378,
850
- 0.5168159 , -0.4205143 , 0.45700482],
851
- [ 0.08611429, -0.9271384 , -0.562362 , -0.586757 , 1.1611121 ,
852
- 0.5137503 , -0.46277294, 0.84642583]], dtype=float32), 'bias': Array([0., 0., 0., 0., 0., 0., 0., 0.], dtype=float32)},
853
- )
854
- )}
855
- )
856
-
857
- Args:
858
- graph_def: A GraphDef instance.
859
- state_mapping: A NestedDict instance.
860
- index_ref: A mapping from indexes to nodes references found during the graph
861
- traversal, defaults to None. If not provided, a new empty dictionary is
862
- created. This argument can be used to unflatten a sequence of (graphdef, state_mapping)
863
- pairs that share the same index space.
864
- index_ref_cache: A mapping from indexes to existing nodes that can be reused.
865
- When a reference is reused, ``GraphNodeImpl.clear`` is called to leave the
866
- object in an empty state and then filled by the unflatten process, as a result
867
- existing graph nodes are mutated to have the new content/topology
868
- specified by the graphdef.
829
+ Parameters
830
+ ----------
831
+ graph_def : GraphDef
832
+ A GraphDef instance.
833
+ state_mapping : NestedDict
834
+ A NestedDict instance containing the state mapping.
835
+ index_ref : dict[Index, Any], optional
836
+ A mapping from indexes to nodes references found during the graph
837
+ traversal. If not provided, a new empty dictionary is created. This argument
838
+ can be used to unflatten a sequence of (graphdef, state_mapping) pairs that
839
+ share the same index space.
840
+ index_ref_cache : dict[Index, Any], optional
841
+ A mapping from indexes to existing nodes that can be reused. When a reference
842
+ is reused, ``GraphNodeImpl.clear`` is called to leave the object in an empty
843
+ state and then filled by the unflatten process. As a result, existing graph
844
+ nodes are mutated to have the new content/topology specified by the graphdef.
845
+
846
+ Returns
847
+ -------
848
+ Node
849
+ The reconstructed node.
850
+
851
+ Examples
852
+ --------
853
+ .. code-block:: python
854
+
855
+ >>> import brainstate
856
+ >>> class MyNode(brainstate.graph.Node):
857
+ ... def __init__(self):
858
+ ... self.a = brainstate.nn.Linear(2, 3)
859
+ ... self.b = brainstate.nn.Linear(3, 4)
860
+ ...
861
+ >>> # Flatten a node
862
+ >>> node = MyNode()
863
+ >>> graphdef, statetree = brainstate.graph.flatten(node)
864
+ >>>
865
+ >>> # Unflatten back to node
866
+ >>> reconstructed_node = brainstate.graph.unflatten(graphdef, statetree)
867
+ >>> assert isinstance(reconstructed_node, MyNode)
868
+ >>> assert isinstance(reconstructed_node.a, brainstate.nn.Linear)
869
+ >>> assert isinstance(reconstructed_node.b, brainstate.nn.Linear)
869
870
  """
870
871
  index_ref = {} if index_ref is None else index_ref
871
872
  assert isinstance(graph_def, (NodeDef, NodeRef)), f"graph_def must be a NodeDef or NodeRef. But we got: {graph_def}"
@@ -874,7 +875,7 @@ def unflatten(
874
875
 
875
876
 
876
877
  def _graph_pop(
877
- node: Node,
878
+ node: Any,
878
879
  id_to_index: dict[int, Index],
879
880
  path_parts: PathParts,
880
881
  flatted_state_dicts: tuple[FlattedDict[PathParts, StateLeaf], ...],
@@ -922,61 +923,57 @@ def _graph_pop(
922
923
  pass
923
924
 
924
925
 
925
- @overload
926
- def pop_states(node, filter1: Filter, /) -> NestedDict:
927
- ...
928
-
929
-
930
- @overload
931
- def pop_states(node, filter1: Filter, filter2: Filter, /, *filters: Filter) -> tuple[NestedDict, ...]:
932
- ...
933
-
934
-
935
926
  @set_module_as('brainstate.graph')
936
927
  def pop_states(
937
- node: Node,
938
- *filters: Any
939
- ) -> Union[NestedDict[Key, State], Tuple[NestedDict[Key, State], ...]]:
928
+ node: Any, *filters: Any
929
+ ) -> Union[NestedDict, Tuple[NestedDict, ...]]:
940
930
  """
941
931
  Pop one or more :class:`State` types from the graph node.
942
932
 
943
- Example usage::
944
-
945
- >>> import brainstate as brainstate
946
- >>> import jax.numpy as jnp
947
-
948
- >>> class Model(brainstate.nn.Module):
949
- ... def __init__(self):
950
- ... super().__init__()
951
- ... self.a = brainstate.nn.Linear(2, 3)
952
- ... self.b = brainstate.nn.LIF([10, 2])
953
-
954
- >>> model = Model()
955
- >>> with brainstate.catch_new_states('new'):
956
- ... brainstate.nn.init_all_states(model)
957
-
958
- >>> assert len(model.states()) == 2
959
- >>> model_states = brainstate.graph.pop_states(model, 'new')
960
- >>> model_states
961
- NestedDict({
962
- 'b': {
963
- 'V': {
964
- 'st': ShortTermState(
965
- value=Array([0., 0., 0., 0., 0., 0., 0., 0., 0., 0., 0., 0., 0., 0., 0., 0., 0.,
966
- 0., 0., 0.], dtype=float32),
967
- tag='new'
968
- )
933
+ Parameters
934
+ ----------
935
+ node : Node
936
+ A graph node object.
937
+ *filters
938
+ One or more :class:`State` objects to filter by.
939
+
940
+ Returns
941
+ -------
942
+ NestedDict or tuple[NestedDict, ...]
943
+ The popped :class:`NestedDict` containing the :class:`State`
944
+ objects that were filtered for.
945
+
946
+ Examples
947
+ --------
948
+ .. code-block:: python
949
+
950
+ >>> import brainstate
951
+ >>> import jax.numpy as jnp
952
+
953
+ >>> class Model(brainstate.nn.Module):
954
+ ... def __init__(self):
955
+ ... super().__init__()
956
+ ... self.a = brainstate.nn.Linear(2, 3)
957
+ ... self.b = brainstate.nn.LIF([10, 2])
958
+
959
+ >>> model = Model()
960
+ >>> with brainstate.catch_new_states('new'):
961
+ ... brainstate.nn.init_all_states(model)
962
+
963
+ >>> assert len(model.states()) == 2
964
+ >>> model_states = brainstate.graph.pop_states(model, 'new')
965
+ >>> model_states # doctest: +SKIP
966
+ NestedDict({
967
+ 'b': {
968
+ 'V': {
969
+ 'st': ShortTermState(
970
+ value=Array([0., 0., 0., 0., 0., 0., 0., 0., 0., 0., 0., 0., 0., 0., 0., 0., 0.,
971
+ 0., 0., 0.], dtype=float32),
972
+ tag='new'
973
+ )
974
+ }
969
975
  }
970
- }
971
- })
972
-
973
- Args:
974
- node: A graph node object.
975
- *filters: One or more :class:`State` objects to filter by.
976
-
977
- Returns:
978
- The popped :class:`NestedDict` containing the :class:`State`
979
- objects that were filtered for.
976
+ })
980
977
  """
981
978
  if len(filters) == 0:
982
979
  raise ValueError('Expected at least one filter')
@@ -985,11 +982,13 @@ def pop_states(
985
982
  path_parts: PathParts = ()
986
983
  predicates = tuple(to_predicate(filter) for filter in filters)
987
984
  flatted_state_dicts: tuple[FlattedDict[PathParts, StateLeaf], ...] = tuple({} for _ in predicates)
988
- _graph_pop(node=node,
989
- id_to_index=id_to_index,
990
- path_parts=path_parts,
991
- flatted_state_dicts=flatted_state_dicts,
992
- predicates=predicates, )
985
+ _graph_pop(
986
+ node=node,
987
+ id_to_index=id_to_index,
988
+ path_parts=path_parts,
989
+ flatted_state_dicts=flatted_state_dicts,
990
+ predicates=predicates,
991
+ )
993
992
  states = tuple(NestedDict.from_flat(flat_state) for flat_state in flatted_state_dicts)
994
993
 
995
994
  if len(states) == 1:
@@ -1011,94 +1010,49 @@ def _split_state(
1011
1010
  return states # type: ignore[return-value]
1012
1011
 
1013
1012
 
1014
- @overload
1015
- def treefy_split(node: A, /) -> Tuple[GraphDef, NestedDict]:
1016
- ...
1017
-
1018
-
1019
- @overload
1020
- def treefy_split(node: A, first: Filter, /) -> Tuple[GraphDef, NestedDict]:
1021
- ...
1022
-
1023
-
1024
- @overload
1025
- def treefy_split(node: A, first: Filter, second: Filter, /) -> Tuple[GraphDef, NestedDict, NestedDict]:
1026
- ...
1027
-
1028
-
1029
- @overload
1030
- def treefy_split(
1031
- node: A, first: Filter, second: Filter, /, *filters: Filter,
1032
- ) -> Tuple[GraphDef, NestedDict, Unpack[Tuple[NestedDict, ...]]]:
1033
- ...
1034
-
1035
-
1036
1013
  @set_module_as('brainstate.graph')
1037
1014
  def treefy_split(
1038
- node: A,
1039
- *filters: Filter
1040
- ) -> Tuple[GraphDef[A], NestedDict, Unpack[Tuple[NestedDict, ...]]]:
1041
- """Split a graph node into a :class:`GraphDef` and one or more :class:`NestedDict`s. NestedDict is
1042
- a ``Mapping`` from strings or integers to ``Variables``, Arrays or nested States. GraphDef
1043
- contains all the static information needed to reconstruct a ``Module`` graph, it is analogous
1044
- to JAX’s ``PyTreeDef``. :func:`split` is used in conjunction with :func:`merge` to switch
1045
- seamlessly between stateful and stateless representations of the graph.
1046
-
1047
- Example usage::
1048
-
1049
- >>> from joblib.testing import param >>> import brainstate as brainstate
1050
- >>> import jax, jax.numpy as jnp
1051
- ...
1052
- >>> class Foo(brainstate.graph.Node):
1053
- ... def __init__(self):
1054
- ... self.a = brainstate.nn.BatchNorm1d([10, 2])
1055
- ... self.b = brainstate.nn.Linear(2, 3)
1056
- ...
1057
- >>> node = Foo()
1058
- >>> graphdef, params, others = brainstate.graph.treefy_split(node, brainstate.ParamState, ...)
1059
- ...
1060
- >>> params
1061
- NestedDict({
1062
- 'a': {
1063
- 'weight': TreefyState(
1064
- type=ParamState,
1065
- value={'weight': Array([[-1.0013659, 1.5763807],
1066
- [ 1.7149199, 2.0140953]], dtype=float32), 'bias': Array([0., 0.], dtype=float32)}
1067
- )
1068
- },
1069
- 'b': {
1070
- 'weight': TreefyState(
1071
- type=ParamState,
1072
- value={'bias': Array([[0., 0.]], dtype=float32), 'scale': Array([[1., 1.]], dtype=float32)}
1073
- )
1074
- }
1075
- })
1076
- >>> jax.tree.map(jnp.shape, others)
1077
- NestedDict({
1078
- 'b': {
1079
- 'running_mean': TreefyState(
1080
- type=LongTermState,
1081
- value=(1, 2)
1082
- ),
1083
- 'running_var': TreefyState(
1084
- type=LongTermState,
1085
- value=(1, 2)
1086
- )
1087
- }
1088
- })
1089
-
1090
- :func:`split` and :func:`merge` are primarily used to interact directly with JAX
1091
- transformations, see
1092
- `Functional API <https://flax.readthedocs.io/en/latest/nnx/nnx_basics.html#the-functional-api>`__
1093
- for more information.
1094
-
1095
- Arguments:
1096
- node: graph node to split.
1097
- *filters: some optional filters to group the state into mutually exclusive substates.
1015
+ node: A, *filters: Filter
1016
+ ):
1017
+ """
1018
+ Split a graph node into a :class:`GraphDef` and one or more :class:`NestedDict`s.
1098
1019
 
1099
- Returns:
1100
- ``GraphDef`` and one or more ``States`` equal to the number of filters passed. If no
1101
- filters are passed, a single ``NestedDict`` is returned.
1020
+ NestedDict is a ``Mapping`` from strings or integers to ``Variables``, Arrays or nested States.
1021
+ GraphDef contains all the static information needed to reconstruct a ``Module`` graph, it is
1022
+ analogous to JAX's ``PyTreeDef``. :func:`split` is used in conjunction with :func:`merge` to
1023
+ switch seamlessly between stateful and stateless representations of the graph.
1024
+
1025
+ Parameters
1026
+ ----------
1027
+ node : A
1028
+ Graph node to split.
1029
+ *filters
1030
+ Optional filters to group the state into mutually exclusive substates.
1031
+
1032
+ Returns
1033
+ -------
1034
+ tuple
1035
+ ``GraphDef`` and one or more ``States`` equal to the number of filters passed.
1036
+ If no filters are passed, a single ``NestedDict`` is returned.
1037
+
1038
+ Examples
1039
+ --------
1040
+ .. code-block:: python
1041
+
1042
+ >>> import brainstate
1043
+ >>> import jax, jax.numpy as jnp
1044
+
1045
+ >>> class Foo(brainstate.graph.Node):
1046
+ ... def __init__(self):
1047
+ ... self.a = brainstate.nn.BatchNorm1d([10, 2])
1048
+ ... self.b = brainstate.nn.Linear(2, 3)
1049
+ ...
1050
+ >>> node = Foo()
1051
+ >>> graphdef, params, others = brainstate.graph.treefy_split(
1052
+ ... node, brainstate.ParamState, ...
1053
+ ... )
1054
+ >>> # params contains ParamState variables
1055
+ >>> # others contains all other state variables
1102
1056
  """
1103
1057
  graphdef, state_tree = flatten(node)
1104
1058
  states = tuple(_split_state(state_tree, filters))
@@ -1106,49 +1060,47 @@ def treefy_split(
1106
1060
 
1107
1061
 
1108
1062
  @set_module_as('brainstate.graph')
1109
- def treefy_merge(
1110
- graphdef: GraphDef[A],
1111
- state_mapping: GraphStateMapping,
1112
- /,
1113
- *state_mappings: GraphStateMapping,
1114
- ) -> A:
1115
- """The inverse of :func:`split`.
1063
+ def treefy_merge(graphdef: GraphDef[A], *state_mappings) -> A:
1064
+ """
1065
+ The inverse of :func:`split`.
1116
1066
 
1117
1067
  ``merge`` takes a :class:`GraphDef` and one or more :class:`NestedDict`'s and creates
1118
1068
  a new node with the same structure as the original node.
1119
1069
 
1120
- Example usage::
1121
-
1122
- >>> import brainstate as brainstate
1123
- >>> import jax, jax.numpy as jnp
1124
- ...
1125
- >>> class Foo(brainstate.graph.Node):
1126
- ... def __init__(self):
1127
- ... self.a = brainstate.nn.BatchNorm1d([10, 2])
1128
- ... self.b = brainstate.nn.Linear(2, 3)
1129
- ...
1130
- >>> node = Foo()
1131
- >>> graphdef, params, others = brainstate.graph.treefy_split(node, brainstate.ParamState, ...)
1132
- ...
1133
- >>> new_node = brainstate.graph.treefy_merge(graphdef, params, others)
1134
- >>> assert isinstance(new_node, Foo)
1135
- >>> assert isinstance(new_node.b, brainstate.nn.BatchNorm1d)
1136
- >>> assert isinstance(new_node.a, brainstate.nn.Linear)
1137
-
1138
- :func:`split` and :func:`merge` are primarily used to interact directly with JAX
1139
- transformations, see
1140
- `Functional API <https://flax.readthedocs.io/en/latest/nnx/nnx_basics.html#the-functional-api>`__
1141
- for more information.
1142
-
1143
- Args:
1144
- graphdef: A :class:`GraphDef` object.
1145
- state_mapping: A :class:`NestedDict` object.
1146
- *state_mappings: Additional :class:`NestedDict` objects.
1147
-
1148
- Returns:
1149
- The merged :class:`Module`.
1070
+ Parameters
1071
+ ----------
1072
+ graphdef : GraphDef[A]
1073
+ A :class:`GraphDef` object.
1074
+ *state_mappings
1075
+ Additional :class:`NestedDict` objects.
1076
+
1077
+ Returns
1078
+ -------
1079
+ A
1080
+ The merged :class:`Module`.
1081
+
1082
+ Examples
1083
+ --------
1084
+ .. code-block:: python
1085
+
1086
+ >>> import brainstate
1087
+ >>> import jax, jax.numpy as jnp
1088
+
1089
+ >>> class Foo(brainstate.graph.Node):
1090
+ ... def __init__(self):
1091
+ ... self.a = brainstate.nn.BatchNorm1d([10, 2])
1092
+ ... self.b = brainstate.nn.Linear(2, 3)
1093
+ ...
1094
+ >>> node = Foo()
1095
+ >>> graphdef, params, others = brainstate.graph.treefy_split(
1096
+ ... node, brainstate.ParamState, ...
1097
+ ... )
1098
+ >>> new_node = brainstate.graph.treefy_merge(graphdef, params, others)
1099
+ >>> assert isinstance(new_node, Foo)
1100
+ >>> assert isinstance(new_node.b, brainstate.nn.BatchNorm1d)
1101
+ >>> assert isinstance(new_node.a, brainstate.nn.Linear)
1150
1102
  """
1151
- state_mapping = GraphStateMapping.merge(state_mapping, *state_mappings)
1103
+ state_mapping = GraphStateMapping.merge(*state_mappings)
1152
1104
  node = unflatten(graphdef, state_mapping)
1153
1105
  return node
1154
1106
 
@@ -1186,31 +1138,27 @@ def _split_flatted(
1186
1138
  return flat_states
1187
1139
 
1188
1140
 
1189
- @overload
1190
- def nodes(node, /, allowed_hierarchy=(0, _max_int)) -> FlattedDict[Key, Node]:
1191
- ...
1192
-
1193
-
1194
- @overload
1195
- def nodes(node, first: Filter, /, allowed_hierarchy=(0, _max_int)) -> FlattedDict[Key, Node]:
1196
- ...
1197
-
1198
-
1199
- @overload
1200
- def nodes(
1201
- node, first: Filter, second: Filter, /, *filters: Filter, allowed_hierarchy=(0, _max_int)
1202
- ) -> Tuple[FlattedDict[Key, Node], ...]:
1203
- ...
1204
-
1205
-
1206
1141
  @set_module_as('brainstate.graph')
1207
1142
  def nodes(
1208
- node,
1209
- *filters: Filter,
1210
- allowed_hierarchy: Tuple[int, int] = (0, _max_int)
1211
- ) -> Union[FlattedDict[Key, Node], Tuple[FlattedDict[Key, Node], ...]]:
1143
+ node, *filters: Filter, allowed_hierarchy: Tuple[int, int] = (0, MAX_INT)
1144
+ ):
1212
1145
  """
1213
1146
  Similar to :func:`split` but only returns the :class:`NestedDict`'s indicated by the filters.
1147
+
1148
+ Parameters
1149
+ ----------
1150
+ node : Node
1151
+ The node to get nodes from.
1152
+ *filters
1153
+ Filters to apply to the nodes.
1154
+ allowed_hierarchy : tuple[int, int], optional
1155
+ The allowed hierarchy levels, by default (0, MAX_INT).
1156
+
1157
+ Returns
1158
+ -------
1159
+ FlattedDict or tuple[FlattedDict, ...]
1160
+ The filtered nodes.
1161
+
1214
1162
  """
1215
1163
  num_filters = len(filters)
1216
1164
  if num_filters == 0:
@@ -1232,31 +1180,27 @@ def _states_generator(node, allowed_hierarchy) -> Iterable[Tuple[PathParts, Stat
1232
1180
  yield path, value
1233
1181
 
1234
1182
 
1235
- @overload
1236
- def states(node, /, allowed_hierarchy=(0, _max_int)) -> FlattedDict[Key, State]:
1237
- ...
1238
-
1239
-
1240
- @overload
1241
- def states(node, first: Filter, /, allowed_hierarchy=(0, _max_int)) -> FlattedDict[Key, State]:
1242
- ...
1243
-
1244
-
1245
- @overload
1246
- def states(
1247
- node, first: Filter, second: Filter, /, *filters: Filter, allowed_hierarchy=(0, _max_int)
1248
- ) -> tuple[FlattedDict[Key, State], ...]:
1249
- ...
1250
-
1251
-
1252
1183
  @set_module_as('brainstate.graph')
1253
1184
  def states(
1254
- node,
1255
- *filters: Filter,
1256
- allowed_hierarchy: Tuple[int, int] = (0, _max_int)
1257
- ) -> Union[FlattedDict[Key, State], tuple[FlattedDict[Key, State], ...]]:
1185
+ node, *filters: Filter, allowed_hierarchy: Tuple[int, int] = (0, MAX_INT)
1186
+ ) -> Union[FlattedDict, tuple[FlattedDict, ...]]:
1258
1187
  """
1259
1188
  Similar to :func:`split` but only returns the :class:`NestedDict`'s indicated by the filters.
1189
+
1190
+ Parameters
1191
+ ----------
1192
+ node : Node
1193
+ The node to get states from.
1194
+ *filters
1195
+ Filters to apply to the states.
1196
+ allowed_hierarchy : tuple[int, int], optional
1197
+ The allowed hierarchy levels, by default (0, MAX_INT).
1198
+
1199
+ Returns
1200
+ -------
1201
+ FlattedDict or tuple[FlattedDict, ...]
1202
+ The filtered states.
1203
+
1260
1204
  """
1261
1205
  num_filters = len(filters)
1262
1206
  if num_filters == 0:
@@ -1272,72 +1216,60 @@ def states(
1272
1216
  return state_maps[:num_filters]
1273
1217
 
1274
1218
 
1275
- @overload
1276
- def treefy_states(
1277
- node, /, flatted: bool = False
1278
- ) -> NestedDict[Key, TreefyState]:
1279
- ...
1280
-
1281
-
1282
- @overload
1283
- def treefy_states(
1284
- node, first: Filter, /, flatted: bool = False
1285
- ) -> NestedDict[Key, TreefyState]:
1286
- ...
1287
-
1288
-
1289
- @overload
1290
- def treefy_states(
1291
- node, first: Filter, second: Filter, /, *filters: Filter, flatted: bool = False
1292
- ) -> Tuple[NestedDict[Key, TreefyState], ...]:
1293
- ...
1294
-
1295
-
1296
1219
  @set_module_as('brainstate.graph')
1297
1220
  def treefy_states(
1298
1221
  node, *filters,
1299
- ) -> NestedDict[Key, TreefyState] | tuple[NestedDict[Key, TreefyState], ...]:
1222
+ ):
1300
1223
  """
1301
1224
  Similar to :func:`split` but only returns the :class:`NestedDict`'s indicated by the filters.
1302
1225
 
1303
- Example usage::
1304
-
1305
- >>> import brainstate as brainstate
1306
- >>> class Model(brainstate.nn.Module):
1307
- ... def __init__(self):
1308
- ... super().__init__()
1309
- ... self.l1 = brainstate.nn.Linear(2, 3)
1310
- ... self.l2 = brainstate.nn.Linear(3, 4)
1311
- ... def __call__(self, x):
1312
- ... return self.l2(self.l1(x))
1313
-
1314
- >>> model = Model()
1315
- >>> # get the learnable parameters from the batch norm and linear layer
1316
- >>> params = brainstate.graph.treefy_states(model, brainstate.ParamState)
1317
- >>> # get them separately
1318
- >>> params, others = brainstate.graph.treefy_states(model, brainstate.ParamState, brainstate.ShortTermState)
1319
- >>> # get them together
1320
- >>> states = brainstate.graph.treefy_states(model)
1321
-
1322
- Args:
1323
- node: A graph node object.
1324
- *filters: One or more :class:`State` objects to filter by.
1325
-
1326
- Returns:
1327
- One or more :class:`NestedDict` mappings.
1226
+ Parameters
1227
+ ----------
1228
+ node : Node
1229
+ A graph node object.
1230
+ *filters
1231
+ One or more :class:`State` objects to filter by.
1232
+
1233
+ Returns
1234
+ -------
1235
+ NestedDict or tuple of NestedDict
1236
+ One or more :class:`NestedDict` mappings.
1237
+
1238
+ Examples
1239
+ --------
1240
+ .. code-block:: python
1241
+
1242
+ >>> import brainstate
1243
+ >>> class Model(brainstate.nn.Module):
1244
+ ... def __init__(self):
1245
+ ... super().__init__()
1246
+ ... self.l1 = brainstate.nn.Linear(2, 3)
1247
+ ... self.l2 = brainstate.nn.Linear(3, 4)
1248
+ ... def __call__(self, x):
1249
+ ... return self.l2(self.l1(x))
1250
+
1251
+ >>> model = Model()
1252
+ >>> # Get the learnable parameters
1253
+ >>> params = brainstate.graph.treefy_states(model, brainstate.ParamState)
1254
+ >>> # Get them separately
1255
+ >>> params, others = brainstate.graph.treefy_states(
1256
+ ... model, brainstate.ParamState, brainstate.ShortTermState
1257
+ ... )
1258
+ >>> # Get all states together
1259
+ >>> states = brainstate.graph.treefy_states(model)
1328
1260
  """
1329
1261
  _, state_mapping = flatten(node)
1330
- state_mappings: GraphStateMapping | tuple[GraphStateMapping, ...]
1331
1262
  if len(filters) == 0:
1332
- state_mappings = state_mapping
1333
- elif len(filters) == 1:
1334
- state_mappings = state_mapping.filter(filters[0])
1263
+ return state_mapping
1335
1264
  else:
1336
- state_mappings = state_mapping.filter(filters[0], filters[1], *filters[2:])
1337
- return state_mappings
1265
+ state_mappings = state_mapping.filter(*filters)
1266
+ if len(filters) == 1:
1267
+ return state_mappings[0]
1268
+ else:
1269
+ return state_mappings
1338
1270
 
1339
1271
 
1340
- def _graph_update_dynamic(node: Any, state: Mapping[Key, Any]):
1272
+ def _graph_update_dynamic(node: Any, state: Mapping) -> None:
1341
1273
  if not _is_node(node):
1342
1274
  raise RuntimeError(f'Unsupported type: {type(node)}')
1343
1275
 
@@ -1350,7 +1282,8 @@ def _graph_update_dynamic(node: Any, state: Mapping[Key, Any]):
1350
1282
  raise ValueError(f'Cannot set key {key!r} on immutable node of '
1351
1283
  f'type {type(node).__name__}')
1352
1284
  if isinstance(value, State):
1353
- value = value.copy() # TODO: chenge it to state_ref
1285
+ # TODO: here maybe error? we should check if the state already belongs to another node?
1286
+ value = value.to_state_ref() # Convert to state reference for proper state management
1354
1287
  node_impl.set_key(node, key, value)
1355
1288
  continue
1356
1289
 
@@ -1379,18 +1312,23 @@ def _graph_update_dynamic(node: Any, state: Mapping[Key, Any]):
1379
1312
 
1380
1313
 
1381
1314
  def update_states(
1382
- node: Node,
1383
- state_dict: NestedDict | FlattedDict,
1315
+ node: Any,
1316
+ state_dict: Union[NestedDict, FlattedDict],
1384
1317
  /,
1385
- *state_dicts: NestedDict | FlattedDict
1318
+ *state_dicts: Union[NestedDict, FlattedDict]
1386
1319
  ) -> None:
1387
1320
  """
1388
1321
  Update the given graph node with a new :class:`NestedMapping` in-place.
1389
1322
 
1390
- Args:
1391
- node: A graph node to update.
1392
- state_dict: A :class:`NestedMapping` object.
1393
- *state_dicts: Additional :class:`NestedMapping` objects.
1323
+ Parameters
1324
+ ----------
1325
+ node : Node
1326
+ A graph node to update.
1327
+ state_dict : NestedDict | FlattedDict
1328
+ A :class:`NestedMapping` object.
1329
+ *state_dicts : NestedDict | FlattedDict
1330
+ Additional :class:`NestedMapping` objects.
1331
+
1394
1332
  """
1395
1333
  if state_dicts:
1396
1334
  state_dict = NestedDict.merge(state_dict, *state_dicts)
@@ -1398,177 +1336,110 @@ def update_states(
1398
1336
 
1399
1337
 
1400
1338
  @set_module_as('brainstate.graph')
1401
- def graphdef(node: Any, /) -> GraphDef[Any]:
1402
- """Get the :class:`GraphDef` of the given graph node.
1339
+ def graphdef(node: Any) -> GraphDef[Any]:
1340
+ """
1341
+ Get the :class:`GraphDef` of the given graph node.
1342
+
1343
+ Parameters
1344
+ ----------
1345
+ node : Any
1346
+ A graph node object.
1403
1347
 
1404
- Example usage::
1348
+ Returns
1349
+ -------
1350
+ GraphDef[Any]
1351
+ The :class:`GraphDef` of the :class:`Module` object.
1405
1352
 
1406
- >>> import brainstate as brainstate
1353
+ Examples
1354
+ --------
1355
+ .. code-block:: python
1407
1356
 
1408
- >>> model = brainstate.nn.Linear(2, 3)
1409
- >>> graphdef, _ = brainstate.graph.treefy_split(model)
1410
- >>> assert graphdef == brainstate.graph.graphdef(model)
1357
+ >>> import brainstate
1411
1358
 
1412
- Args:
1413
- node: A graph node object.
1359
+ >>> model = brainstate.nn.Linear(2, 3)
1360
+ >>> graphdef, _ = brainstate.graph.treefy_split(model)
1361
+ >>> assert graphdef == brainstate.graph.graphdef(model)
1414
1362
 
1415
- Returns:
1416
- The :class:`GraphDef` of the :class:`Module` object.
1417
1363
  """
1418
1364
  graphdef, _ = flatten(node)
1419
1365
  return graphdef
1420
1366
 
1421
1367
 
1422
1368
  @set_module_as('brainstate.graph')
1423
- def clone(node: Node) -> Node:
1369
+ def clone(node: A) -> A:
1424
1370
  """
1425
1371
  Create a deep copy of the given graph node.
1426
1372
 
1427
- Example usage::
1373
+ Parameters
1374
+ ----------
1375
+ node : Node
1376
+ A graph node object.
1428
1377
 
1429
- >>> import brainstate as brainstate
1430
- >>> model = brainstate.nn.Linear(2, 3)
1431
- >>> cloned_model = clone(model)
1432
- >>> model.weight.value['bias'] += 1
1433
- >>> assert (model.weight.value['bias'] != cloned_model.weight.value['bias']).all()
1378
+ Returns
1379
+ -------
1380
+ Node
1381
+ A deep copy of the :class:`Module` object.
1434
1382
 
1435
- Args:
1436
- node: A graph node object.
1383
+ Examples
1384
+ --------
1385
+ .. code-block:: python
1386
+
1387
+ >>> import brainstate
1388
+ >>> model = brainstate.nn.Linear(2, 3)
1389
+ >>> cloned_model = brainstate.graph.clone(model)
1390
+ >>> model.weight.value['bias'] += 1
1391
+ >>> assert (model.weight.value['bias'] != cloned_model.weight.value['bias']).all()
1437
1392
 
1438
- Returns:
1439
- A deep copy of the :class:`Module` object.
1440
1393
  """
1441
1394
  graphdef, state = treefy_split(node)
1442
1395
  return treefy_merge(graphdef, state)
1443
1396
 
1444
1397
 
1445
- @set_module_as('brainstate.graph')
1446
- def call(
1447
- graphdef_state: Tuple[GraphDef[A], GraphStateMapping],
1448
- ) -> ApplyCaller[Tuple[GraphDef[A], GraphStateMapping]]:
1449
- """Calls a method underlying graph node defined by a (GraphDef, NestedDict) pair.
1450
-
1451
- ``call`` takes a ``(GraphDef, NestedDict)`` pair and creates a proxy object that can be
1452
- used to call methods on the underlying graph node. When a method is called, the
1453
- output is returned along with a new (GraphDef, NestedDict) pair that represents the
1454
- updated state of the graph node. ``call`` is equivalent to :func:`merge` > ``method``
1455
- > :func:`split`` but is more convenient to use in pure JAX functions.
1456
-
1457
- Example::
1458
-
1459
- >>> import brainstate as brainstate
1460
- >>> import jax
1461
- >>> import jax.numpy as jnp
1462
- ...
1463
- >>> class StatefulLinear(brainstate.graph.Node):
1464
- ... def __init__(self, din, dout):
1465
- ... self.w = brainstate.ParamState(brainstate.random.rand(din, dout))
1466
- ... self.b = brainstate.ParamState(jnp.zeros((dout,)))
1467
- ... self.count = brainstate.State(jnp.array(0, dtype=jnp.uint32))
1468
- ...
1469
- ... def increment(self):
1470
- ... self.count.value += 1
1471
- ...
1472
- ... def __call__(self, x):
1473
- ... self.increment()
1474
- ... return x @ self.w.value + self.b.value
1475
- ...
1476
- >>> linear = StatefulLinear(3, 2)
1477
- >>> linear_state = brainstate.graph.treefy_split(linear)
1478
- ...
1479
- >>> @jax.jit
1480
- ... def forward(x, linear_state):
1481
- ... y, linear_state = brainstate.graph.call(linear_state)(x)
1482
- ... return y, linear_state
1483
- ...
1484
- >>> x = jnp.ones((1, 3))
1485
- >>> y, linear_state = forward(x, linear_state)
1486
- >>> y, linear_state = forward(x, linear_state)
1487
- ...
1488
- >>> linear = brainstate.graph.treefy_merge(*linear_state)
1489
- >>> linear.count.value
1490
- Array(2, dtype=uint32)
1491
-
1492
- The proxy object returned by ``call`` supports indexing and attribute access
1493
- to access nested methods. In the example below, the ``increment`` method indexing
1494
- is used to call the ``increment`` method of the ``StatefulLinear`` module
1495
- at the ``b`` key of a ``nodes`` dictionary.
1496
-
1497
- >>> class StatefulLinear(brainstate.graph.Node):
1498
- ... def __init__(self, din, dout):
1499
- ... self.w = brainstate.ParamState(brainstate.random.rand(din, dout))
1500
- ... self.b = brainstate.ParamState(jnp.zeros((dout,)))
1501
- ... self.count = brainstate.State(jnp.array(0, dtype=jnp.uint32))
1502
- ...
1503
- ... def increment(self):
1504
- ... self.count.value += 1
1505
- ...
1506
- ... def __call__(self, x):
1507
- ... self.increment()
1508
- ... return x @ self.w.value + self.b.value
1509
- ...
1510
- >>> nodes = dict(
1511
- ... a=StatefulLinear(3, 2),
1512
- ... b=StatefulLinear(2, 1),
1513
- ... )
1514
- ...
1515
- >>> node_state = treefy_split(nodes)
1516
- >>> # use attribute access
1517
- >>> _, node_state = brainstate.graph.call(node_state)['b'].increment()
1518
- ...
1519
- >>> nodes = treefy_merge(*node_state)
1520
- >>> nodes['a'].count.value
1521
- Array(0, dtype=uint32)
1522
- >>> nodes['b'].count.value
1523
- Array(1, dtype=uint32)
1524
- """
1525
-
1526
- def pure_caller(accessor: DelayedAccessor, *args, **kwargs):
1527
- node = treefy_merge(*graphdef_state)
1528
- method = accessor(node)
1529
- out = method(*args, **kwargs)
1530
- return out, treefy_split(node)
1531
-
1532
- return CallableProxy(pure_caller) # type: ignore
1533
-
1534
-
1535
1398
  @set_module_as('brainstate.graph')
1536
1399
  def iter_leaf(
1537
- node: Any,
1538
- allowed_hierarchy: Tuple[int, int] = (0, _max_int)
1400
+ node: Any, allowed_hierarchy: Tuple[int, int] = (0, MAX_INT)
1539
1401
  ) -> Iterator[tuple[PathParts, Any]]:
1540
- """Iterates over all nested leaves in the given graph node, including the current node.
1402
+ """
1403
+ Iterates over all nested leaves in the given graph node, including the current node.
1541
1404
 
1542
1405
  ``iter_leaf`` creates a generator that yields path and value pairs, where
1543
1406
  the path is a tuple of strings or integers representing the path to the value from the
1544
1407
  root. Repeated nodes are visited only once. Leaves include static values.
1545
1408
 
1546
- Example::
1547
- >>> import brainstate as brainstate
1548
- >>> import jax.numpy as jnp
1549
- ...
1550
- >>> class Linear(brainstate.nn.Module):
1551
- ... def __init__(self, din, dout):
1552
- ... super().__init__()
1553
- ... self.weight = brainstate.ParamState(brainstate.random.randn(din, dout))
1554
- ... self.bias = brainstate.ParamState(brainstate.random.randn(dout))
1555
- ... self.a = 1
1556
- ...
1557
- >>> module = Linear(3, 4)
1558
- ...
1559
- >>> for path, value in brainstate.graph.iter_leaf([module, module]):
1560
- ... print(path, type(value).__name__)
1561
- ...
1562
- (0, 'a') int
1563
- (0, 'bias') ParamState
1564
- (0, 'weight') ParamState
1565
-
1566
1409
  Parameters
1567
1410
  ----------
1568
- node: Node
1569
- The node to iterate over.
1570
- allowed_hierarchy: tuple of int
1571
- The allowed hierarchy.
1411
+ node : Any
1412
+ The node to iterate over.
1413
+ allowed_hierarchy : tuple[int, int], optional
1414
+ The allowed hierarchy levels, by default (0, MAX_INT).
1415
+
1416
+ Yields
1417
+ ------
1418
+ Iterator[tuple[PathParts, Any]]
1419
+ Path and value pairs.
1420
+
1421
+ Examples
1422
+ --------
1423
+ .. code-block:: python
1424
+
1425
+ >>> import brainstate
1426
+ >>> import jax.numpy as jnp
1427
+
1428
+ >>> class Linear(brainstate.nn.Module):
1429
+ ... def __init__(self, din, dout):
1430
+ ... super().__init__()
1431
+ ... self.weight = brainstate.ParamState(brainstate.random.randn(din, dout))
1432
+ ... self.bias = brainstate.ParamState(brainstate.random.randn(dout))
1433
+ ... self.a = 1
1434
+ ...
1435
+ >>> module = Linear(3, 4)
1436
+ ...
1437
+ >>> for path, value in brainstate.graph.iter_leaf([module, module]):
1438
+ ... print(path, type(value).__name__)
1439
+ ...
1440
+ (0, 'a') int
1441
+ (0, 'bias') ParamState
1442
+ (0, 'weight') ParamState
1572
1443
 
1573
1444
  """
1574
1445
 
@@ -1605,8 +1476,7 @@ def iter_leaf(
1605
1476
 
1606
1477
  @set_module_as('brainstate.graph')
1607
1478
  def iter_node(
1608
- node: Any,
1609
- allowed_hierarchy: Tuple[int, int] = (0, _max_int)
1479
+ node: Any, allowed_hierarchy: Tuple[int, int] = (0, MAX_INT)
1610
1480
  ) -> Iterator[Tuple[PathParts, Any]]:
1611
1481
  """
1612
1482
  Iterates over all nested nodes of the given graph node, including the current node.
@@ -1615,39 +1485,47 @@ def iter_node(
1615
1485
  the path is a tuple of strings or integers representing the path to the value from the
1616
1486
  root. Repeated nodes are visited only once. Leaves include static values.
1617
1487
 
1618
- Example::
1619
- >>> import brainstate as brainstate
1620
- >>> import jax.numpy as jnp
1621
- ...
1622
- >>> class Model(brainstate.nn.Module):
1623
- ... def __init__(self):
1624
- ... super().__init__()
1625
- ... self.a = brainstate.nn.Linear(1, 2)
1626
- ... self.b = brainstate.nn.Linear(2, 3)
1627
- ... self.c = [brainstate.nn.Linear(3, 4), brainstate.nn.Linear(4, 5)]
1628
- ... self.d = {'x': brainstate.nn.Linear(5, 6), 'y': brainstate.nn.Linear(6, 7)}
1629
- ... self.b.a = brainstate.nn.LIF(2)
1630
- ...
1631
- >>> model = Model()
1632
- ...
1633
- >>> for path, node in brainstate.graph.iter_node([model, model]):
1634
- ... print(path, node.__class__.__name__)
1635
- ...
1636
- (0, 'a') Linear
1637
- (0, 'b', 'a') LIF
1638
- (0, 'b') Linear
1639
- (0, 'c', 0) Linear
1640
- (0, 'c', 1) Linear
1641
- (0, 'd', 'x') Linear
1642
- (0, 'd', 'y') Linear
1643
- (0,) Model
1644
-
1645
1488
  Parameters
1646
1489
  ----------
1647
- node: Node
1648
- The node to iterate over.
1649
- allowed_hierarchy: tuple of int
1650
- The allowed hierarchy.
1490
+ node : Any
1491
+ The node to iterate over.
1492
+ allowed_hierarchy : tuple[int, int], optional
1493
+ The allowed hierarchy levels, by default (0, MAX_INT).
1494
+
1495
+ Yields
1496
+ ------
1497
+ tuple[PathParts, Any]
1498
+ Path and node pairs.
1499
+
1500
+ Examples
1501
+ --------
1502
+ .. code-block:: python
1503
+
1504
+ >>> import brainstate
1505
+ >>> import jax.numpy as jnp
1506
+
1507
+ >>> class Model(brainstate.nn.Module):
1508
+ ... def __init__(self):
1509
+ ... super().__init__()
1510
+ ... self.a = brainstate.nn.Linear(1, 2)
1511
+ ... self.b = brainstate.nn.Linear(2, 3)
1512
+ ... self.c = [brainstate.nn.Linear(3, 4), brainstate.nn.Linear(4, 5)]
1513
+ ... self.d = {'x': brainstate.nn.Linear(5, 6), 'y': brainstate.nn.Linear(6, 7)}
1514
+ ... self.b.a = brainstate.nn.LIF(2)
1515
+ ...
1516
+ >>> model = Model()
1517
+ ...
1518
+ >>> for path, node in brainstate.graph.iter_node([model, model]):
1519
+ ... print(path, node.__class__.__name__)
1520
+ ...
1521
+ (0, 'a') Linear
1522
+ (0, 'b', 'a') LIF
1523
+ (0, 'b') Linear
1524
+ (0, 'c', 0) Linear
1525
+ (0, 'c', 1) Linear
1526
+ (0, 'd', 'x') Linear
1527
+ (0, 'd', 'y') Linear
1528
+ (0,) Model
1651
1529
 
1652
1530
  """
1653
1531
 
@@ -1686,8 +1564,16 @@ def iter_node(
1686
1564
 
1687
1565
  @dataclasses.dataclass(frozen=True)
1688
1566
  class Static(Generic[A]):
1689
- """An empty pytree node that treats its inner value as static.
1567
+ """
1568
+ An empty pytree node that treats its inner value as static.
1569
+
1690
1570
  ``value`` must define ``__eq__`` and ``__hash__``.
1571
+
1572
+ Attributes
1573
+ ----------
1574
+ value : A
1575
+ The static value to wrap.
1576
+
1691
1577
  """
1692
1578
 
1693
1579
  value: A
@@ -1721,16 +1607,16 @@ def _key_path_to_key(key: Any) -> Key:
1721
1607
  return str(key)
1722
1608
 
1723
1609
 
1724
- def _flatten_pytree(pytree: Any):
1610
+ def _flatten_pytree(pytree: Any) -> Tuple[Tuple[Tuple, ...], jax.tree_util.PyTreeDef]:
1725
1611
  leaves, treedef = jax.tree_util.tree_flatten_with_path(pytree, is_leaf=lambda x: x is not pytree)
1726
1612
  nodes = tuple((_key_path_to_key(path[0]), value) for path, value in leaves)
1727
1613
  return nodes, treedef
1728
1614
 
1729
1615
 
1730
1616
  def _unflatten_pytree(
1731
- nodes: tuple[tuple[Key, Any], ...],
1617
+ nodes: tuple[tuple, ...],
1732
1618
  treedef: jax.tree_util.PyTreeDef
1733
- ):
1619
+ ) -> Any:
1734
1620
  pytree = treedef.unflatten(value for _, value in nodes)
1735
1621
  return pytree
1736
1622