brainstate 0.1.0.post20250105__py2.py3-none-any.whl → 0.1.0.post20250120__py2.py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- brainstate/_state.py +77 -44
- brainstate/_state_test.py +0 -17
- brainstate/augment/_eval_shape.py +9 -10
- brainstate/augment/_eval_shape_test.py +1 -1
- brainstate/augment/_mapping.py +265 -277
- brainstate/augment/_mapping_test.py +147 -175
- brainstate/compile/_ad_checkpoint.py +6 -4
- brainstate/compile/_jit.py +37 -28
- brainstate/compile/_loop_collect_return.py +6 -3
- brainstate/compile/_loop_no_collection.py +2 -0
- brainstate/compile/_make_jaxpr.py +7 -3
- brainstate/compile/_progress_bar.py +68 -40
- brainstate/compile/_unvmap.py +6 -3
- brainstate/event/__init__.py +0 -2
- brainstate/event/_csr.py +266 -23
- brainstate/event/_csr_test.py +187 -0
- brainstate/event/_xla_custom_op.py +7 -3
- brainstate/graph/__init__.py +8 -12
- brainstate/graph/_graph_node.py +1 -23
- brainstate/graph/_graph_operation.py +1 -1
- brainstate/graph/_graph_operation_test.py +0 -159
- brainstate/nn/_dyn_impl/_inputs.py +124 -39
- brainstate/nn/_interaction/_conv.py +4 -2
- brainstate/nn/_interaction/_linear.py +84 -10
- brainstate/random/_rand_funs.py +9 -2
- brainstate/random/_rand_seed.py +12 -2
- brainstate/random/_rand_state.py +50 -179
- brainstate/surrogate.py +5 -1
- brainstate/util/__init__.py +0 -4
- brainstate/util/_caller.py +1 -1
- brainstate/util/_dict.py +4 -1
- brainstate/util/_filter.py +1 -1
- brainstate/util/_pretty_repr.py +1 -1
- brainstate/util/_struct.py +1 -1
- {brainstate-0.1.0.post20250105.dist-info → brainstate-0.1.0.post20250120.dist-info}/METADATA +2 -1
- {brainstate-0.1.0.post20250105.dist-info → brainstate-0.1.0.post20250120.dist-info}/RECORD +40 -46
- brainstate/event/_csr_mv_test.py +0 -118
- brainstate/graph/_graph_context.py +0 -443
- brainstate/graph/_graph_context_test.py +0 -65
- brainstate/graph/_graph_convert.py +0 -246
- brainstate/util/_tracers.py +0 -68
- brainstate/util/_visualization.py +0 -47
- /brainstate/event/{_csr_mv_benchmark.py → _csr_benchmark.py} +0 -0
- {brainstate-0.1.0.post20250105.dist-info → brainstate-0.1.0.post20250120.dist-info}/LICENSE +0 -0
- {brainstate-0.1.0.post20250105.dist-info → brainstate-0.1.0.post20250120.dist-info}/WHEEL +0 -0
- {brainstate-0.1.0.post20250105.dist-info → brainstate-0.1.0.post20250120.dist-info}/top_level.txt +0 -0
@@ -16,34 +16,59 @@
 from __future__ import annotations
 
 import copy
-
+import importlib.util
+from typing import Optional, Callable, Any, Tuple, Dict
 
 import jax
 
-try:
-    from tqdm.auto import tqdm
-except (ImportError, ModuleNotFoundError):
-    tqdm = None
+tqdm_installed = importlib.util.find_spec('tqdm') is not None
 
 __all__ = [
     'ProgressBar',
 ]
 
+Index = int
+Carray = Any
+Output = Any
+
 
 class ProgressBar(object):
+    """
+    A progress bar for tracking the progress of a jitted for-loop computation.
+    """
     __module__ = "brainstate.compile"
 
-    def __init__(
+    def __init__(
+        self,
+        freq: Optional[int] = None,
+        count: Optional[int] = None,
+        desc: Optional[Tuple[str, Callable[[Dict], Dict]]] = None,
+        **kwargs
+    ):
+        # print rate
         self.print_freq = freq
         if isinstance(freq, int):
             assert freq > 0, "Print rate should be > 0."
+
+        # print count
         self.print_count = count
         if self.print_freq is not None and self.print_count is not None:
             raise ValueError("Cannot specify both count and freq.")
+
+        # other parameters
         for kwarg in ("total", "mininterval", "maxinterval", "miniters"):
             kwargs.pop(kwarg, None)
         self.kwargs = kwargs
-
+
+        # description
+        if desc is not None:
+            assert isinstance(desc, (tuple, list)), 'Description should be a tuple or list.'
+            assert isinstance(desc[0], str), 'Description should be a string.'
+            assert callable(desc[1]), 'Description should be a callable.'
+        self.desc = desc
+
+        # check if tqdm is installed
+        if not tqdm_installed:
             raise ImportError("tqdm is not installed.")
 
     def init(self, n: int):
@@ -67,15 +92,22 @@ class ProgressBar(object):
             raise ValueError("Print rate should be less than the "
                              f"number of steps {n}, got {freq}")
         remainder = n % freq
-
-        message =
-        return ProgressBarRunner(n,
+
+        message = f"Running for {n:,} iterations" if self.desc is None else self.desc
+        return ProgressBarRunner(n, freq, remainder, message, **kwargs)
 
 
 class ProgressBarRunner(object):
     __module__ = "brainstate.compile"
 
-    def __init__(
+    def __init__(
+        self,
+        n: int,
+        print_freq: int,
+        remainder: int,
+        message: str | Tuple[str, Callable[[Dict], Dict]],
+        **kwargs
+    ):
         self.tqdm_bars = {}
         self.kwargs = kwargs
         self.n = n
@@ -83,50 +115,46 @@ class ProgressBarRunner(object):
         self.remainder = remainder
         self.message = message
 
-    def _define_tqdm(self):
+    def _define_tqdm(self, x: dict):
+        from tqdm.auto import tqdm
         self.tqdm_bars[0] = tqdm(range(self.n), **self.kwargs)
-        self.tqdm_bars[0].set_description(self.message, refresh=False)
+        if isinstance(self.message, str):
+            self.tqdm_bars[0].set_description(self.message, refresh=False)
+        else:
+            self.tqdm_bars[0].set_description(self.message[0].format(**x), refresh=True)
 
-    def _update_tqdm(self):
+    def _update_tqdm(self, x: dict):
         self.tqdm_bars[0].update(self.print_freq)
+        if not isinstance(self.message, str):
+            self.tqdm_bars[0].set_description(self.message[0].format(**x), refresh=True)
 
-    def _close_tqdm(self):
+    def _close_tqdm(self, x: dict):
         if self.remainder > 0:
             self.tqdm_bars[0].update(self.remainder)
+        if not isinstance(self.message, str):
+            self.tqdm_bars[0].set_description(self.message[0].format(**x), refresh=True)
         self.tqdm_bars[0].close()
 
-    def _tqdm(self, is_init, is_print, is_final):
-        if is_init:
-            self._define_tqdm()
-
-        if is_print:
-            self.tqdm_bars[0].update(self.print_freq)
-        if is_final:
-            if self.remainder > 0:
-                self.tqdm_bars[0].update(self.remainder)
-            self.tqdm_bars[0].close()
-
-    def __call__(self, iter_num, *args, **kwargs):
-        # jax.debug.callback(
-        #     self._tqdm,
-        #     iter_num == 0,
-        #     (iter_num + 1) % self.print_freq == 0,
-        #     iter_num == self.n - 1
-        # )
+    def __call__(self, iter_num, **kwargs):
+        data = dict(i=iter_num, **kwargs)
+        data = dict() if isinstance(self.message, str) else self.message[1](data)
+        assert isinstance(data, dict), 'Description function should return a dictionary.'
 
         _ = jax.lax.cond(
             iter_num == 0,
-            lambda: jax.debug.callback(self._define_tqdm, ordered=True),
-            lambda: None,
+            lambda x: jax.debug.callback(self._define_tqdm, x, ordered=True),
+            lambda x: None,
+            data
         )
         _ = jax.lax.cond(
             iter_num % self.print_freq == (self.print_freq - 1),
-            lambda: jax.debug.callback(self._update_tqdm, ordered=True),
-            lambda: None,
+            lambda x: jax.debug.callback(self._update_tqdm, x, ordered=True),
+            lambda x: None,
+            data
        )
        _ = jax.lax.cond(
            iter_num == self.n - 1,
-            lambda: jax.debug.callback(self._close_tqdm, ordered=True),
-            lambda: None,
+            lambda x: jax.debug.callback(self._close_tqdm, x, ordered=True),
+            lambda x: None,
+            data
         )
-
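Note: the new `desc` argument is a `(format_string, transform)` pair. On every refresh the runner builds `dict(i=iter_num, **carry)`, passes it through the transform, and feeds the resulting dict to `str.format`. A minimal usage sketch (the `loss` field is hypothetical, assuming the loop machinery forwards its carry to the runner as keyword arguments):

    import brainstate

    pbar = brainstate.compile.ProgressBar(
        freq=100,
        desc=("step {i}, loss={loss:.3f}",                          # format string
              lambda data: {'i': data['i'], 'loss': data['loss']})  # dict -> dict
    )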
brainstate/compile/_unvmap.py
CHANGED
@@ -16,13 +16,16 @@ from __future__ import annotations
 
 import jax
 import jax.core
-import jax.extend as je
 import jax.interpreters.batching as batching
 import jax.interpreters.mlir as mlir
 import jax.numpy as jnp
-
 from brainstate._utils import set_module_as
 
+if jax.__version_info__ < (0, 4, 38):
+    from jax.core import Primitive
+else:
+    from jax.extend.core import Primitive
+
 __all__ = [
     "unvmap",
 ]
@@ -44,7 +47,7 @@ def unvmap(x, op: str = 'any'):
 
 # unvmap_all
 
-unvmap_all_p = je.core.Primitive("unvmap_all")
+unvmap_all_p = Primitive("unvmap_all")
 
 
 def unvmap_all(x):
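Note: `Primitive` moved from `jax.core` to `jax.extend.core` around jax 0.4.38, which is what the version gate above accounts for. The same shim works for any code defining custom primitives, e.g. (primitive name here is hypothetical):

    import jax

    if jax.__version_info__ < (0, 4, 38):
        from jax.core import Primitive
    else:
        from jax.extend.core import Primitive

    my_p = Primitive('my_op')        # hypothetical primitive
    my_p.def_impl(lambda x: x)
    my_p.def_abstract_eval(lambda x: x)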
brainstate/event/__init__.py
CHANGED
brainstate/event/_csr.py
CHANGED
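Note: throughout this file a sparse matrix is stored in CSR form as three arrays: `data` (nonzero values), `indices` (their column indices), and `indptr` (per-row start offsets into the other two). A concrete mapping, for reference while reading the kernels below:

    import numpy as np

    # dense (3x4)            CSR equivalent
    # [[1. 0. 0. 2.]
    #  [0. 3. 0. 0.]
    #  [0. 0. 4. 0.]]
    data = np.array([1., 2., 3., 4.])
    indices = np.array([0, 3, 1, 2])
    indptr = np.array([0, 2, 3, 4])   # row i spans data[indptr[i]:indptr[i+1]]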
@@ -73,7 +73,7 @@ class CSR(u.sparse.SparseMatrix):
         return u.sparse.csr_todense(self)
 
     def transpose(self, axes=None):
-        assert axes is None
+        assert axes is None, "transpose does not support axes argument."
         return CSC((self.data, self.indices, self.indptr), shape=self.shape[::-1])
 
     def __abs__(self):
@@ -103,6 +103,7 @@ class CSR(u.sparse.SparseMatrix):
                 (op(self.data, other), self.indices, self.indptr),
                 shape=self.shape
             )
+
         elif other.ndim == 2 and other.shape == self.shape:
             rows, cols = csr_to_coo(self.indices, self.indptr)
             other = other[rows, cols]
@@ -112,6 +113,7 @@ class CSR(u.sparse.SparseMatrix):
                  self.indptr),
                 shape=self.shape
             )
+
         else:
             raise NotImplementedError(f"mul with object of shape {other.shape}")
 
@@ -184,10 +186,12 @@ class CSR(u.sparse.SparseMatrix):
         return self._binary_rop(other, operator.mod)
 
     def __matmul__(self, other):
+        # csr @ other
         if isinstance(other, JAXSparse):
             raise NotImplementedError("matmul between two sparse objects.")
         other = u.math.asarray(other)
-        data, other = u.math.promote_dtypes(self.data, other)
+        data = self.data
+        # data, other = u.math.promote_dtypes(self.data, other)
         if other.ndim == 1:
             return _csr_matvec(
                 data,
@@ -208,10 +212,12 @@ class CSR(u.sparse.SparseMatrix):
             raise NotImplementedError(f"matmul with object of shape {other.shape}")
 
     def __rmatmul__(self, other):
+        # other @ csr
         if isinstance(other, JAXSparse):
             raise NotImplementedError("matmul between two sparse objects.")
         other = u.math.asarray(other)
-        data, other = u.math.promote_dtypes(self.data, other)
+        data = self.data
+        # data, other = u.math.promote_dtypes(self.data, other)
         if other.ndim == 1:
             return _csr_matvec(
                 data,
@@ -566,7 +572,7 @@ def event_csrmv_cpu_kernel_generator(
     if weight_info.size == 1:
         if transpose:
             if spike_info.dtype == jnp.bool_:
-                @numba.njit
+                @numba.njit(fastmath=True)
                 def mv(weights, indices, indptr, v, posts):
                     posts[:] = 0.
                     w = weights[()]
@@ -576,7 +582,7 @@ def event_csrmv_cpu_kernel_generator(
                                 posts[indices[j]] += w
 
             elif float_as_event:
-                @numba.njit
+                @numba.njit(fastmath=True)
                 def mv(weights, indices, indptr, v, posts):
                     posts[:] = 0.
                     w = weights[()]
@@ -586,7 +592,7 @@ def event_csrmv_cpu_kernel_generator(
                                 posts[indices[j]] += w
 
             else:
-                @numba.njit
+                @numba.njit(fastmath=True)
                 def mv(weights, indices, indptr, v, posts):
                     posts[:] = 0.
                     w = weights[()]
@@ -599,7 +605,7 @@ def event_csrmv_cpu_kernel_generator(
 
         else:
             if spike_info.dtype == jnp.bool_:
-                @numba.njit
+                @numba.njit(fastmath=True)
                 def mv(weights, indices, indptr, v, posts):
                     w = weights[()]
                     for i in range(indptr.shape[0] - 1):
@@ -610,7 +616,7 @@ def event_csrmv_cpu_kernel_generator(
                     posts[i] = r
 
             elif float_as_event:
-                @numba.njit
+                @numba.njit(fastmath=True)
                 def mv(weights, indices, indptr, v, posts):
                     w = weights[()]
                     for i in range(indptr.shape[0] - 1):
@@ -621,7 +627,7 @@ def event_csrmv_cpu_kernel_generator(
                     posts[i] = r
 
             else:
-                @numba.njit
+                @numba.njit(fastmath=True)
                 def mv(weights, indices, indptr, v, posts):
                     w = weights[()]
                     for i in range(indptr.shape[0] - 1):
@@ -635,7 +641,7 @@ def event_csrmv_cpu_kernel_generator(
     else:
         if transpose:
             if spike_info.dtype == jnp.bool_:
-                @numba.njit
+                @numba.njit(fastmath=True)
                 def mv(weights, indices, indptr, v, posts):
                     posts[:] = 0.
                     for i in range(v.shape[0]):
@@ -644,7 +650,7 @@ def event_csrmv_cpu_kernel_generator(
                             posts[indices[j]] += weights[j]
 
             elif float_as_event:
-                @numba.njit
+                @numba.njit(fastmath=True)
                 def mv(weights, indices, indptr, v, posts):
                     posts[:] = 0.
                     for i in range(v.shape[0]):
@@ -653,7 +659,7 @@ def event_csrmv_cpu_kernel_generator(
                             posts[indices[j]] += weights[j]
 
             else:
-                @numba.njit
+                @numba.njit(fastmath=True)
                 def mv(weights, indices, indptr, v, posts):
                     posts[:] = 0.
                     for i in range(v.shape[0]):
@@ -664,7 +670,7 @@ def event_csrmv_cpu_kernel_generator(
 
         else:
             if spike_info.dtype == jnp.bool_:
-                @numba.njit
+                @numba.njit(fastmath=True)
                 def mv(weights, indices, indptr, v, posts):
                     for i in range(indptr.shape[0] - 1):
                         r = 0.
@@ -674,7 +680,7 @@ def event_csrmv_cpu_kernel_generator(
                     posts[i] = r
 
             elif float_as_event:
-                @numba.njit
+                @numba.njit(fastmath=True)
                 def mv(weights, indices, indptr, v, posts):
                     for i in range(indptr.shape[0] - 1):
                         r = 0.
@@ -684,7 +690,7 @@ def event_csrmv_cpu_kernel_generator(
                     posts[i] = r
 
             else:
-                @numba.njit
+                @numba.njit(fastmath=True)
                 def mv(weights, indices, indptr, v, posts):
                     for i in range(indptr.shape[0] - 1):
                         r = 0.
@@ -795,7 +801,31 @@ def event_csrmv_transpose_rule(
 
 def event_csrmv_batching(args, axes, **kwargs):
     if tuple(axes) == (None, None, None, 0):
-
+        assert args[3].ndim == 2, 'Batching axis 0 requires 2D input.'
+        r = event_csrmm_p_call(
+            args[0],
+            args[1],
+            args[2],
+            args[3].T,
+            shape=kwargs['shape'],
+            transpose=kwargs['transpose'],
+            float_as_event=kwargs['float_as_event']
+        )
+        return r, [1]
+
+    elif tuple(axes) == (None, None, None, 1):
+        assert args[3].ndim == 2, 'Batching axis 0 requires 2D input.'
+        r = event_csrmm_p_call(
+            args[0],
+            args[1],
+            args[2],
+            args[3],
+            shape=kwargs['shape'],
+            transpose=kwargs['transpose'],
+            float_as_event=kwargs['float_as_event']
+        )
+        return r, [1]
+
     else:
         raise NotImplementedError(f"Batching axes {axes} not implemented for event-driven CSR matrix-vector product.")
 
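Note: the rewritten batching rule maps a `jax.vmap` over the dense operand onto a single `event_csrmm` call instead of a loop of matvecs. A sketch of what this enables (shapes illustrative; assumes `CSR` is exported as `brainstate.event.CSR` with the `(data, indices, indptr), shape=...` constructor used elsewhere in this file):

    import jax
    import jax.numpy as jnp
    import brainstate

    data = jnp.array([1.0, 2.0, 3.0])        # 2x3 event-driven CSR matrix
    indices = jnp.array([0, 2, 1])
    indptr = jnp.array([0, 2, 3])
    csr = brainstate.event.CSR((data, indices, indptr), shape=(2, 3))

    spikes = jnp.array([[True, False, True],
                        [False, True, False]])   # batch of event vectors
    out = jax.vmap(lambda v: csr @ v)(spikes)    # lowers to one event_csrmm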
@@ -852,17 +882,228 @@ def event_csrmv_p_call(
 
 def event_csrmm_batching(args, axes, **kwargs):
     if tuple(axes) == (None, None, None, 0):
-
-
-
-
+        assert args[3].ndim == 3, 'Batching axis 0 requires 3D input.'
+        batch_size, m, n = args[3].shape
+        B = jnp.transpose(args[3], (1, 0, 2)).reshape(m, batch_size * n)
+        r = event_csrmm_p_call(
+            args[0],
+            args[1],
+            args[2],
+            B,
+            shape=kwargs['shape'],
+            transpose=kwargs['transpose'],
+            float_as_event=kwargs['float_as_event']
+        )
+        r = jnp.reshape(r[0], [r[0].shape[0], batch_size, n])
+        return [r], [1]
+
+    elif tuple(axes) == (None, None, None, 1):
+        assert args[3].ndim == 3, 'Batching axis 0 requires 3D input.'
+        m, batch_size, n = args[3].shape
+        B = args[3].reshape(m, batch_size * n)
+        r = event_csrmm_p_call(
+            args[0],
+            args[1],
+            args[2],
+            B,
+            shape=kwargs['shape'],
+            transpose=kwargs['transpose'],
+            float_as_event=kwargs['float_as_event']
+        )
+        r = jnp.reshape(r[0], [r[0].shape[0], batch_size, n])
+        return [r], [1]
+
+    elif tuple(axes) == (None, None, None, 2):
+        assert args[3].ndim == 3, 'Batching axis 0 requires 3D input.'
+        m, n, batch_size = args[3].shape
+        B = args[3].reshape(m, batch_size * n)
+        r = event_csrmm_p_call(
+            args[0],
+            args[1],
+            args[2],
+            B,
+            shape=kwargs['shape'],
+            transpose=kwargs['transpose'],
+            float_as_event=kwargs['float_as_event']
+        )
+        r = jnp.reshape(r[0], [r[0].shape[0], n, batch_size])
+        return [r], [2]
+
     else:
         raise NotImplementedError(f"Batching axes {axes} not implemented for event-driven CSR matrix-vector product.")
 
 
+def event_csrmm_cpu_kernel_generator(
+    float_as_event: bool,
+    weight_info: jax.ShapeDtypeStruct,
+    spike_info: jax.ShapeDtypeStruct,
+    transpose: bool,
+    **kwargs
+) -> Kernel:
+    import numba  # pylint: disable=import-outside-toplevel
+
+    if weight_info.size == 1:
+        if transpose:
+            # csr.T @ B
+
+            if spike_info.dtype == jnp.bool_:
+                @numba.njit(fastmath=True, parallel=False)
+                def mv(weights, indices, indptr, B, posts):
+                    posts[:] = 0.
+                    w = weights[()]
+                    for k in numba.prange(B.shape[1]):
+                        for i in range(B.shape[0]):
+                            if B[i, k]:
+                                for j in range(indptr[i], indptr[i + 1]):
+                                    posts[indices[j], k] += w
+
+            elif float_as_event:
+                @numba.njit(fastmath=True, parallel=False)
+                def mv(weights, indices, indptr, B, posts):
+                    posts[:] = 0.
+                    B = B != 0.
+                    w = weights[()]
+                    for k in numba.prange(B.shape[1]):
+                        for i in range(B.shape[0]):
+                            if B[i, k]:
+                                for j in range(indptr[i], indptr[i + 1]):
+                                    posts[indices[j], k] += w
+
+            else:
+                @numba.njit(fastmath=True, parallel=False)
+                def mv(weights, indices, indptr, B, posts):
+                    posts[:] = 0.
+                    w = weights[()]
+                    for k in numba.prange(B.shape[1]):
+                        for i in range(B.shape[0]):
+                            sp = B[i, k]
+                            if sp != 0.:
+                                wsp = w * sp
+                                for j in range(indptr[i], indptr[i + 1]):
+                                    posts[indices[j], k] += wsp
+
+        else:
+            # csr @ B
+            if spike_info.dtype == jnp.bool_:
+                @numba.njit(fastmath=True)
+                def mv(weights, indices, indptr, B, posts):
+                    w = weights[()]
+                    for i in range(indptr.shape[0] - 1):
+                        r = np.zeros(B.shape[1], dtype=weights.dtype)
+                        for j in range(indptr[i], indptr[i + 1]):
+                            index = indices[j]
+                            for k in range(B.shape[1]):
+                                if B[index, k]:
+                                    r[k] += w
+                        posts[i] = r
+
+            elif float_as_event:
+                @numba.njit(fastmath=True)
+                def mv(weights, indices, indptr, B, posts):
+                    w = weights[()]
+                    B = B != 0.
+                    for i in range(indptr.shape[0] - 1):
+                        r = np.zeros(B.shape[1], dtype=weights.dtype)
+                        for j in range(indptr[i], indptr[i + 1]):
+                            index = indices[j]
+                            for k in range(B.shape[1]):
+                                if B[index, k]:
+                                    r[k] += w
+                        posts[i] = r
+
+            else:
+                @numba.njit(fastmath=True)
+                def mv(weights, indices, indptr, B, posts):
+                    w = weights[()]
+                    for i in range(indptr.shape[0] - 1):
+                        for k in range(B.shape[1]):
+                            r = 0.
+                            for j in range(indptr[i], indptr[i + 1]):
+                                c = B[indices[j], k]
+                                if c != 0.:
+                                    r += w * c
+                            posts[i, k] = r
+
+    else:
+        if transpose:
+            # csr.T @ B
+
+            if spike_info.dtype == jnp.bool_:
+                @numba.njit(fastmath=True, parallel=False)
+                def mv(weights, indices, indptr, B, posts):
+                    posts[:] = 0.
+                    for k in numba.prange(B.shape[1]):
+                        for i in range(B.shape[0]):
+                            if B[i, k]:
+                                for j in range(indptr[i], indptr[i + 1]):
+                                    posts[indices[j], k] += weights[j]
+
+            elif float_as_event:
+                @numba.njit(fastmath=True, parallel=False)
+                def mv(weights, indices, indptr, B, posts):
+                    posts[:] = 0.
+                    B = B != 0.
+                    for k in numba.prange(B.shape[1]):
+                        for i in range(B.shape[0]):
+                            if B[i, k]:
+                                for j in range(indptr[i], indptr[i + 1]):
+                                    posts[indices[j], k] += weights[j]
+
+            else:
+                @numba.njit(fastmath=True, parallel=False)
+                def mv(weights, indices, indptr, B, posts):
+                    posts[:] = 0.
+                    for k in numba.prange(B.shape[1]):
+                        for i in range(B.shape[0]):
+                            sp = B[i, k]
+                            if sp != 0.:
+                                for j in range(indptr[i], indptr[i + 1]):
+                                    posts[indices[j], k] += weights[j] * sp
+
+        else:
+            # csr @ B
+
+            if spike_info.dtype == jnp.bool_:
+                @numba.njit(fastmath=True)
+                def mv(weights, indices, indptr, B, posts):
+                    for i in range(indptr.shape[0] - 1):
+                        for k in range(B.shape[1]):
+                            r = 0.
+                            for j in range(indptr[i], indptr[i + 1]):
+                                if B[indices[j], k]:
+                                    r += weights[j]
+                            posts[i, k] = r
+
+            elif float_as_event:
+                @numba.njit(fastmath=True)
+                def mv(weights, indices, indptr, B, posts):
+                    B = B != 0.
+                    for i in range(indptr.shape[0] - 1):
+                        for k in range(B.shape[1]):
+                            r = 0.
+                            for j in range(indptr[i], indptr[i + 1]):
+                                if B[indices[j], k]:
+                                    r += weights[j]
+                            posts[i, k] = r
+
+            else:
+                @numba.njit(fastmath=True)
+                def mv(weights, indices, indptr, B, posts):
+                    for i in range(indptr.shape[0] - 1):
+                        for k in range(B.shape[1]):
+                            r = 0.
+                            for j in range(indptr[i], indptr[i + 1]):
+                                c = B[indices[j], k]
+                                if c != 0.:
+                                    r += weights[j] * c
+                            posts[i, k] = r
+
+    return mv
+
+
 event_csrmm_p = XLACustomOp(
     'event_csrmm',
-    cpu_kernel_or_generator=
+    cpu_kernel_or_generator=event_csrmm_cpu_kernel_generator,
 )
 event_csrmm_p.def_batching_rule(event_csrmm_batching)
 
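Note: every generated kernel scatters into a preallocated `posts` buffer; `fastmath=True` relaxes IEEE semantics for the accumulations, and in the transposed kernels `numba.prange` is a drop-in for `range` while `parallel=False`. A standalone check of the per-edge-weight transposed variant against a dense reference (plain NumPy/Numba, outside brainstate's `XLACustomOp` machinery; `csr_t_matmat` is a local name):

    import numba
    import numpy as np

    @numba.njit(fastmath=True)
    def csr_t_matmat(weights, indices, indptr, B, posts):
        # posts = csr.T @ B for a matrix stored as (weights, indices, indptr)
        posts[:] = 0.
        for k in range(B.shape[1]):              # numba.prange in the diff
            for i in range(B.shape[0]):
                sp = B[i, k]
                if sp != 0.:
                    for j in range(indptr[i], indptr[i + 1]):
                        posts[indices[j], k] += weights[j] * sp

    indptr = np.array([0, 2, 3, 4])              # 3x4 CSR matrix
    indices = np.array([0, 3, 1, 2])
    weights = np.array([1., 2., 3., 4.])
    dense = np.zeros((3, 4))                     # dense reference
    for row in range(3):
        for j in range(indptr[row], indptr[row + 1]):
            dense[row, indices[j]] = weights[j]

    B = np.random.rand(3, 5)
    posts = np.zeros((4, 5))
    csr_t_matmat(weights, indices, indptr, B, posts)
    assert np.allclose(posts, dense.T @ B)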
@@ -884,11 +1125,13 @@ def event_csrmm_p_call(
         indptr,
         B,
         outs=[
-            jax.ShapeDtypeStruct([shape[
+            jax.ShapeDtypeStruct([shape[1], B.shape[1]], weights.dtype)
             if transpose else
-            jax.ShapeDtypeStruct([shape[
+            jax.ShapeDtypeStruct([shape[0], B.shape[1]], weights.dtype),
         ],
         # block_size=block_size,
+        shape=shape,
+        transpose=transpose,
         float_as_event=float_as_event,
         weight_info=jax.ShapeDtypeStruct(weights.shape, weights.dtype),
         spike_info=jax.ShapeDtypeStruct(B.shape, B.dtype),