brainstate 0.1.0.post20250104__py2.py3-none-any.whl → 0.1.0.post20250120__py2.py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- brainstate/_state.py +77 -44
- brainstate/_state_test.py +0 -17
- brainstate/augment/_eval_shape.py +9 -10
- brainstate/augment/_eval_shape_test.py +1 -1
- brainstate/augment/_mapping.py +265 -277
- brainstate/augment/_mapping_test.py +147 -175
- brainstate/compile/_ad_checkpoint.py +6 -4
- brainstate/compile/_error_if_test.py +1 -0
- brainstate/compile/_jit.py +37 -28
- brainstate/compile/_loop_collect_return.py +8 -5
- brainstate/compile/_loop_no_collection.py +2 -0
- brainstate/compile/_make_jaxpr.py +7 -3
- brainstate/compile/_make_jaxpr_test.py +2 -1
- brainstate/compile/_progress_bar.py +68 -40
- brainstate/compile/_unvmap.py +6 -2
- brainstate/environ.py +28 -18
- brainstate/environ_test.py +4 -0
- brainstate/event/__init__.py +0 -2
- brainstate/event/_csr.py +266 -23
- brainstate/event/_csr_test.py +187 -0
- brainstate/event/_fixedprob_mv.py +4 -2
- brainstate/event/_fixedprob_mv_test.py +2 -1
- brainstate/event/_xla_custom_op.py +16 -5
- brainstate/graph/__init__.py +8 -12
- brainstate/graph/_graph_node.py +1 -23
- brainstate/graph/_graph_operation.py +1 -1
- brainstate/graph/_graph_operation_test.py +0 -159
- brainstate/nn/_dyn_impl/_inputs.py +124 -39
- brainstate/nn/_interaction/_conv.py +4 -2
- brainstate/nn/_interaction/_linear.py +84 -10
- brainstate/random/_rand_funs.py +9 -2
- brainstate/random/_rand_seed.py +12 -2
- brainstate/random/_rand_state.py +50 -179
- brainstate/surrogate.py +5 -1
- brainstate/util/__init__.py +0 -4
- brainstate/util/_caller.py +1 -1
- brainstate/util/_dict.py +4 -1
- brainstate/util/_filter.py +1 -1
- brainstate/util/_pretty_repr.py +1 -1
- brainstate/util/_struct.py +1 -1
- {brainstate-0.1.0.post20250104.dist-info → brainstate-0.1.0.post20250120.dist-info}/METADATA +2 -1
- {brainstate-0.1.0.post20250104.dist-info → brainstate-0.1.0.post20250120.dist-info}/RECORD +46 -52
- brainstate/event/_csr_mv_test.py +0 -118
- brainstate/graph/_graph_context.py +0 -443
- brainstate/graph/_graph_context_test.py +0 -65
- brainstate/graph/_graph_convert.py +0 -246
- brainstate/util/_tracers.py +0 -68
- brainstate/util/_visualization.py +0 -47
- /brainstate/event/{_csr_mv_benchmark.py → _csr_benchmark.py} +0 -0
- {brainstate-0.1.0.post20250104.dist-info → brainstate-0.1.0.post20250120.dist-info}/LICENSE +0 -0
- {brainstate-0.1.0.post20250104.dist-info → brainstate-0.1.0.post20250120.dist-info}/WHEEL +0 -0
- {brainstate-0.1.0.post20250104.dist-info → brainstate-0.1.0.post20250120.dist-info}/top_level.txt +0 -0
brainstate/event/_csr.py
CHANGED
```diff
@@ -73,7 +73,7 @@ class CSR(u.sparse.SparseMatrix):
         return u.sparse.csr_todense(self)
 
     def transpose(self, axes=None):
-        assert axes is None
+        assert axes is None, "transpose does not support axes argument."
        return CSC((self.data, self.indices, self.indptr), shape=self.shape[::-1])
 
     def __abs__(self):
@@ -103,6 +103,7 @@ class CSR(u.sparse.SparseMatrix):
                 (op(self.data, other), self.indices, self.indptr),
                 shape=self.shape
             )
+
         elif other.ndim == 2 and other.shape == self.shape:
             rows, cols = csr_to_coo(self.indices, self.indptr)
             other = other[rows, cols]
@@ -112,6 +113,7 @@ class CSR(u.sparse.SparseMatrix):
                  self.indptr),
                 shape=self.shape
             )
+
         else:
             raise NotImplementedError(f"mul with object of shape {other.shape}")
 
```
```diff
@@ -184,10 +186,12 @@ class CSR(u.sparse.SparseMatrix):
         return self._binary_rop(other, operator.mod)
 
     def __matmul__(self, other):
+        # csr @ other
         if isinstance(other, JAXSparse):
             raise NotImplementedError("matmul between two sparse objects.")
         other = u.math.asarray(other)
-        data, other = u.math.promote_dtypes(self.data, other)
+        data = self.data
+        # data, other = u.math.promote_dtypes(self.data, other)
         if other.ndim == 1:
             return _csr_matvec(
                 data,
@@ -208,10 +212,12 @@ class CSR(u.sparse.SparseMatrix):
             raise NotImplementedError(f"matmul with object of shape {other.shape}")
 
     def __rmatmul__(self, other):
+        # other @ csr
         if isinstance(other, JAXSparse):
             raise NotImplementedError("matmul between two sparse objects.")
         other = u.math.asarray(other)
-        data, other = u.math.promote_dtypes(self.data, other)
+        data = self.data
+        # data, other = u.math.promote_dtypes(self.data, other)
         if other.ndim == 1:
             return _csr_matvec(
                 data,
```
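Both operators now bind `data = self.data` directly instead of promoting dtypes against the dense operand (the old promotion call survives as a comment). A minimal usage sketch of the two code paths, mirroring the constructor and operators exercised by the new tests further down; the shapes and connection probability here are illustrative:

```python
import numpy as np
import brainstate as bst

m, n = 20, 40
n_conn = int(n * 0.1)
indptr = np.arange(m + 1) * n_conn                # CSR row pointers
indices = np.random.randint(0, n, (m * n_conn,))  # CSR column indices

csr = bst.event.CSR([1.5, indices, indptr], shape=(m, n))

spikes_pre = bst.random.rand(m) < 0.1   # boolean event vector
out_post = spikes_pre @ csr             # __rmatmul__: vector @ CSR -> shape (n,)

spikes_post = bst.random.rand(n) < 0.1
out_pre = csr @ spikes_post             # __matmul__: CSR @ vector -> shape (m,)
```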
```diff
@@ -566,7 +572,7 @@ def event_csrmv_cpu_kernel_generator(
     if weight_info.size == 1:
         if transpose:
             if spike_info.dtype == jnp.bool_:
-                @numba.njit
+                @numba.njit(fastmath=True)
                 def mv(weights, indices, indptr, v, posts):
                     posts[:] = 0.
                     w = weights[()]
@@ -576,7 +582,7 @@
                                 posts[indices[j]] += w
 
             elif float_as_event:
-                @numba.njit
+                @numba.njit(fastmath=True)
                 def mv(weights, indices, indptr, v, posts):
                     posts[:] = 0.
                     w = weights[()]
@@ -586,7 +592,7 @@
                                 posts[indices[j]] += w
 
             else:
-                @numba.njit
+                @numba.njit(fastmath=True)
                 def mv(weights, indices, indptr, v, posts):
                     posts[:] = 0.
                     w = weights[()]
@@ -599,7 +605,7 @@
 
         else:
             if spike_info.dtype == jnp.bool_:
-                @numba.njit
+                @numba.njit(fastmath=True)
                 def mv(weights, indices, indptr, v, posts):
                     w = weights[()]
                     for i in range(indptr.shape[0] - 1):
@@ -610,7 +616,7 @@
                     posts[i] = r
 
             elif float_as_event:
-                @numba.njit
+                @numba.njit(fastmath=True)
                 def mv(weights, indices, indptr, v, posts):
                     w = weights[()]
                     for i in range(indptr.shape[0] - 1):
@@ -621,7 +627,7 @@
                     posts[i] = r
 
             else:
-                @numba.njit
+                @numba.njit(fastmath=True)
                 def mv(weights, indices, indptr, v, posts):
                     w = weights[()]
                     for i in range(indptr.shape[0] - 1):
@@ -635,7 +641,7 @@
     else:
         if transpose:
             if spike_info.dtype == jnp.bool_:
-                @numba.njit
+                @numba.njit(fastmath=True)
                 def mv(weights, indices, indptr, v, posts):
                     posts[:] = 0.
                     for i in range(v.shape[0]):
@@ -644,7 +650,7 @@
                                 posts[indices[j]] += weights[j]
 
             elif float_as_event:
-                @numba.njit
+                @numba.njit(fastmath=True)
                 def mv(weights, indices, indptr, v, posts):
                     posts[:] = 0.
                     for i in range(v.shape[0]):
@@ -653,7 +659,7 @@
                                 posts[indices[j]] += weights[j]
 
             else:
-                @numba.njit
+                @numba.njit(fastmath=True)
                 def mv(weights, indices, indptr, v, posts):
                     posts[:] = 0.
                     for i in range(v.shape[0]):
@@ -664,7 +670,7 @@
 
         else:
             if spike_info.dtype == jnp.bool_:
-                @numba.njit
+                @numba.njit(fastmath=True)
                 def mv(weights, indices, indptr, v, posts):
                     for i in range(indptr.shape[0] - 1):
                         r = 0.
@@ -674,7 +680,7 @@
                     posts[i] = r
 
             elif float_as_event:
-                @numba.njit
+                @numba.njit(fastmath=True)
                 def mv(weights, indices, indptr, v, posts):
                     for i in range(indptr.shape[0] - 1):
                         r = 0.
@@ -684,7 +690,7 @@
                     posts[i] = r
 
             else:
-                @numba.njit
+                @numba.njit(fastmath=True)
                 def mv(weights, indices, indptr, v, posts):
                     for i in range(indptr.shape[0] - 1):
                         r = 0.
```
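Every CPU kernel in this generator now compiles with `fastmath=True`, which lets LLVM reassociate and vectorize the floating-point accumulations at the cost of strict IEEE-754 ordering; since these event-driven kernels mostly add identical weights, the relaxed semantics affect results at most at rounding level. A standalone sketch of the scalar-weight, transposed, boolean-spike variant shown above; the function name and test data are illustrative, not from the package:

```python
import numba
import numpy as np

@numba.njit(fastmath=True)
def event_csrmv_transposed(w, indices, indptr, spikes, posts):
    # Event-driven csr.T @ spikes with one shared weight w:
    # only rows whose presynaptic neuron spiked are visited.
    posts[:] = 0.
    for i in range(spikes.shape[0]):
        if spikes[i]:
            for j in range(indptr[i], indptr[i + 1]):
                posts[indices[j]] += w

indptr = np.array([0, 2, 4], dtype=np.int64)
indices = np.array([0, 2, 1, 2], dtype=np.int64)
spikes = np.array([True, False])
posts = np.zeros(3)
event_csrmv_transposed(1.5, indices, indptr, spikes, posts)
print(posts)  # [1.5 0.  1.5]
```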
```diff
@@ -795,7 +801,31 @@ def event_csrmv_transpose_rule(
 
 def event_csrmv_batching(args, axes, **kwargs):
     if tuple(axes) == (None, None, None, 0):
-
+        assert args[3].ndim == 2, 'Batching axis 0 requires 2D input.'
+        r = event_csrmm_p_call(
+            args[0],
+            args[1],
+            args[2],
+            args[3].T,
+            shape=kwargs['shape'],
+            transpose=kwargs['transpose'],
+            float_as_event=kwargs['float_as_event']
+        )
+        return r, [1]
+
+    elif tuple(axes) == (None, None, None, 1):
+        assert args[3].ndim == 2, 'Batching axis 1 requires 2D input.'
+        r = event_csrmm_p_call(
+            args[0],
+            args[1],
+            args[2],
+            args[3],
+            shape=kwargs['shape'],
+            transpose=kwargs['transpose'],
+            float_as_event=kwargs['float_as_event']
+        )
+        return r, [1]
+
     else:
         raise NotImplementedError(f"Batching axes {axes} not implemented for event-driven CSR matrix-vector product.")
 
```
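The new rule lowers a vmapped matrix-vector product onto the matrix-matrix primitive (`event_csrmm_p_call`) instead of raising: batching over axis 0 transposes the batch of vectors into columns, batching over axis 1 passes them through unchanged, and the result is reported on output axis 1. In user code this is what makes `jax.vmap` over the spike vector cheap; a sketch mirroring `test_vector_csr_vmap_vector` from the test file below:

```python
import jax
import numpy as np
import brainstate as bst

n_batch, m, n = 10, 20, 40
n_conn = int(n * 0.1)
indptr = np.arange(m + 1) * n_conn
indices = np.random.randint(0, n, (m * n_conn,))
csr = bst.event.CSR([1.5, indices, indptr], shape=(m, n))

xs = bst.random.rand(n_batch, m) < 0.1
# The batching rule turns these n_batch vector products into a single
# event_csrmm call on xs.T; vmap then just relabels the batch axis.
ys = jax.vmap(lambda x: x @ csr)(xs)   # shape (n_batch, n)
```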
```diff
@@ -852,17 +882,228 @@ def event_csrmv_p_call(
 
 def event_csrmm_batching(args, axes, **kwargs):
     if tuple(axes) == (None, None, None, 0):
-
-
-
-
+        assert args[3].ndim == 3, 'Batching axis 0 requires 3D input.'
+        batch_size, m, n = args[3].shape
+        B = jnp.transpose(args[3], (1, 0, 2)).reshape(m, batch_size * n)
+        r = event_csrmm_p_call(
+            args[0],
+            args[1],
+            args[2],
+            B,
+            shape=kwargs['shape'],
+            transpose=kwargs['transpose'],
+            float_as_event=kwargs['float_as_event']
+        )
+        r = jnp.reshape(r[0], [r[0].shape[0], batch_size, n])
+        return [r], [1]
+
+    elif tuple(axes) == (None, None, None, 1):
+        assert args[3].ndim == 3, 'Batching axis 1 requires 3D input.'
+        m, batch_size, n = args[3].shape
+        B = args[3].reshape(m, batch_size * n)
+        r = event_csrmm_p_call(
+            args[0],
+            args[1],
+            args[2],
+            B,
+            shape=kwargs['shape'],
+            transpose=kwargs['transpose'],
+            float_as_event=kwargs['float_as_event']
+        )
+        r = jnp.reshape(r[0], [r[0].shape[0], batch_size, n])
+        return [r], [1]
+
+    elif tuple(axes) == (None, None, None, 2):
+        assert args[3].ndim == 3, 'Batching axis 2 requires 3D input.'
+        m, n, batch_size = args[3].shape
+        B = args[3].reshape(m, batch_size * n)
+        r = event_csrmm_p_call(
+            args[0],
+            args[1],
+            args[2],
+            B,
+            shape=kwargs['shape'],
+            transpose=kwargs['transpose'],
+            float_as_event=kwargs['float_as_event']
+        )
+        r = jnp.reshape(r[0], [r[0].shape[0], n, batch_size])
+        return [r], [2]
+
     else:
         raise NotImplementedError(f"Batching axes {axes} not implemented for event-driven CSR matrix-vector product.")
 
 
+def event_csrmm_cpu_kernel_generator(
+    float_as_event: bool,
+    weight_info: jax.ShapeDtypeStruct,
+    spike_info: jax.ShapeDtypeStruct,
+    transpose: bool,
+    **kwargs
+) -> Kernel:
+    import numba  # pylint: disable=import-outside-toplevel
+
+    if weight_info.size == 1:
+        if transpose:
+            # csr.T @ B
+
+            if spike_info.dtype == jnp.bool_:
+                @numba.njit(fastmath=True, parallel=False)
+                def mv(weights, indices, indptr, B, posts):
+                    posts[:] = 0.
+                    w = weights[()]
+                    for k in numba.prange(B.shape[1]):
+                        for i in range(B.shape[0]):
+                            if B[i, k]:
+                                for j in range(indptr[i], indptr[i + 1]):
+                                    posts[indices[j], k] += w
+
+            elif float_as_event:
+                @numba.njit(fastmath=True, parallel=False)
+                def mv(weights, indices, indptr, B, posts):
+                    posts[:] = 0.
+                    B = B != 0.
+                    w = weights[()]
+                    for k in numba.prange(B.shape[1]):
+                        for i in range(B.shape[0]):
+                            if B[i, k]:
+                                for j in range(indptr[i], indptr[i + 1]):
+                                    posts[indices[j], k] += w
+
+            else:
+                @numba.njit(fastmath=True, parallel=False)
+                def mv(weights, indices, indptr, B, posts):
+                    posts[:] = 0.
+                    w = weights[()]
+                    for k in numba.prange(B.shape[1]):
+                        for i in range(B.shape[0]):
+                            sp = B[i, k]
+                            if sp != 0.:
+                                wsp = w * sp
+                                for j in range(indptr[i], indptr[i + 1]):
+                                    posts[indices[j], k] += wsp
+
+        else:
+            # csr @ B
+            if spike_info.dtype == jnp.bool_:
+                @numba.njit(fastmath=True)
+                def mv(weights, indices, indptr, B, posts):
+                    w = weights[()]
+                    for i in range(indptr.shape[0] - 1):
+                        r = np.zeros(B.shape[1], dtype=weights.dtype)
+                        for j in range(indptr[i], indptr[i + 1]):
+                            index = indices[j]
+                            for k in range(B.shape[1]):
+                                if B[index, k]:
+                                    r[k] += w
+                        posts[i] = r
+
+            elif float_as_event:
+                @numba.njit(fastmath=True)
+                def mv(weights, indices, indptr, B, posts):
+                    w = weights[()]
+                    B = B != 0.
+                    for i in range(indptr.shape[0] - 1):
+                        r = np.zeros(B.shape[1], dtype=weights.dtype)
+                        for j in range(indptr[i], indptr[i + 1]):
+                            index = indices[j]
+                            for k in range(B.shape[1]):
+                                if B[index, k]:
+                                    r[k] += w
+                        posts[i] = r
+
+            else:
+                @numba.njit(fastmath=True)
+                def mv(weights, indices, indptr, B, posts):
+                    w = weights[()]
+                    for i in range(indptr.shape[0] - 1):
+                        for k in range(B.shape[1]):
+                            r = 0.
+                            for j in range(indptr[i], indptr[i + 1]):
+                                c = B[indices[j], k]
+                                if c != 0.:
+                                    r += w * c
+                            posts[i, k] = r
+
+    else:
+        if transpose:
+            # csr.T @ B
+
+            if spike_info.dtype == jnp.bool_:
+                @numba.njit(fastmath=True, parallel=False)
+                def mv(weights, indices, indptr, B, posts):
+                    posts[:] = 0.
+                    for k in numba.prange(B.shape[1]):
+                        for i in range(B.shape[0]):
+                            if B[i, k]:
+                                for j in range(indptr[i], indptr[i + 1]):
+                                    posts[indices[j], k] += weights[j]
+
+            elif float_as_event:
+                @numba.njit(fastmath=True, parallel=False)
+                def mv(weights, indices, indptr, B, posts):
+                    posts[:] = 0.
+                    B = B != 0.
+                    for k in numba.prange(B.shape[1]):
+                        for i in range(B.shape[0]):
+                            if B[i, k]:
+                                for j in range(indptr[i], indptr[i + 1]):
+                                    posts[indices[j], k] += weights[j]
+
+            else:
+                @numba.njit(fastmath=True, parallel=False)
+                def mv(weights, indices, indptr, B, posts):
+                    posts[:] = 0.
+                    for k in numba.prange(B.shape[1]):
+                        for i in range(B.shape[0]):
+                            sp = B[i, k]
+                            if sp != 0.:
+                                for j in range(indptr[i], indptr[i + 1]):
+                                    posts[indices[j], k] += weights[j] * sp
+
+        else:
+            # csr @ B
+
+            if spike_info.dtype == jnp.bool_:
+                @numba.njit(fastmath=True)
+                def mv(weights, indices, indptr, B, posts):
+                    for i in range(indptr.shape[0] - 1):
+                        for k in range(B.shape[1]):
+                            r = 0.
+                            for j in range(indptr[i], indptr[i + 1]):
+                                if B[indices[j], k]:
+                                    r += weights[j]
+                            posts[i, k] = r
+
+            elif float_as_event:
+                @numba.njit(fastmath=True)
+                def mv(weights, indices, indptr, B, posts):
+                    B = B != 0.
+                    for i in range(indptr.shape[0] - 1):
+                        for k in range(B.shape[1]):
+                            r = 0.
+                            for j in range(indptr[i], indptr[i + 1]):
+                                if B[indices[j], k]:
+                                    r += weights[j]
+                            posts[i, k] = r
+
+            else:
+                @numba.njit(fastmath=True)
+                def mv(weights, indices, indptr, B, posts):
+                    for i in range(indptr.shape[0] - 1):
+                        for k in range(B.shape[1]):
+                            r = 0.
+                            for j in range(indptr[i], indptr[i + 1]):
+                                c = B[indices[j], k]
+                                if c != 0.:
+                                    r += weights[j] * c
+                            posts[i, k] = r
+
+    return mv
+
+
 event_csrmm_p = XLACustomOp(
     'event_csrmm',
-    cpu_kernel_or_generator=
+    cpu_kernel_or_generator=event_csrmm_cpu_kernel_generator,
 )
 event_csrmm_p.def_batching_rule(event_csrmm_batching)
 
```
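One detail worth noting in the new generator: the transpose kernels iterate over columns with `numba.prange` but are compiled with `parallel=False`, and under `parallel=False` a `prange` behaves exactly like a plain `range`. The column loops are mutually independent, so the scatter into `posts` could later be flipped to parallel execution without restructuring. A standalone sketch of that kernel shape; the function name and test data are illustrative:

```python
import numba
import numpy as np

# With parallel=False, numba.prange degrades to range, so the scatter-add
# below is race-free; with parallel=True the columns (k) would run
# concurrently, which is safe because each k touches a disjoint slice.
@numba.njit(fastmath=True, parallel=False)
def csrT_matmat(w, indices, indptr, B, posts):
    posts[:] = 0.
    for k in numba.prange(B.shape[1]):      # columns of the dense operand
        for i in range(B.shape[0]):         # presynaptic rows
            if B[i, k]:                     # event-driven: skip zeros
                for j in range(indptr[i], indptr[i + 1]):
                    posts[indices[j], k] += w

indptr = np.array([0, 2, 4], dtype=np.int64)
indices = np.array([0, 2, 1, 2], dtype=np.int64)
B = np.array([[True, False], [True, True]])
posts = np.zeros((3, 2))
csrT_matmat(1.5, indices, indptr, B, posts)
```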
```diff
@@ -884,11 +1125,13 @@ def event_csrmm_p_call(
         indptr,
         B,
         outs=[
-            jax.ShapeDtypeStruct([shape[
+            jax.ShapeDtypeStruct([shape[1], B.shape[1]], weights.dtype)
             if transpose else
-            jax.ShapeDtypeStruct([shape[
+            jax.ShapeDtypeStruct([shape[0], B.shape[1]], weights.dtype),
         ],
         # block_size=block_size,
+        shape=shape,
+        transpose=transpose,
         float_as_event=float_as_event,
         weight_info=jax.ShapeDtypeStruct(weights.shape, weights.dtype),
         spike_info=jax.ShapeDtypeStruct(B.shape, B.dtype),
```
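`event_csrmm_p_call` now forwards `shape` and `transpose` to the kernel generator and picks the output row count from `shape[1]` (transpose) or `shape[0]`. The batching rules above depend on folding a batched right-hand side into extra columns of a single matmul; a dense-numpy sketch of why that is sound (all names here are illustrative):

```python
import numpy as np

rng = np.random.default_rng(0)
A = rng.random((5, 4))       # stands in for the sparse operand
Bs = rng.random((3, 4, 6))   # (batch, m, n) batched right-hand side

# Rule for axis-0 batching: fold the batch into columns, one matmul, unfold.
batch, m, n = Bs.shape
folded = np.transpose(Bs, (1, 0, 2)).reshape(m, batch * n)   # (m, batch*n)
out = (A @ folded).reshape(A.shape[0], batch, n)             # batch lands on axis 1

expected = np.stack([A @ Bs[b] for b in range(batch)], axis=1)
assert np.allclose(out, expected)
```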
brainstate/event/_csr_test.py
CHANGED
```diff
@@ -18,6 +18,9 @@
 import unittest
 
 import brainunit as u
+import jax
+import jax.numpy as jnp
+import numpy as np
 
 import brainstate as bst
 
```
```diff
@@ -88,3 +91,187 @@ class TestCSR(unittest.TestCase):
                 v @ csr
             )
         )
+
+
+def _get_csr(n_pre, n_post, prob):
+    n_conn = int(n_post * prob)
+    indptr = np.arange(n_pre + 1) * n_conn
+    indices = np.random.randint(0, n_post, (n_pre * n_conn,))
+    return indptr, indices
+
+
+def vector_csr(x, w, indices, indptr, shape):
+    homo_w = jnp.size(w) == 1
+    post = jnp.zeros((shape[1],))
+    for i_pre in range(x.shape[0]):
+        ids = indices[indptr[i_pre]: indptr[i_pre + 1]]
+        post = post.at[ids].add(w * x[i_pre] if homo_w else w[indptr[i_pre]: indptr[i_pre + 1]] * x[i_pre])
+    return post
+
+
+def matrix_csr(xs, w, indices, indptr, shape):
+    homo_w = jnp.size(w) == 1
+    post = jnp.zeros((xs.shape[0], shape[1]))
+    for i_pre in range(xs.shape[1]):
+        ids = indices[indptr[i_pre]: indptr[i_pre + 1]]
+        post = post.at[:, ids].add(
+            w * xs[:, i_pre: i_pre + 1]
+            if homo_w else
+            (w[indptr[i_pre]: indptr[i_pre + 1]] * xs[:, i_pre: i_pre + 1])
+        )
+    return post
+
+
+def csr_vector(x, w, indices, indptr, shape):
+    homo_w = jnp.size(w) == 1
+    out = jnp.zeros([shape[0]])
+    for i in range(shape[0]):
+        ids = indices[indptr[i]: indptr[i + 1]]
+        ws = w if homo_w else w[indptr[i]: indptr[i + 1]]
+        out = out.at[i].set(jnp.sum(x[ids] * ws))
+    return out
+
+
+def csr_matrix(xs, w, indices, indptr, shape):
+    # CSR @ matrix
+    homo_w = jnp.size(w) == 1
+    out = jnp.zeros([shape[0], xs.shape[1]])
+    for i in range(shape[0]):
+        ids = indices[indptr[i]: indptr[i + 1]]
+        ws = w if homo_w else jnp.expand_dims(w[indptr[i]: indptr[i + 1]], axis=1)
+        out = out.at[i].set(jnp.sum(xs[ids] * ws, axis=0))
+    return out
+
+
+class TestVectorCSR(unittest.TestCase):
+    def test_vector_csr(self, ):
+        m, n = 20, 40
+        x = bst.random.rand(m) < 0.1
+        indptr, indices = _get_csr(m, n, 0.1)
+
+        for homo_w in [True, False]:
+            print(f'homo_w = {homo_w}')
+            data = 1.5 if homo_w else bst.init.Normal()(indices.shape)
+            csr = bst.event.CSR([data, indices, indptr], shape=(m, n))
+            y = x @ csr
+            y2 = vector_csr(x, csr.data, indices, indptr, [m, n])
+            self.assertTrue(jnp.allclose(y, y2))
+
+    def test_vector_csr_vmap_vector(self):
+        n_batch, m, n = 10, 20, 40
+        xs = bst.random.rand(n_batch, m) < 0.1
+        indptr, indices = _get_csr(m, n, 0.1)
+
+        for homo_w in [True, False]:
+            data = 1.5 if homo_w else bst.init.Normal()(indices.shape)
+            csr = bst.event.CSR([data, indices, indptr], shape=(m, n))
+            y = jax.vmap(lambda x: x @ csr)(xs)
+            y2 = jax.vmap(lambda x: vector_csr(x, csr.data, indices, indptr, [m, n]))(xs)
+            self.assertTrue(jnp.allclose(y, y2))
+
+
+class TestMatrixCSR(unittest.TestCase):
+    def test_matrix_csr(self):
+        k, m, n = 10, 20, 40
+        x = bst.random.rand(k, m) < 0.1
+        indptr, indices = _get_csr(m, n, 0.1)
+
+        for homo_w in [True, False]:
+            data = 1.5 if homo_w else bst.init.Normal()(indices.shape)
+            csr = bst.event.CSR([data, indices, indptr], shape=(m, n))
+            y = x @ csr
+            y2 = matrix_csr(x, csr.data, indices, indptr, [m, n])
+            self.assertTrue(jnp.allclose(y, y2))
+
+
+class TestCSRVector(unittest.TestCase):
+    def test_csr_vector(self):
+        m, n = 20, 40
+        v = bst.random.rand(n) < 0.1
+        indptr, indices = _get_csr(m, n, 0.1)
+
+        for homo_w in [True, False]:
+            data = 1.5 if homo_w else bst.init.Normal()(indices.shape)
+            csr = bst.event.CSR([data, indices, indptr], shape=(m, n))
+            y = csr @ v
+            y2 = csr_vector(v, csr.data, indices, indptr, [m, n])
+            self.assertTrue(jnp.allclose(y, y2))
+
+
+class TestCSRMatrix(unittest.TestCase):
+    def test_csr_matrix(self):
+        m, n, k = 20, 40, 10
+        matrix = bst.random.rand(n, k) < 0.1
+        indptr, indices = _get_csr(m, n, 0.1)
+
+        for homo_w in [True, False]:
+            data = 1.5 if homo_w else bst.init.Normal()(indices.shape)
+            csr = bst.event.CSR([data, indices, indptr], shape=(m, n))
+            y = csr @ matrix
+            y2 = csr_matrix(matrix, csr.data, indices, indptr, [m, n])
+            self.assertTrue(jnp.allclose(y, y2))
+
+    # @parameterized.product(
+    #     bool_x=[True, False],
+    #     homo_w=[True, False]
+    # )
+    # def test_vjp(self, bool_x, homo_w):
+    #     n_in = 20
+    #     n_out = 30
+    #     if bool_x:
+    #         x = jax.numpy.asarray(bst.random.rand(n_in) < 0.3, dtype=float)
+    #     else:
+    #         x = bst.random.rand(n_in)
+    #
+    #     indptr, indices = _get_csr(n_in, n_out, 0.1)
+    #     fn = bst.event.CSRLinear(n_in, n_out, indptr, indices, 1.5 if homo_w else bst.init.Normal())
+    #     w = fn.weight.value
+    #
+    #     def f(x, w):
+    #         fn.weight.value = w
+    #         return fn(x).sum()
+    #
+    #     r = jax.grad(f, argnums=(0, 1))(x, w)
+    #
+    #     # -------------------
+    #     # TRUE gradients
+    #
+    #     def f2(x, w):
+    #         return true_fn(x, w, indices, indptr, n_out).sum()
+    #
+    #     r2 = jax.grad(f2, argnums=(0, 1))(x, w)
+    #     self.assertTrue(jnp.allclose(r[0], r2[0]))
+    #     self.assertTrue(jnp.allclose(r[1], r2[1]))
+    #
+    # @parameterized.product(
+    #     bool_x=[True, False],
+    #     homo_w=[True, False]
+    # )
+    # def test_jvp(self, bool_x, homo_w):
+    #     n_in = 20
+    #     n_out = 30
+    #     if bool_x:
+    #         x = jax.numpy.asarray(bst.random.rand(n_in) < 0.3, dtype=float)
+    #     else:
+    #         x = bst.random.rand(n_in)
+    #
+    #     indptr, indices = _get_csr(n_in, n_out, 0.1)
+    #     fn = bst.event.CSRLinear(n_in, n_out, indptr, indices,
+    #                              1.5 if homo_w else bst.init.Normal(), grad_mode='jvp')
+    #     w = fn.weight.value
+    #
+    #     def f(x, w):
+    #         fn.weight.value = w
+    #         return fn(x)
+    #
+    #     o1, r1 = jax.jvp(f, (x, w), (jnp.ones_like(x), jnp.ones_like(w)))
+    #
+    #     # -------------------
+    #     # TRUE gradients
+    #
+    #     def f2(x, w):
+    #         return true_fn(x, w, indices, indptr, n_out)
+    #
+    #     o2, r2 = jax.jvp(f2, (x, w), (jnp.ones_like(x), jnp.ones_like(w)))
+    #     self.assertTrue(jnp.allclose(r1, r2))
+    #     self.assertTrue(jnp.allclose(o1, o2))
```
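`vector_csr`, `matrix_csr`, `csr_vector`, and `csr_matrix` are deliberately naive pure-JAX references that the event-driven kernels are compared against. A tiny hand-checked instance of the `vector_csr` scatter, with values chosen for illustration:

```python
import numpy as np
import jax.numpy as jnp

# 2 presynaptic, 3 postsynaptic neurons; each row stores 2 connections.
indptr = np.array([0, 2, 4])
indices = np.array([0, 2, 1, 2])
x = jnp.array([True, False])   # only presynaptic neuron 0 spikes
w = 1.5                        # homogeneous weight

post = jnp.zeros(3)
for i in range(2):
    ids = indices[indptr[i]: indptr[i + 1]]
    post = post.at[ids].add(w * x[i])   # boolean spike acts as 0/1
print(post)  # [1.5 0.  1.5] -- row 0 scatters w to its targets {0, 2}
```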
brainstate/event/_fixedprob_mv.py
CHANGED
```diff
@@ -24,6 +24,7 @@ import jax.numpy as jnp
 import numpy as np
 from jax.interpreters import ad
 
+from brainstate import environ
 from brainstate._state import ParamState
 from brainstate.augment import vmap
 from brainstate.init import param
@@ -111,7 +112,7 @@ class FixedProb(Module):
 
     def update(self, spk: jax.Array) -> Union[jax.Array, u.Quantity]:
         if self.n_conn > 1:
-
+            r = event_fixed_prob(
                 spk,
                 self.weight.value,
                 self.indices,
@@ -123,7 +124,8 @@ class FixedProb(Module):
             weight = self.weight.value
             unit = u.get_unit(weight)
             r = jnp.zeros(spk.shape[:-1] + (self.out_size[-1],), dtype=weight.dtype)
-
+            r = u.maybe_decimal(u.Quantity(r, unit=unit))
+            return u.math.asarray(r, dtype=environ.dftype())
 
 
 def event_fixed_prob(
```
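The degenerate `n_conn <= 1` path now re-attaches the weight's unit and casts the result to the default float dtype from `brainstate.environ`. A minimal sketch of what that path computes, under the assumption that the weight carries a `brainunit` unit; the shapes and values are illustrative:

```python
import brainunit as u
import jax.numpy as jnp
import brainstate as bst

weight = jnp.float32(0.5) * u.mV   # hypothetical weight with a unit
spk = jnp.zeros((8, 100))          # (batch, n_pre) spike input
out_size = 200                     # hypothetical layer output size

unit = u.get_unit(weight)
r = jnp.zeros(spk.shape[:-1] + (out_size,), dtype=weight.dtype)
r = u.maybe_decimal(u.Quantity(r, unit=unit))       # re-attach the unit
r = u.math.asarray(r, dtype=bst.environ.dftype())   # cast to default float type
```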
brainstate/event/_fixedprob_mv_test.py
CHANGED
```diff
@@ -128,4 +128,5 @@ class TestFixedProbCSR(parameterized.TestCase):
 
         o2, r2 = jax.jvp(f2, (x, w), (jnp.ones_like(x), jnp.ones_like(w)))
         self.assertTrue(jnp.allclose(o1, o2))
-
+        # assert jnp.allclose(r1, r2), f'r1={r1}, r2={r2}'
+        self.assertTrue(jnp.allclose(r1, r2, rtol=1e-4, atol=1e-4))
```
|