bartz 0.1.0__tar.gz → 0.2.0__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.1
2
2
  Name: bartz
3
- Version: 0.1.0
3
+ Version: 0.2.0
4
4
  Summary: A JAX implementation of BART
5
5
  Home-page: https://github.com/Gattocrucco/bartz
6
6
  License: MIT
@@ -20,7 +20,13 @@ Project-URL: Bug Tracker, https://github.com/Gattocrucco/bartz/issues
20
20
  Project-URL: Repository, https://github.com/Gattocrucco/bartz
21
21
  Description-Content-Type: text/markdown
22
22
 
23
+ [![PyPI](https://img.shields.io/pypi/v/bartz)](https://pypi.org/project/bartz/)
24
+
23
25
  # BART vectoriZed
24
26
 
25
27
  A branchless vectorized implementation of Bayesian Additive Regression Trees (BART) in JAX.
26
28
 
29
+ BART is a nonparametric Bayesian regression technique. Given predictors $X$ and responses $y$, BART finds a function to predict $y$ given $X$. The result of the inference is a sample of possible functions, representing the uncertainty over the determination of the function.
30
+
31
+ This Python module provides an implementation of BART that runs on GPU, to process large datasets faster. It also performs well on CPU. Most other implementations of BART are for R, and run on CPU only.
32
+
bartz-0.2.0/README.md ADDED
@@ -0,0 +1,9 @@
1
+ [![PyPI](https://img.shields.io/pypi/v/bartz)](https://pypi.org/project/bartz/)
2
+
3
+ # BART vectoriZed
4
+
5
+ A branchless vectorized implementation of Bayesian Additive Regression Trees (BART) in JAX.
6
+
7
+ BART is a nonparametric Bayesian regression technique. Given predictors $X$ and responses $y$, BART finds a function to predict $y$ given $X$. The result of the inference is a sample of possible functions, representing the uncertainty over the determination of the function.
8
+
9
+ This Python module provides an implementation of BART that runs on GPU, to process large datasets faster. It also performs well on CPU. Most other implementations of BART are for R, and run on CPU only.
@@ -28,7 +28,7 @@ build-backend = "poetry.core.masonry.api"
28
28
 
29
29
  [tool.poetry]
30
30
  name = "bartz"
31
- version = "0.1.0"
31
+ version = "0.2.0"
32
32
  description = "A JAX implementation of BART"
33
33
  authors = ["Giacomo Petrillo <info@giacomopetrillo.com>"]
34
34
  license = "MIT"
@@ -53,6 +53,7 @@ ipython = "^8.22.2"
53
53
  matplotlib = "^3.8.3"
54
54
  appnope = "^0.1.4"
55
55
  tomli = "^2.0.1"
56
+ packaging = "^24.0"
56
57
 
57
58
  [tool.poetry.group.test.dependencies]
58
59
  coverage = "^7.4.3"
@@ -60,7 +61,7 @@ pytest = "^8.1.1"
60
61
 
61
62
  [tool.poetry.group.docs.dependencies]
62
63
  Sphinx = "^7.2.6"
63
- numpydoc = "^1.6.0"
64
+ numpydoc = "^1.6.0,<1.7.0" # 1.7.0 breaks linkcode, it seems
64
65
  myst-parser = "^2.0.0"
65
66
 
66
67
  [tool.pytest.ini_options]
@@ -1,4 +1,4 @@
1
- # bartz/src/bartz/interface.py
1
+ # bartz/src/bartz/BART.py
2
2
  #
3
3
  # Copyright (c) 2024, Giacomo Petrillo
4
4
  #
@@ -33,7 +33,7 @@ from . import mcmcstep
33
33
  from . import mcmcloop
34
34
  from . import prepcovars
35
35
 
36
- class BART:
36
+ class gbart:
37
37
  """
38
38
  Nonparametric regression with Bayesian Additive Regression Trees (BART).
39
39
 
@@ -133,7 +133,7 @@ class BART:
133
133
 
134
134
  Notes
135
135
  -----
136
- This interface imitates the function `wbart` from the R package `BART
136
+ This interface imitates the function `gbart` from the R package `BART
137
137
  <https://cran.r-project.org/package=BART>`_, but with these differences:
138
138
 
139
139
  - If `x_train` and `x_test` are matrices, they have one predictor per row
@@ -142,6 +142,7 @@ class BART:
142
142
  - `usequants` is always `True`.
143
143
  - `rm_const` is always `False`.
144
144
  - The default `numcut` is 255 instead of 100.
145
+ - A lot of functionality is missing (variable selection, discrete response).
145
146
  - There are some additional attributes, and some missing.
146
147
  """
147
148
 
@@ -30,6 +30,11 @@ See the manual at https://gattocrucco.github.io/bartz/docs
30
30
 
31
31
  from ._version import __version__
32
32
 
33
- from .interface import BART
33
+ from . import BART
34
34
 
35
35
  from . import debug
36
+ from . import grove
37
+ from . import mcmcstep
38
+ from . import mcmcloop
39
+ from . import prepcovars
40
+ from . import jaxext
@@ -0,0 +1 @@
1
+ __version__ = '0.2.0'
@@ -6,6 +6,7 @@ from jax import lax
6
6
 
7
7
  from . import grove
8
8
  from . import mcmcstep
9
+ from . import jaxext
9
10
 
10
11
  def print_tree(leaf_tree, var_tree, split_tree, print_all=False):
11
12
 
@@ -83,7 +84,7 @@ def trace_depth_distr(split_trees_trace):
83
84
  def points_per_leaf_distr(var_tree, split_tree, X):
84
85
  traverse_tree = jax.vmap(grove.traverse_tree, in_axes=(1, None, None))
85
86
  indices = traverse_tree(X, var_tree, split_tree)
86
- count_tree = jnp.zeros(2 * split_tree.size, dtype=grove.minimal_unsigned_dtype(indices.size))
87
+ count_tree = jnp.zeros(2 * split_tree.size, dtype=jaxext.minimal_unsigned_dtype(indices.size))
87
88
  count_tree = count_tree.at[indices].add(1)
88
89
  is_leaf = grove.is_actual_leaf(split_tree, add_bottom_level=True).view(jnp.uint8)
89
90
  return jnp.bincount(count_tree, is_leaf, length=X.shape[1] + 1)
@@ -103,7 +104,7 @@ def trace_points_per_leaf_distr(bart, X):
103
104
  return distr
104
105
 
105
106
  def check_types(leaf_tree, var_tree, split_tree, max_split):
106
- expected_var_dtype = grove.minimal_unsigned_dtype(max_split.size - 1)
107
+ expected_var_dtype = jaxext.minimal_unsigned_dtype(max_split.size - 1)
107
108
  expected_split_dtype = max_split.dtype
108
109
  return var_tree.dtype == expected_var_dtype and split_tree.dtype == expected_split_dtype
109
110
 
@@ -117,7 +118,7 @@ def check_leaf_values(leaf_tree, var_tree, split_tree, max_split):
117
118
  return jnp.all(jnp.isfinite(leaf_tree))
118
119
 
119
120
  def check_stray_nodes(leaf_tree, var_tree, split_tree, max_split):
120
- index = jnp.arange(2 * split_tree.size, dtype=grove.minimal_unsigned_dtype(2 * split_tree.size - 1))
121
+ index = jnp.arange(2 * split_tree.size, dtype=jaxext.minimal_unsigned_dtype(2 * split_tree.size - 1))
121
122
  parent_index = index >> 1
122
123
  is_not_leaf = split_tree.at[index].get(mode='fill', fill_value=0) != 0
123
124
  parent_is_leaf = split_tree[parent_index] == 0
@@ -134,7 +135,7 @@ check_functions = [
134
135
  ]
135
136
 
136
137
  def check_tree(leaf_tree, var_tree, split_tree, max_split):
137
- error_type = grove.minimal_unsigned_dtype(2 ** len(check_functions) - 1)
138
+ error_type = jaxext.minimal_unsigned_dtype(2 ** len(check_functions) - 1)
138
139
  error = error_type(0)
139
140
  for i, func in enumerate(check_functions):
140
141
  ok = func(leaf_tree, var_tree, split_tree, max_split)
@@ -44,7 +44,6 @@ import functools
44
44
  import math
45
45
 
46
46
  import jax
47
-
48
47
  from jax import numpy as jnp
49
48
  from jax import lax
50
49
 
@@ -107,29 +106,47 @@ def traverse_tree(x, var_tree, split_tree):
107
106
 
108
107
  carry = (
109
108
  jnp.zeros((), bool),
110
- jnp.ones((), minimal_unsigned_dtype(2 * var_tree.size - 1)),
109
+ jnp.ones((), jaxext.minimal_unsigned_dtype(2 * var_tree.size - 1)),
111
110
  )
112
111
 
113
112
  def loop(carry, _):
114
113
  leaf_found, index = carry
115
114
 
116
- split = split_tree.at[index].get(mode='fill', fill_value=0)
117
- var = var_tree.at[index].get(mode='fill', fill_value=0)
115
+ split = split_tree[index]
116
+ var = var_tree[index]
118
117
 
119
- leaf_found |= split_tree.at[index].get(mode='fill', fill_value=0) == 0
118
+ leaf_found |= split == 0
120
119
  child_index = (index << 1) + (x[var] >= split)
121
120
  index = jnp.where(leaf_found, index, child_index)
122
121
 
123
122
  return (leaf_found, index), None
124
123
 
125
- # TODO
126
- # - unroll (how much? 5?)
127
- # - separate and special-case the last iteration
128
-
129
- depth = 1 + tree_depth(var_tree)
130
- (_, index), _ = lax.scan(loop, carry, None, depth)
124
+ depth = tree_depth(var_tree)
125
+ (_, index), _ = lax.scan(loop, carry, None, depth, unroll=16)
131
126
  return index
132
127
 
128
@functools.partial(jaxext.vmap_nodoc, in_axes=(None, 0, 0))
@functools.partial(jaxext.vmap_nodoc, in_axes=(1, None, None))
def traverse_forest(X, var_trees, split_trees):
    """
    Find the leaves where points fall into.

    Parameters
    ----------
    X : array (p, n)
        The coordinates to evaluate the trees at.
    var_trees : array (m, 2 ** (d - 1))
        The decision axes of the trees.
    split_trees : array (m, 2 ** (d - 1))
        The decision boundaries of the trees.

    Returns
    -------
    indices : array (m, n)
        The indices of the leaves.
    """
    # The single-point, single-tree traversal is vectorized twice: the inner
    # vmap maps over points (axis 1 of X), the outer one over trees (axis 0 of
    # the tree arrays). `vmap_nodoc` is used instead of `jax.vmap` so this
    # docstring survives the wrapping.
    return traverse_tree(X, var_trees, split_trees)
149
+
133
150
  def evaluate_forest(X, leaf_trees, var_trees, split_trees, dtype):
134
151
  """
135
152
  Evaluate a ensemble of trees at an array of points.
@@ -138,7 +155,7 @@ def evaluate_forest(X, leaf_trees, var_trees, split_trees, dtype):
138
155
  ----------
139
156
  X : array (p, n)
140
157
  The coordinates to evaluate the trees at.
141
- leaf_trees : (m, 2 ** d)
158
+ leaf_trees : array (m, 2 ** d)
142
159
  The leaf values of the tree or forest. If the input is a forest, the
143
160
  first axis is the tree index, and the values are summed.
144
161
  var_trees : array (m, 2 ** (d - 1))
@@ -153,30 +170,13 @@ def evaluate_forest(X, leaf_trees, var_trees, split_trees, dtype):
153
170
  out : array (n,)
154
171
  The sum of the values of the trees at the points in `X`.
155
172
  """
156
- indices = _traverse_forest(X, var_trees, split_trees)
173
+ indices = traverse_forest(X, var_trees, split_trees)
157
174
  ntree, _ = leaf_trees.shape
158
- tree_index = jnp.arange(ntree, dtype=minimal_unsigned_dtype(ntree - 1))[:, None]
175
+ tree_index = jnp.arange(ntree, dtype=jaxext.minimal_unsigned_dtype(ntree - 1))[:, None]
159
176
  leaves = leaf_trees[tree_index, indices]
160
177
  return jnp.sum(leaves, axis=0, dtype=dtype)
161
- # this sum suggests to swap the vmaps, but I think it's better for X copying to keep it that way
162
-
163
- @functools.partial(jax.vmap, in_axes=(None, 0, 0))
164
- @functools.partial(jax.vmap, in_axes=(1, None, None))
165
- def _traverse_forest(X, var_trees, split_trees):
166
- return traverse_tree(X, var_trees, split_trees)
167
-
168
- def minimal_unsigned_dtype(max_value):
169
- """
170
- Return the smallest unsigned integer dtype that can represent a given
171
- maximum value.
172
- """
173
- if max_value < 2 ** 8:
174
- return jnp.uint8
175
- if max_value < 2 ** 16:
176
- return jnp.uint16
177
- if max_value < 2 ** 32:
178
- return jnp.uint32
179
- return jnp.uint64
178
+ # this sum suggests to swap the vmaps, but I think it's better for X
179
+ # copying to keep it that way
180
180
 
181
181
  def is_actual_leaf(split_tree, *, add_bottom_level=False):
182
182
  """
@@ -200,7 +200,7 @@ def is_actual_leaf(split_tree, *, add_bottom_level=False):
200
200
  if add_bottom_level:
201
201
  size *= 2
202
202
  is_leaf = jnp.concatenate([is_leaf, jnp.ones_like(is_leaf)])
203
- index = jnp.arange(size, dtype=minimal_unsigned_dtype(size - 1))
203
+ index = jnp.arange(size, dtype=jaxext.minimal_unsigned_dtype(size - 1))
204
204
  parent_index = index >> 1
205
205
  parent_nonleaf = split_tree[parent_index].astype(bool)
206
206
  parent_nonleaf = parent_nonleaf.at[1].set(True)
@@ -220,7 +220,7 @@ def is_leaves_parent(split_tree):
220
220
  is_leaves_parent : bool array (2 ** (d - 1),)
221
221
  The mask indicating which nodes have leaf children.
222
222
  """
223
- index = jnp.arange(split_tree.size, dtype=minimal_unsigned_dtype(2 * split_tree.size - 1))
223
+ index = jnp.arange(split_tree.size, dtype=jaxext.minimal_unsigned_dtype(2 * split_tree.size - 1))
224
224
  left_index = index << 1 # left child
225
225
  right_index = left_index + 1 # right child
226
226
  left_leaf = split_tree.at[left_index].get(mode='fill', fill_value=0) == 0
@@ -252,4 +252,4 @@ def tree_depths(tree_length):
252
252
  depth += 1
253
253
  depths.append(depth - 1)
254
254
  depths[0] = 0
255
- return jnp.array(depths, minimal_unsigned_dtype(max(depths)))
255
+ return jnp.array(depths, jaxext.minimal_unsigned_dtype(max(depths)))
@@ -0,0 +1,341 @@
1
+ # bartz/src/bartz/jaxext.py
2
+ #
3
+ # Copyright (c) 2024, Giacomo Petrillo
4
+ #
5
+ # This file is part of bartz.
6
+ #
7
+ # Permission is hereby granted, free of charge, to any person obtaining a copy
8
+ # of this software and associated documentation files (the "Software"), to deal
9
+ # in the Software without restriction, including without limitation the rights
10
+ # to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
11
+ # copies of the Software, and to permit persons to whom the Software is
12
+ # furnished to do so, subject to the following conditions:
13
+ #
14
+ # The above copyright notice and this permission notice shall be included in all
15
+ # copies or substantial portions of the Software.
16
+ #
17
+ # THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
18
+ # IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
19
+ # FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
20
+ # AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
21
+ # LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
22
+ # OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
23
+ # SOFTWARE.
24
+
25
+ import functools
26
+ import math
27
+ import warnings
28
+
29
+ from scipy import special
30
+ import jax
31
+ from jax import numpy as jnp
32
+ from jax import tree_util
33
+ from jax import lax
34
+
35
def float_type(*args):
    """
    Determine the jax floating point result type given operands/types.
    """
    common = jnp.result_type(*args)
    # apply a transcendental function to an empty array of the common type:
    # its result dtype is the floating type jax would promote to
    probe = jnp.empty(0, common)
    return jnp.sin(probe).dtype
41
+
42
def castto(func, type):
    """Wrap `func` such that its array result is cast to dtype `type`."""
    @functools.wraps(func)
    def newfunc(*args, **kw):
        raw = func(*args, **kw)
        return raw.astype(type)
    return newfunc
47
+
48
def pure_callback_ufunc(callback, dtype, *args, excluded=None, **kwargs):
    """
    Version of `jax.pure_callback` that deals correctly with ufuncs,
    see `<https://github.com/google/jax/issues/17187>`_.

    Parameters
    ----------
    callback : callable
        A numpy-ufunc-like function, invoked on the host outside of tracing.
    dtype : dtype
        The dtype of the result.
    *args : arrays
        The arguments passed to `callback`, broadcast together.
    excluded : sequence of int, optional
        Positional indices of arguments that do not participate in the
        broadcasting and are passed through as-is.
    **kwargs :
        Additional keyword arguments forwarded to `jax.pure_callback`.
    """
    if excluded is None:
        excluded = ()
    # broadcast only the participating arguments to get the output shape
    shape = jnp.broadcast_shapes(*(
        a.shape
        for i, a in enumerate(args)
        if i not in excluded
    ))
    ndim = len(shape)
    # left-pad each participating argument with length-1 axes so they all
    # share the same rank before being handed to the callback machinery
    padded_args = [
        a if i in excluded
        else jnp.expand_dims(a, tuple(range(ndim - a.ndim)))
        for i, a in enumerate(args)
    ]
    result = jax.ShapeDtypeStruct(shape, dtype)
    # NOTE(review): `vectorized=True` is deprecated in recent jax releases in
    # favor of `vmap_method` — confirm against the jax version pinned here.
    return jax.pure_callback(callback, result, *padded_args, vectorized=True, **kwargs)
66
+
67
+ # TODO when jax solves this, check version and piggyback on original if new
68
+
69
class scipy:
    """
    Namespace imitating a small subset of the `scipy` package, with the
    functions wrapped so they are usable under jax tracing via host callbacks.
    """

    class special:

        @functools.wraps(special.gammainccinv)
        def gammainccinv(a, y):
            # evaluated on the host through a callback, since jax provides no
            # implementation of the inverse regularized upper incomplete gamma
            a = jnp.asarray(a)
            y = jnp.asarray(y)
            # promote to the floating dtype jax would use for these operands
            dtype = float_type(a.dtype, y.dtype)
            ufunc = castto(special.gammainccinv, dtype)
            return pure_callback_ufunc(ufunc, dtype, a, y)

    class stats:

        class invgamma:

            def ppf(q, a):
                # inverse-gamma quantile via the identity
                # P(X <= x) = gammaincc(a, 1/x) for X ~ InvGamma(a),
                # hence the q-quantile is 1 / gammainccinv(a, q)
                return 1 / scipy.special.gammainccinv(a, q)
87
+
88
@functools.wraps(jax.vmap)
def vmap_nodoc(fun, *args, **kw):
    """
    Version of `jax.vmap` that preserves the docstring of the input function.
    """
    # jax.vmap replaces the docstring with its own boilerplate; save the
    # original one and restore it on the vectorized function
    original_doc = fun.__doc__
    mapped = jax.vmap(fun, *args, **kw)
    mapped.__doc__ = original_doc
    return mapped
97
+
98
def huge_value(x):
    """
    Return the maximum value that can be stored in `x`.

    Parameters
    ----------
    x : array
        A numerical numpy or jax array.

    Returns
    -------
    maxval : scalar
        The maximum value allowed by `x`'s type (+inf for floats).
    """
    # floats have no finite "largest useful" value for this purpose
    if not jnp.issubdtype(x.dtype, jnp.integer):
        return jnp.inf
    return jnp.iinfo(x.dtype).max
116
+
117
def minimal_unsigned_dtype(max_value):
    """
    Return the smallest unsigned integer dtype that can represent a given
    maximum value (inclusive).
    """
    # try candidates in increasing width; fall through to 64 bits
    candidates = (
        (8, jnp.uint8),
        (16, jnp.uint16),
        (32, jnp.uint32),
    )
    for bits, dtype in candidates:
        if max_value < 2 ** bits:
            return dtype
    return jnp.uint64
129
+
130
def signed_to_unsigned(int_dtype):
    """
    Map a signed integer type to its unsigned counterpart. Unsigned types are
    passed through.
    """
    assert jnp.issubdtype(int_dtype, jnp.integer)
    if jnp.issubdtype(int_dtype, jnp.unsignedinteger):
        return int_dtype
    # compare with `==` (not a dict lookup) so that both dtype instances
    # (e.g. dtype('int8')) and scalar types (jnp.int8) match
    pairs = (
        (jnp.int8, jnp.uint8),
        (jnp.int16, jnp.uint16),
        (jnp.int32, jnp.uint32),
        (jnp.int64, jnp.uint64),
    )
    for signed, unsigned in pairs:
        if int_dtype == signed:
            return unsigned
146
+
147
def ensure_unsigned(x):
    """
    If x has signed integer type, cast it to the unsigned dtype of the same size.
    """
    target_dtype = signed_to_unsigned(x.dtype)
    return x.astype(target_dtype)
152
+
153
@functools.partial(jax.jit, static_argnums=(1,))
def unique(x, size, fill_value):
    """
    Restricted version of `jax.numpy.unique` that uses less memory.

    Parameters
    ----------
    x : 1d array
        The input array.
    size : int
        The length of the output.
    fill_value : scalar
        The value to fill the output with if `size` is greater than the number
        of unique values in `x`.

    Returns
    -------
    out : array (size,)
        The unique values in `x`, sorted, and right-padded with `fill_value`.
    actual_length : int
        The number of used values in `out`.
    """
    # degenerate cases: nothing to scan over
    if x.size == 0:
        return jnp.full(size, fill_value, x.dtype), 0
    if size == 0:
        return jnp.empty(0, x.dtype), 0

    sorted_x = jnp.sort(x)

    def write_next(carry, value):
        # advance the write cursor only when a new distinct value appears
        write_pos, read_pos, previous, buffer = carry
        write_pos = jnp.where(value == previous, write_pos, write_pos + 1)
        buffer = buffer.at[write_pos].set(value)
        return (write_pos, read_pos + 1, value, buffer), None

    # seeding `previous` with the first element means position 0 is always
    # written without advancing the cursor on the first step
    init = 0, 0, sorted_x[0], jnp.full(size, fill_value, x.dtype)
    (last_pos, _, _, out), _ = jax.lax.scan(write_next, init, sorted_x[:size])
    return out, last_pos + 1
188
+
189
def autobatch(func, max_io_nbytes, in_axes=0, out_axes=0, return_nbatches=False):
    """
    Batch a function such that each batch is smaller than a threshold.

    Parameters
    ----------
    func : callable
        A jittable function with positional arguments only, with inputs and
        outputs pytrees of arrays.
    max_io_nbytes : int
        The maximum number of input + output bytes in each batch.
    in_axes : pytree of ints, default 0
        A tree matching the structure of the function input, indicating along
        which axes each array should be batched. If a single integer, it is
        used for all arrays.
    out_axes : pytree of ints, default 0
        The same for outputs.
    return_nbatches : bool, default False
        If True, the number of batches is returned as a second output.

    Returns
    -------
    batched_func : callable
        A function with the same signature as `func`, but that processes the
        input and output in batches in a loop.
    """

    # broadcast a scalar axis spec to the whole tree, or align a tree of axes
    # with the tree of arrays
    def expand_axes(axes, tree):
        if isinstance(axes, int):
            return tree_util.tree_map(lambda _: axes, tree)
        return tree_util.tree_map(lambda _, axis: axis, tree, axes)

    # length of the batched axis, checked to be identical across all arrays
    def extract_size(axes, tree):
        sizes = tree_util.tree_map(lambda x, axis: x.shape[axis], tree, axes)
        sizes, _ = tree_util.tree_flatten(sizes)
        assert all(s == sizes[0] for s in sizes)
        return sizes[0]

    # total storage of all arrays in the tree, in bytes
    def sum_nbytes(tree):
        def nbytes(x):
            return math.prod(x.shape) * x.dtype.itemsize
        return tree_util.tree_reduce(lambda size, x: size + nbytes(x), tree, 0)

    # smallest divisor of `dividend` that is >= min_divisor, searching upward
    # (used when min_divisor <= sqrt(dividend))
    def next_divisor_small(dividend, min_divisor):
        for divisor in range(min_divisor, int(math.sqrt(dividend)) + 1):
            if dividend % divisor == 0:
                return divisor
        return dividend

    # same, but searching by cofactor when min_divisor > sqrt(dividend)
    def next_divisor_large(dividend, min_divisor):
        max_inv_divisor = dividend // min_divisor
        for inv_divisor in range(max_inv_divisor, 0, -1):
            if dividend % inv_divisor == 0:
                return dividend // inv_divisor
        return dividend

    def next_divisor(dividend, min_divisor):
        if min_divisor * min_divisor <= dividend:
            return next_divisor_small(dividend, min_divisor)
        return next_divisor_large(dividend, min_divisor)

    # bring each array's batched axis to position 0 (for scanning)
    def move_axes_out(axes, tree):
        def move_axis_out(axis, x):
            if axis != 0:
                return jnp.moveaxis(x, axis, 0)
            return x
        return tree_util.tree_map(move_axis_out, axes, tree)

    # inverse of move_axes_out
    def move_axes_in(axes, tree):
        def move_axis_in(axis, x):
            if axis != 0:
                return jnp.moveaxis(x, 0, axis)
            return x
        return tree_util.tree_map(move_axis_in, axes, tree)

    # reshape leading axis (size,) -> (nbatches, size // nbatches)
    def batch(tree, nbatches):
        def batch(x):
            return x.reshape((nbatches, x.shape[0] // nbatches) + x.shape[1:])
        return tree_util.tree_map(batch, tree)

    # inverse of batch: merge the two leading axes back together
    def unbatch(tree):
        def unbatch(x):
            return x.reshape((x.shape[0] * x.shape[1],) + x.shape[2:])
        return tree_util.tree_map(unbatch, tree)

    # sanity check: the batched computation produced the same shapes/dtypes
    # that eval_shape predicted for the unbatched call
    def check_same(tree1, tree2):
        def check_same(x1, x2):
            assert x1.shape == x2.shape
            assert x1.dtype == x2.dtype
        tree_util.tree_map(check_same, tree1, tree2)

    # keep the user-provided specs; the names in_axes/out_axes are rebound
    # inside batched_func after expansion
    initial_in_axes = in_axes
    initial_out_axes = out_axes

    @jax.jit
    @functools.wraps(func)
    def batched_func(*args):
        # shapes/dtypes of the result without running the computation
        example_result = jax.eval_shape(func, *args)

        in_axes = expand_axes(initial_in_axes, args)
        out_axes = expand_axes(initial_out_axes, example_result)

        in_size = extract_size(in_axes, args)
        out_size = extract_size(out_axes, example_result)
        assert in_size == out_size
        size = in_size

        # pick the smallest number of batches that both divides `size` evenly
        # and keeps each batch under the byte threshold (ceil division)
        total_nbytes = sum_nbytes(args) + sum_nbytes(example_result)
        min_nbatches = total_nbytes // max_io_nbytes + bool(total_nbytes % max_io_nbytes)
        nbatches = next_divisor(size, min_nbatches)
        assert 1 <= nbatches <= size
        assert size % nbatches == 0
        assert total_nbytes % nbatches == 0

        # even one item per batch may exceed the threshold; warn, don't fail
        batch_nbytes = total_nbytes // nbatches
        if batch_nbytes > max_io_nbytes:
            assert size == nbatches
            warnings.warn(f'batch_nbytes = {batch_nbytes} > max_io_nbytes = {max_io_nbytes}')

        # each scan step restores the user's axis layout, applies `func`, and
        # moves the batched axis back to the front for stacking
        def loop(_, args):
            args = move_axes_in(in_axes, args)
            result = func(*args)
            result = move_axes_out(out_axes, result)
            return None, result

        args = move_axes_out(in_axes, args)
        args = batch(args, nbatches)
        _, result = lax.scan(loop, None, args)
        result = unbatch(result)
        result = move_axes_in(out_axes, result)

        check_same(example_result, result)

        if return_nbatches:
            return result, nbatches
        return result

    return batched_func
327
+
328
@tree_util.register_pytree_node_class
class LeafDict(dict):
    """
    Dictionary that acts as a leaf in jax pytrees, to store compile-time
    values.
    """

    def tree_flatten(self):
        # no dynamic children: the whole dict rides along as static aux data
        return tuple(), self

    @classmethod
    def tree_unflatten(cls, aux_data, children):
        # the dict stored as aux data comes back unchanged
        return aux_data

    def __repr__(self):
        return '{}({})'.format(__class__.__name__, super().__repr__())