PyPI - bartz - Versions diffs - 0.5.0__py3-none-any.whl → 0.6.0__py3-none-any.whl - Mend

bartz 0.5.0__py3-none-any.whl → 0.6.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (13) hide show

bartz/BART.py +196 -103
bartz/__init__.py +1 -1
bartz/_version.py +1 -1
bartz/debug.py +1 -1
bartz/grove.py +43 -2
bartz/jaxext.py +82 -33
bartz/mcmcloop.py +367 -114
bartz/mcmcstep.py +1322 -807
bartz/prepcovars.py +3 -1
{bartz-0.5.0.dist-info → bartz-0.6.0.dist-info}/METADATA +7 -5
bartz-0.6.0.dist-info/RECORD +13 -0
{bartz-0.5.0.dist-info → bartz-0.6.0.dist-info}/WHEEL +1 -1
bartz-0.5.0.dist-info/RECORD +0 -13

bartz/mcmcloop.py CHANGED Viewed

@@ -22,57 +22,141 @@
 # OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
 # SOFTWARE.
-"""
-Functions that implement the full BART posterior MCMC loop.
-"""
+"""Functions that implement the full BART posterior MCMC loop."""
 import functools
 import jax
-from jax import debug, lax, random, tree
+import numpy
+from jax import debug, lax, tree
 from jax import numpy as jnp
+from jaxtyping import Array, Real
 from . import grove, jaxext, mcmcstep
+from .mcmcstep import State
-@functools.partial(jax.jit, static_argnums=(2, 3, 4, 5))
-def run_mcmc(key, bart, n_burn, n_save, n_skip, callback):
+def default_onlymain_extractor(state: State) -> dict[str, Real[Array, 'samples *']]:
+    """Extract variables for the main trace, to be used in `run_mcmc`."""
+    return dict(
+        leaf_trees=state.forest.leaf_trees,
+        var_trees=state.forest.var_trees,
+        split_trees=state.forest.split_trees,
+        offset=state.offset,
+    )
+def default_both_extractor(state: State) -> dict[str, Real[Array, 'samples *'] | None]:
+    """Extract variables for main & burn-in traces, to be used in `run_mcmc`."""
+    return dict(
+        sigma2=state.sigma2,
+        grow_prop_count=state.forest.grow_prop_count,
+        grow_acc_count=state.forest.grow_acc_count,
+        prune_prop_count=state.forest.prune_prop_count,
+        prune_acc_count=state.forest.prune_acc_count,
+        log_likelihood=state.forest.log_likelihood,
+        log_trans_prior=state.forest.log_trans_prior,
+    )
+def run_mcmc(
+    key,
+    bart,
+    n_save,
+    *,
+    n_burn=0,
+    n_skip=1,
+    inner_loop_length=None,
+    allow_overflow=False,
+    inner_callback=None,
+    outer_callback=None,
+    callback_state=None,
+    onlymain_extractor=default_onlymain_extractor,
+    both_extractor=default_both_extractor,
+):
     """
     Run the MCMC for the BART posterior.
     Parameters
     ----------
     key : jax.dtypes.prng_key array
-        The key for random number generation.
+        A key for random number generation.
     bart : dict
         The initial MCMC state, as created and updated by the functions in
-        `bartz.mcmcstep`.
-    n_burn : int
-        The number of initial iterations which are not saved.
+        `bartz.mcmcstep`. The MCMC loop uses buffer donation to avoid copies,
+        so this variable is invalidated after running `run_mcmc`. Make a copy
+        beforehand to use it again.
     n_save : int
         The number of iterations to save.
-    n_skip : int
+    n_burn : int, default 0
+        The number of initial iterations which are not saved.
+    n_skip : int, default 1
         The number of iterations to skip between each saved iteration, plus 1.
         The effective burn-in is ``n_burn + n_skip - 1``.
-    callback : callable
-        An arbitrary function run at each iteration, called with the following
-        arguments, passed by keyword:
+    inner_loop_length : int, optional
+        The MCMC loop is split into an outer and an inner loop. The outer loop
+        is in Python, while the inner loop is in JAX. `inner_loop_length` is the
+        number of iterations of the inner loop to run for each iteration of the
+        outer loop. If not specified, the outer loop will iterate just once,
+        with all iterations done in a single inner loop run. The inner stride is
+        unrelated to the stride used for saving the trace.
+    allow_overflow : bool, default False
+        If `False`, `inner_loop_length` must be a divisor of the total number of
+        iterations ``n_burn + n_skip * n_save``. If `True` and
+        `inner_loop_length` is not a divisor, some of the MCMC iterations in the
+        last outer loop iteration will not be saved to the trace.
+    inner_callback : callable, optional
+    outer_callback : callable, optional
+        Arbitrary functions run during the loop after updating the state.
+        `inner_callback` is called after each update, while `outer_callback` is
+        called after completing an inner loop. The callbacks are invoked with
+        the following arguments, passed by keyword:
         bart : dict
             The MCMC state just after updating it.
         burnin : bool
             Whether the last iteration was in the burn-in phase.
+        overflow : bool
+            Whether the last iteration was in the overflow phase (iterations
+            not saved due to `inner_loop_length` not being a divisor of the
+            total number of iterations).
         i_total : int
-            The index of the last iteration (0-based).
+            The index of the last MCMC iteration (0-based).
         i_skip : int
             The number of MCMC updates from the last saved state. The initial
             state counts as saved, even if it's not copied into the trace.
+        callback_state : jax pytree
+            The callback state, initially set to the argument passed to
+            `run_mcmc`, afterwards to the value returned by the last invocation
+            of `inner_callback` or `outer_callback`.
         n_burn, n_save, n_skip : int
             The corresponding arguments as-is.
+        i_outer : int
+            The index of the last outer loop iteration (0-based).
+        inner_loop_length : int
+            The number of MCMC iterations in the inner loop.
+        `inner_callback` is called under the jax jit, so the argument values are
+        not available at the time the Python code is executed. Use the utilities
+        in `jax.debug` to access the values at actual runtime.
-        Since this function is called under the jax jit, the values are not
-        available at the time the Python code is executed. Use the utilities in
-        `jax.debug` to access the values at actual runtime.
+        The callbacks must return two values:
+        bart : dict
+            A possibly modified MCMC state. To avoid modifying the state,
+            return the `bart` argument passed to the callback as-is.
+        callback_state : jax pytree
+            The new state to be passed on the next callback invocation.
+        For convenience, if a callback returns `None`, the states are not
+        updated.
+    callback_state : jax pytree, optional
+        The initial state for the callbacks.
+    onlymain_extractor : callable, optional
+    both_extractor : callable, optional
+        Functions that extract the variables to be saved respectively only in
+        the main trace and in both traces, given the MCMC state as argument.
+        Must return a pytree, and must be vmappable.
     Returns
     -------
@@ -82,12 +166,20 @@ def run_mcmc(key, bart, n_burn, n_save, n_skip, callback):
         The trace of the burn-in phase, containing the following subset of
         fields from the `bart` dictionary, with an additional head index that
         runs over MCMC iterations: 'sigma2', 'grow_prop_count',
-        'grow_acc_count', 'prune_prop_count', 'prune_acc_count'.
+        'grow_acc_count', 'prune_prop_count', 'prune_acc_count' (or, if
+        specified, the fields returned by `both_extractor`).
     main_trace : dict of (n_save, ...) arrays
         The trace of the main phase, containing the following subset of fields
-        from the `bart` dictionary, with an additional head index that runs
-        over MCMC iterations: 'leaf_trees', 'var_trees', 'split_trees', plus
-        the fields in `burnin_trace`.
+        from the `bart` dictionary, with an additional head index that runs over
+        MCMC iterations: 'leaf_trees', 'var_trees', 'split_trees' (or, if
+        specified, the fields returned by `onlymain_extractor`), plus the fields
+        in `burnin_trace`.
+    Raises
+    ------
+    ValueError
+        If `inner_loop_length` is not a divisor of the total number of
+        iterations and `allow_overflow` is `False`.
     Notes
     -----
@@ -95,49 +187,118 @@ def run_mcmc(key, bart, n_burn, n_save, n_skip, callback):
     not include the initial state, and include the final state.
     """
-    tracevars_light = (
-        'sigma2',
-        'grow_prop_count',
-        'grow_acc_count',
-        'prune_prop_count',
-        'prune_acc_count',
-        'ratios',
-    )
-    tracevars_heavy = ('leaf_trees', 'var_trees', 'split_trees')
+    def empty_trace(length, bart, extractor):
+        return jax.vmap(extractor, in_axes=None, out_axes=0, axis_size=length)(bart)
+    trace_both = empty_trace(n_burn + n_save, bart, both_extractor)
+    trace_onlymain = empty_trace(n_save, bart, onlymain_extractor)
+    # determine number of iterations for inner and outer loops
+    n_iters = n_burn + n_skip * n_save
+    if inner_loop_length is None:
+        inner_loop_length = n_iters
+    n_outer = n_iters // inner_loop_length
+    if n_iters % inner_loop_length:
+        if allow_overflow:
+            n_outer += 1
+        else:
+            raise ValueError(f'{n_iters=} is not divisible by {inner_loop_length=}')
+    carry = (bart, 0, key, trace_both, trace_onlymain, callback_state)
+    for i_outer in range(n_outer):
+        carry = _run_mcmc_inner_loop(
+            carry,
+            inner_loop_length,
+            inner_callback,
+            onlymain_extractor,
+            both_extractor,
+            n_burn,
+            n_save,
+            n_skip,
+            i_outer,
+        )
+        if outer_callback is not None:
+            bart, i_total, key, trace_both, trace_onlymain, callback_state = carry
+            i_total -= 1  # because i_total is updated at the end of the inner loop
+            i_skip = _compute_i_skip(i_total, n_burn, n_skip)
+            rt = outer_callback(
+                bart=bart,
+                burnin=i_total < n_burn,
+                overflow=i_total >= n_iters,
+                i_total=i_total,
+                i_skip=i_skip,
+                callback_state=callback_state,
+                n_burn=n_burn,
+                n_save=n_save,
+                n_skip=n_skip,
+                i_outer=i_outer,
+                inner_loop_length=inner_loop_length,
+            )
+            if rt is not None:
+                bart, callback_state = rt
+                i_total += 1
+                carry = (bart, i_total, key, trace_both, trace_onlymain, callback_state)
+    bart, _, _, trace_both, trace_onlymain, _ = carry
+    burnin_trace = tree.map(lambda x: x[:n_burn, ...], trace_both)
+    main_trace = tree.map(lambda x: x[n_burn:, ...], trace_both)
+    main_trace.update(trace_onlymain)
-    def empty_trace(length, bart, tracelist):
-        bart = {k: v for k, v in bart.items() if k in tracelist}
-        return jax.vmap(lambda x: x, in_axes=None, out_axes=0, axis_size=length)(bart)
+    return bart, burnin_trace, main_trace
-    trace_light = empty_trace(n_burn + n_save, bart, tracevars_light)
-    trace_heavy = empty_trace(n_save, bart, tracevars_heavy)
-    callback_kw = dict(n_burn=n_burn, n_save=n_save, n_skip=n_skip)
+def _compute_i_skip(i_total, n_burn, n_skip):
+    burnin = i_total < n_burn
+    return jnp.where(
+        burnin,
+        i_total + 1,
+        (i_total + 1) % n_skip + jnp.where(i_total + 1 < n_skip, n_burn, 0),
+    )
-    carry = (bart, 0, key, trace_light, trace_heavy)
+@functools.partial(jax.jit, donate_argnums=(0,), static_argnums=(1, 2, 3, 4))
+def _run_mcmc_inner_loop(
+    carry,
+    inner_loop_length,
+    inner_callback,
+    onlymain_extractor,
+    both_extractor,
+    n_burn,
+    n_save,
+    n_skip,
+    i_outer,
+):
     def loop(carry, _):
-        bart, i_total, key, trace_light, trace_heavy = carry
+        bart, i_total, key, trace_both, trace_onlymain, callback_state = carry
-        key, subkey = random.split(key)
-        bart = mcmcstep.step(subkey, bart)
+        keys = jaxext.split(key)
+        key = keys.pop()
+        bart = mcmcstep.step(keys.pop(), bart)
         burnin = i_total < n_burn
-        i_skip = jnp.where(
-            burnin,
-            i_total + 1,
-            (i_total + 1) % n_skip + jnp.where(i_total + 1 < n_skip, n_burn, 0),
-        )
-        callback(
-            bart=bart, burnin=burnin, i_total=i_total, i_skip=i_skip, **callback_kw
-        )
-        i_heavy = jnp.where(burnin, 0, (i_total - n_burn) // n_skip)
-        i_light = jnp.where(burnin, i_total, n_burn + i_heavy)
-        def update_trace(index, trace, bart):
-            bart = {k: v for k, v in bart.items() if k in trace}
+        if inner_callback is not None:
+            i_skip = _compute_i_skip(i_total, n_burn, n_skip)
+            rt = inner_callback(
+                bart=bart,
+                burnin=burnin,
+                overflow=i_total >= n_burn + n_save * n_skip,
+                i_total=i_total,
+                i_skip=i_skip,
+                callback_state=callback_state,
+                n_burn=n_burn,
+                n_save=n_save,
+                n_skip=n_skip,
+                i_outer=i_outer,
+                inner_loop_length=inner_loop_length,
+            )
+            if rt is not None:
+                bart, callback_state = rt
+        i_onlymain = jnp.where(burnin, 0, (i_total - n_burn) // n_skip)
+        i_both = jnp.where(burnin, i_total, n_burn + i_onlymain)
+        def update_trace(index, trace, state):
             def assign_at_index(trace_array, state_array):
                 if trace_array.size:
                     return trace_array.at[index, ...].set(state_array)
@@ -147,84 +308,176 @@ def run_mcmc(key, bart, n_burn, n_save, n_skip, callback):
                     # of length 0
                     return trace_array
-            return tree.map(assign_at_index, trace, bart)
+            return tree.map(assign_at_index, trace, state)
-        trace_heavy = update_trace(i_heavy, trace_heavy, bart)
-        trace_light = update_trace(i_light, trace_light, bart)
+        trace_onlymain = update_trace(
+            i_onlymain, trace_onlymain, onlymain_extractor(bart)
+        )
+        trace_both = update_trace(i_both, trace_both, both_extractor(bart))
         i_total += 1
-        carry = (bart, i_total, key, trace_light, trace_heavy)
+        carry = (bart, i_total, key, trace_both, trace_onlymain, callback_state)
         return carry, None
-    carry, _ = lax.scan(loop, carry, None, n_burn + n_skip * n_save)
-    bart, _, _, trace_light, trace_heavy = carry
+    carry, _ = lax.scan(loop, carry, None, inner_loop_length)
+    return carry
-    burnin_trace = tree.map(lambda x: x[:n_burn, ...], trace_light)
-    main_trace = tree.map(lambda x: x[n_burn:, ...], trace_light)
-    main_trace.update(trace_heavy)
-    return bart, burnin_trace, main_trace
-@functools.lru_cache
-# cache to make the callback function object unique, such that the jit
-# of run_mcmc recognizes it
-def make_simple_print_callback(printevery):
+def make_print_callbacks(dot_every_inner=1, report_every_outer=1):
     """
-    Create a logging callback function for MCMC iterations.
+    Prepare logging callbacks for `run_mcmc`.
+    Prepare callbacks which print a dot on every iteration, and a longer
+    report on every outer loop iteration.
     Parameters
     ----------
-    printevery : int
-        The number of iterations between each log.
+    dot_every_inner : int, default 1
+        A dot is printed every `dot_every_inner` MCMC iterations.
+    report_every_outer : int, default 1
+        A report is printed every `report_every_outer` outer loop
+        iterations.
     Returns
     -------
-    callback : callable
-        A function in the format required by `run_mcmc`.
+    kwargs : dict
+        A dictionary with the arguments to pass to `run_mcmc` as keyword
+        arguments to set up the callbacks.
+    Examples
+    --------
+    >>> run_mcmc(..., **make_print_callbacks())
     """
+    return dict(
+        inner_callback=_print_callback_inner,
+        outer_callback=_print_callback_outer,
+        callback_state=dict(
+            dot_every_inner=dot_every_inner, report_every_outer=report_every_outer
+        ),
+    )
+def _print_callback_inner(*, i_total, callback_state, **_):
+    dot_every_inner = callback_state['dot_every_inner']
+    if dot_every_inner is not None:
+        cond = (i_total + 1) % dot_every_inner == 0
+        debug.callback(_print_dot, cond)
+def _print_dot(cond):
+    if cond:
+        print('.', end='', flush=True)
-    def callback(*, bart, burnin, i_total, i_skip, n_burn, n_save, n_skip):
-        prop_total = len(bart['leaf_trees'])
-        grow_prop = bart['grow_prop_count'] / prop_total
-        prune_prop = bart['prune_prop_count'] / prop_total
-        grow_acc = bart['grow_acc_count'] / bart['grow_prop_count']
-        prune_acc = bart['prune_acc_count'] / bart['prune_prop_count']
-        n_total = n_burn + n_save * n_skip
-        printcond = (i_total + 1) % printevery == 0
+def _print_callback_outer(
+    *,
+    bart,
+    burnin,
+    overflow,
+    i_total,
+    n_burn,
+    n_save,
+    n_skip,
+    callback_state,
+    i_outer,
+    inner_loop_length,
+    **_,
+):
+    report_every_outer = callback_state['report_every_outer']
+    if report_every_outer is not None:
+        dot_every_inner = callback_state['dot_every_inner']
+        if dot_every_inner is None:
+            newline = False
+        else:
+            newline = dot_every_inner < inner_loop_length
         debug.callback(
-            _simple_print_callback,
-            burnin,
-            i_total,
-            n_total,
-            grow_prop,
-            grow_acc,
-            prune_prop,
-            prune_acc,
-            printcond,
+            _print_report,
+            cond=(i_outer + 1) % report_every_outer == 0,
+            newline=newline,
+            burnin=burnin,
+            overflow=overflow,
+            i_total=i_total,
+            n_iters=n_burn + n_save * n_skip,
+            grow_prop_count=bart.forest.grow_prop_count,
+            grow_acc_count=bart.forest.grow_acc_count,
+            prune_prop_count=bart.forest.prune_prop_count,
+            prune_acc_count=bart.forest.prune_acc_count,
+            prop_total=len(bart.forest.leaf_trees),
+            fill=grove.forest_fill(bart.forest.split_trees),
         )
-    return callback
+def _convert_jax_arrays_in_args(func):
+    """Remove jax arrays from a function's arguments.
-def _simple_print_callback(
-    burnin, i_total, n_total, grow_prop, grow_acc, prune_prop, prune_acc, printcond
+    Converts all jax.Array instances in the arguments to either Python scalars
+    or numpy arrays.
+    """
+    def convert_jax_arrays(pytree):
+        def convert_jax_arrays(val):
+            if not isinstance(val, jax.Array):
+                return val
+            elif val.shape:
+                return numpy.array(val)
+            else:
+                return val.item()
+        return tree.map(convert_jax_arrays, pytree)
+    @functools.wraps(func)
+    def new_func(*args, **kw):
+        args = convert_jax_arrays(args)
+        kw = convert_jax_arrays(kw)
+        return func(*args, **kw)
+    return new_func
+@_convert_jax_arrays_in_args
+# convert all jax arrays in arguments because operations on them could lead to
+# deadlock with the main thread
+def _print_report(
+    *,
+    cond,
+    newline,
+    burnin,
+    overflow,
+    i_total,
+    n_iters,
+    grow_prop_count,
+    grow_acc_count,
+    prune_prop_count,
+    prune_acc_count,
+    prop_total,
+    fill,
 ):
-    if printcond:
-        burnin_flag = ' (burnin)' if burnin else ''
-        total_str = str(n_total)
-        ndigits = len(total_str)
-        i_str = str(i_total.item() + 1).rjust(ndigits)
-        # I do i_total.item() + 1 instead of just i_total + 1 to solve a bug
-        # originating when jax is combined with some outdated dependencies. (I
-        # did not track down which dependencies exactly.) Doing .item() makes
-        # the + 1 operation be done by Python instead of by jax. The bug is that
-        # jax hangs completely, with a secondary thread blocked at this line.
+    if cond:
+        newline = '\n' if newline else ''
+        def acc_string(acc_count, prop_count):
+            if prop_count:
+                return f'{acc_count / prop_count:.0%}'
+            else:
+                return ' n/d'
+        grow_prop = grow_prop_count / prop_total
+        prune_prop = prune_prop_count / prop_total
+        grow_acc = acc_string(grow_acc_count, grow_prop_count)
+        prune_acc = acc_string(prune_acc_count, prune_prop_count)
+        if burnin:
+            flag = ' (burnin)'
+        elif overflow:
+            flag = ' (overflow)'
+        else:
+            flag = ''
         print(
-            f'Iteration {i_str}/{total_str} '
-            f'P_grow={grow_prop:.2f} P_prune={prune_prop:.2f} '
-            f'A_grow={grow_acc:.2f} A_prune={prune_acc:.2f}{burnin_flag}'
+            f'{newline}It {i_total + 1}/{n_iters} '
+            f'grow P={grow_prop:.0%} A={grow_acc}, '
+            f'prune P={prune_prop:.0%} A={prune_acc}, '
+            f'fill={fill:.0%}{flag}'
         )
@@ -248,11 +501,11 @@ def evaluate_trace(trace, X):
     evaluate_trees = functools.partial(grove.evaluate_forest, sum_trees=False)
     evaluate_trees = jaxext.autobatch(evaluate_trees, 2**29, (None, 0, 0, 0))
-    def loop(_, state):
+    def loop(_, row):
         values = evaluate_trees(
-            X, state['leaf_trees'], state['var_trees'], state['split_trees']
+            X, row['leaf_trees'], row['var_trees'], row['split_trees']
         )
-        return None, jnp.sum(values, axis=0, dtype=jnp.float32)
+        return None, row['offset'] + jnp.sum(values, axis=0, dtype=jnp.float32)
     _, y = lax.scan(loop, None, trace)
     return y

bartz 0.5.0__py3-none-any.whl → 0.6.0__py3-none-any.whl

bartz 0.5.0__py3-none-any.whl → 0.6.0__py3-none-any.whl