PyPI - dask-array - Versions diffs - 0.1.0__py3-none-any.whl - Mend

dask-array 0.1.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (144) hide show

dask_array/__init__.py +228 -0
dask_array/_backends.py +76 -0
dask_array/_backends_array.py +99 -0
dask_array/_blockwise.py +1410 -0
dask_array/_broadcast.py +272 -0
dask_array/_chunk.py +445 -0
dask_array/_chunk_types.py +54 -0
dask_array/_collection.py +1644 -0
dask_array/_concatenate.py +331 -0
dask_array/_core_utils.py +1365 -0
dask_array/_dispatch.py +141 -0
dask_array/_einsum.py +277 -0
dask_array/_expr.py +544 -0
dask_array/_expr_flow.py +586 -0
dask_array/_gufunc.py +805 -0
dask_array/_histogram.py +617 -0
dask_array/_map_blocks.py +652 -0
dask_array/_new_collection.py +10 -0
dask_array/_numpy_compat.py +135 -0
dask_array/_overlap.py +1159 -0
dask_array/_rechunk.py +1050 -0
dask_array/_reshape.py +710 -0
dask_array/_routines.py +102 -0
dask_array/_shuffle.py +448 -0
dask_array/_stack.py +264 -0
dask_array/_svg.py +291 -0
dask_array/_templates.py +29 -0
dask_array/_test_utils.py +257 -0
dask_array/_ufunc.py +385 -0
dask_array/_utils.py +349 -0
dask_array/_visualize.py +223 -0
dask_array/_xarray.py +337 -0
dask_array/core/__init__.py +34 -0
dask_array/core/_blockwise_funcs.py +312 -0
dask_array/core/_conversion.py +422 -0
dask_array/core/_from_graph.py +97 -0
dask_array/creation/__init__.py +71 -0
dask_array/creation/_arange.py +121 -0
dask_array/creation/_diag.py +116 -0
dask_array/creation/_diagonal.py +241 -0
dask_array/creation/_eye.py +103 -0
dask_array/creation/_linspace.py +102 -0
dask_array/creation/_mesh.py +134 -0
dask_array/creation/_ones_zeros.py +454 -0
dask_array/creation/_pad.py +270 -0
dask_array/creation/_repeat.py +55 -0
dask_array/creation/_tile.py +36 -0
dask_array/creation/_tri.py +28 -0
dask_array/creation/_utils.py +296 -0
dask_array/fft.py +320 -0
dask_array/io/__init__.py +39 -0
dask_array/io/_base.py +10 -0
dask_array/io/_from_array.py +257 -0
dask_array/io/_from_delayed.py +95 -0
dask_array/io/_from_graph.py +54 -0
dask_array/io/_from_npy_stack.py +67 -0
dask_array/io/_store.py +336 -0
dask_array/io/_tiledb.py +159 -0
dask_array/io/_to_npy_stack.py +65 -0
dask_array/io/_zarr.py +449 -0
dask_array/linalg/__init__.py +39 -0
dask_array/linalg/_cholesky.py +234 -0
dask_array/linalg/_lu.py +300 -0
dask_array/linalg/_norm.py +94 -0
dask_array/linalg/_qr.py +601 -0
dask_array/linalg/_solve.py +349 -0
dask_array/linalg/_svd.py +394 -0
dask_array/linalg/_tensordot.py +334 -0
dask_array/linalg/_utils.py +74 -0
dask_array/manipulation/__init__.py +45 -0
dask_array/manipulation/_expand.py +321 -0
dask_array/manipulation/_flip.py +92 -0
dask_array/manipulation/_roll.py +78 -0
dask_array/manipulation/_transpose.py +309 -0
dask_array/random/__init__.py +125 -0
dask_array/random/_choice.py +181 -0
dask_array/random/_expr.py +256 -0
dask_array/random/_generator.py +441 -0
dask_array/random/_random_state.py +259 -0
dask_array/random/_utils.py +84 -0
dask_array/reductions/__init__.py +84 -0
dask_array/reductions/_arg_reduction.py +130 -0
dask_array/reductions/_common.py +1082 -0
dask_array/reductions/_cumulative.py +522 -0
dask_array/reductions/_percentile.py +261 -0
dask_array/reductions/_reduction.py +725 -0
dask_array/reductions/_trace.py +56 -0
dask_array/routines/__init__.py +133 -0
dask_array/routines/_apply.py +84 -0
dask_array/routines/_bincount.py +112 -0
dask_array/routines/_broadcast.py +111 -0
dask_array/routines/_coarsen.py +115 -0
dask_array/routines/_diff.py +79 -0
dask_array/routines/_gradient.py +158 -0
dask_array/routines/_indexing.py +65 -0
dask_array/routines/_insert_delete.py +132 -0
dask_array/routines/_misc.py +122 -0
dask_array/routines/_nonzero.py +72 -0
dask_array/routines/_search.py +123 -0
dask_array/routines/_select.py +113 -0
dask_array/routines/_statistics.py +171 -0
dask_array/routines/_topk.py +82 -0
dask_array/routines/_triangular.py +74 -0
dask_array/routines/_unique.py +232 -0
dask_array/routines/_where.py +62 -0
dask_array/slicing/__init__.py +67 -0
dask_array/slicing/_basic.py +550 -0
dask_array/slicing/_blocks.py +138 -0
dask_array/slicing/_bool_index.py +145 -0
dask_array/slicing/_setitem.py +329 -0
dask_array/slicing/_squeeze.py +101 -0
dask_array/slicing/_utils.py +1133 -0
dask_array/slicing/_vindex.py +282 -0
dask_array/stacking/__init__.py +15 -0
dask_array/stacking/_block.py +83 -0
dask_array/stacking/_simple.py +58 -0
dask_array/templates/array.html.j2 +48 -0
dask_array/tests/__init__.py +0 -0
dask_array/tests/conftest.py +22 -0
dask_array/tests/test_api.py +40 -0
dask_array/tests/test_binary_op_chunks.py +107 -0
dask_array/tests/test_coarse_slice_through_blockwise.py +362 -0
dask_array/tests/test_collection.py +799 -0
dask_array/tests/test_creation.py +1102 -0
dask_array/tests/test_expr_flow.py +143 -0
dask_array/tests/test_linalg.py +1130 -0
dask_array/tests/test_map_blocks_multi_output.py +104 -0
dask_array/tests/test_rechunk_pushdown.py +214 -0
dask_array/tests/test_reductions.py +1091 -0
dask_array/tests/test_routines.py +2853 -0
dask_array/tests/test_shuffle_chunks.py +67 -0
dask_array/tests/test_slice_pushdown.py +968 -0
dask_array/tests/test_slice_through_blockwise.py +678 -0
dask_array/tests/test_slice_through_overlap.py +366 -0
dask_array/tests/test_slice_through_reshape.py +272 -0
dask_array/tests/test_slicing.py +839 -0
dask_array/tests/test_transpose_slice_pushdown.py +208 -0
dask_array/tests/test_visualize.py +94 -0
dask_array/tests/test_xarray.py +193 -0
dask_array-0.1.0.dist-info/METADATA +48 -0
dask_array-0.1.0.dist-info/RECORD +144 -0
dask_array-0.1.0.dist-info/WHEEL +4 -0
dask_array-0.1.0.dist-info/entry_points.txt +2 -0
dask_array-0.1.0.dist-info/licenses/LICENSE +29 -0

dask_array/_overlap.py ADDED Viewed

@@ -0,0 +1,1159 @@
+from __future__ import annotations
+import functools
+import warnings
+from functools import reduce
+from numbers import Integral, Number
+from operator import mul
+import numpy as np
+from tlz import concat, get, partial
+from tlz.curried import map
+from dask_array._new_collection import new_collection
+from dask_array import _chunk as chunk
+from dask_array._collection import Array, concatenate
+from dask_array._expr import ArrayExpr, unify_chunks_expr
+from dask_array._map_blocks import map_blocks
+from dask_array.creation import empty_like, full_like, repeat
+from dask_array._shuffle import _calculate_new_chunksizes
+from dask_array._numpy_compat import normalize_axis_tuple
+from dask_array._utils import compute_meta, meta_from_array
+from dask.layers import ArrayOverlapLayer
+from dask.utils import derived_from, ensure_dict
+def _overlap_internal_chunks(original_chunks, axes):
+    """Compute per-axis chunk sizes once neighbouring blocks share edges.
+    Parameters
+    ----------
+    original_chunks: sequence of sequences of int
+        Chunk sizes before overlapping, one entry per axis.
+    axes: dict
+        Maps axis number to overlap depth. A depth is either one number
+        (used on both sides) or a ``(left, right)`` tuple. Axes missing
+        from the dict get a depth of 0.
+    Returns
+    -------
+    list
+        One entry per axis. An axis made of a single chunk is passed
+        through unchanged; any other axis becomes a new list of sizes.
+    """
+    grown = []
+    for axis, sizes in enumerate(original_chunks):
+        depth = axes.get(axis, 0)
+        before, after = (depth[0], depth[1]) if isinstance(depth, tuple) else (depth, depth)
+        if len(sizes) == 1:
+            # A lone chunk has no neighbour to borrow cells from.
+            grown.append(sizes)
+            continue
+        # The first chunk only gains cells from the chunk after it and the
+        # last chunk only from the chunk before it; interior chunks gain
+        # cells on both sides.
+        first = sizes[0] + after
+        last = sizes[-1] + before
+        interior = [size + before + after for size in sizes[1:-1]]
+        grown.append([first, *interior, last])
+    return grown
+def overlap_internal(x, axes):
+    """Build the collection in which adjacent blocks of ``x`` share edges.
+    Parameters
+    ----------
+    x: da.Array
+        The dask array whose blocks should overlap.
+    axes: dict
+        Number of cells to share along each axis, keyed by axis number.
+        For example ``{0: 2, 2: 5}`` shares two cells along axis 0 and
+        five cells along axis 2.
+    Returns
+    -------
+    The collection created by ``new_collection`` around an
+    ``OverlapInternal`` expression over ``x``.
+    """
+    expr = OverlapInternal(x, axes)
+    return new_collection(expr)
+class OverlapInternal(ArrayExpr):
+    """Expression whose blocks carry copies of their neighbours' edge cells.
+    This is a low-level building block. The user-facing operation is
+    represented by MapOverlap.
+    """
+    _parameters = ["array", "axes"]
+    @functools.cached_property
+    def _meta(self):
+        # The meta is derived directly from the input array.
+        source = self.array
+        return meta_from_array(source)
+    @functools.cached_property
+    def chunks(self):
+        # The helper returns a tuple or a list per axis; normalise to tuples.
+        per_axis = _overlap_internal_chunks(self.array.chunks, self.axes)
+        return tuple(tuple(sizes) for sizes in per_axis)
+    @functools.cached_property
+    def _name(self) -> str:
+        return "overlap-{}".format(super()._name)
+    def _layer(self) -> dict:
+        """Materialise the overlap graph layer as a plain dict."""
+        source = self.array
+        # Everything after the first "-" of this expression's name, i.e. the
+        # name without its "overlap" prefix.
+        token = self._name.partition("-")[2]
+        layer = ArrayOverlapLayer(
+            name=source.name,
+            axes=self.axes,
+            chunks=source.chunks,
+            numblocks=source.numblocks,
+            token=token,
+        )
+        return ensure_dict(layer)
+class MapOverlap(ArrayExpr):
+    """Logical expression for the full map_overlap operation.
+    This captures the user's intent: apply func with overlap depth/boundary,
+    optionally trimming the result. Keeping the operation as one expression
+    lets a slice applied to the result be pushed down onto the inputs.
+    Note: new_axis/drop_axis cases are handled by _map_overlap_direct instead.
+    The expression is lowered to the full pipeline during _lower():
+    rechunk -> boundaries -> overlap_internal -> map_blocks -> trim
+    """
+    _parameters = [
+        "arrays",  # tuple of input ArrayExpr
+        "func",  # callable
+        "depth",  # list of dicts (one per array)
+        "boundary",  # list of dicts (one per array)
+        "trim_output",  # bool
+        "allow_rechunk",  # bool
+        "kwargs",  # dict for map_blocks kwargs
+    ]
+    _defaults = {
+        "trim_output": True,
+        "allow_rechunk": True,
+        "kwargs": None,
+    }
+    @functools.cached_property
+    def _meta(self):
+        """Meta of the output.
+        Resolution order: explicit ``meta`` kwarg, explicit ``dtype`` kwarg,
+        inference through ``compute_meta``, then the primary array's meta.
+        """
+        meta = self._kwargs.get("meta")
+        if meta is not None:
+            return meta_from_array(meta)
+        dtype = self._kwargs.get("dtype")
+        if dtype is not None:
+            return np.empty((0,) * self.ndim, dtype=dtype)
+        # Inference is best-effort: a user function may fail on the inputs
+        # compute_meta feeds it, in which case we fall back to the primary
+        # array's meta instead of failing graph construction.
+        try:
+            arr_collections = [new_collection(a) for a in self.arrays]
+            meta = compute_meta(self.func, None, *arr_collections)
+            if meta is not None:
+                return meta
+        except Exception:
+            pass
+        return meta_from_array(self._get_primary_array())
+    @property
+    def _kwargs(self):
+        """The map_blocks keyword arguments, never None."""
+        return self.kwargs if self.kwargs is not None else {}
+    def _get_primary_index(self):
+        """Get the index of the primary array (highest rank, first if tied)."""
+        return max(enumerate(self.arrays), key=lambda x: (x[1].ndim, -x[0]))[0]
+    def _get_primary_array(self):
+        """Get the primary array (highest rank, first if tied) for shape/chunk info."""
+        return self.arrays[self._get_primary_index()]
+    @functools.cached_property
+    def shape(self):
+        # Output shape = input shape (no new_axis/drop_axis in this expr)
+        return self._get_primary_array().shape
+    @functools.cached_property
+    def chunks(self):
+        # If allow_rechunk, the input is rechunked to ensure minimum chunk size >= depth
+        primary_idx = self._get_primary_index()
+        primary = self.arrays[primary_idx]
+        if self.allow_rechunk:
+            return _get_overlap_rechunked_chunks(new_collection(primary), self.depth[primary_idx])
+        return primary.chunks
+    @functools.cached_property
+    def _name(self) -> str:
+        return f"map-overlap-{super()._name}"
+    def _axis_is_periodic(self, axis):
+        """Return True if any input uses the 'periodic' boundary along ``axis``."""
+        for bnd in self.boundary:
+            kind = bnd.get(axis, "none")
+            # Boundary entries may be arbitrary fill values, so only compare
+            # actual strings against the keyword.
+            if isinstance(kind, str) and kind == "periodic":
+                return True
+        return False
+    def _simplify_up(self, parent, dependents):
+        """Push slice through MapOverlap.
+        For a slice on MapOverlap:
+        - Non-overlap axes: push slice directly to inputs
+        - Overlap axes: expand slice by depth, push to inputs, leave trim at top
+        Returns None (no rewrite) whenever the pushdown cannot be shown to
+        preserve the result: the parent is not a plain slice, the index
+        contains None/integers/non-unit steps, the inputs differ in shape or
+        depth, or a periodic axis would lose its wrap-around halo.
+        """
+        from dask_array.slicing import SliceSlicesIntegers
+        if not isinstance(parent, SliceSlicesIntegers):
+            return None
+        # One index is applied to every input and only one depth dict is
+        # consulted, so the rewrite is only valid when all inputs agree on
+        # shape and depth. Otherwise leave the expression alone.
+        first = self.arrays[0]
+        if any(arr.shape != first.shape for arr in self.arrays[1:]):
+            return None
+        depth = self.depth[0]
+        if any(other != depth for other in self.depth[1:]):
+            return None
+        index = parent.index
+        ndim = first.ndim
+        # Don't handle None (newaxis) or integers (dimension reduction)
+        if any(idx is None or isinstance(idx, Integral) for idx in index):
+            return None
+        # Pad index to full length
+        full_index = list(index) + [slice(None)] * (ndim - len(index))
+        output_trim_index = []
+        needs_trim = False
+        for axis in range(ndim):
+            idx = full_index[axis]
+            if not isinstance(idx, slice):
+                return None  # Unexpected index type
+            if idx == slice(None):
+                output_trim_index.append(slice(None))
+                continue
+            # Get actual depth (handle tuple for asymmetric overlap)
+            d = depth.get(axis, 0)
+            if isinstance(d, tuple):
+                left_depth, right_depth = d
+            else:
+                left_depth = right_depth = d
+            # Normalize the slice
+            start, stop, step = idx.indices(self.shape[axis])
+            if step != 1:
+                return None  # Don't handle non-unit steps
+            if max(left_depth, right_depth) == 0:
+                # No overlap on this axis - the slice is pushed as-is
+                output_trim_index.append(slice(None))
+                continue
+            # Expand slice by overlap depth for input, but respect array
+            # boundaries
+            input_size = first.shape[axis]
+            wanted_start = start - left_depth
+            wanted_stop = stop + right_depth
+            expanded_start = max(0, wanted_start)
+            expanded_stop = min(input_size, wanted_stop)
+            clamped = expanded_start != wanted_start or expanded_stop != wanted_stop
+            if clamped and self._axis_is_periodic(axis):
+                # Part of the halo lies past the array edge. A periodic
+                # boundary fills it from the opposite end of the *array*,
+                # but after slicing it would be filled from the opposite
+                # end of the *slice*, changing the result.
+                return None
+            full_index[axis] = slice(expanded_start, expanded_stop)
+            # Compute trim slice to get original result
+            trim_start = start - expanded_start
+            trim_stop = trim_start + (stop - start)
+            output_trim_index.append(slice(trim_start, trim_stop))
+            needs_trim = True
+        # Slice all input arrays
+        pushed_index = tuple(full_index)
+        new_arrays = tuple(new_collection(arr)[pushed_index].expr for arr in self.arrays)
+        # Create new MapOverlap with sliced inputs
+        new_expr = MapOverlap(
+            arrays=new_arrays,
+            func=self.func,
+            depth=self.depth,
+            boundary=self.boundary,
+            trim_output=self.trim_output,
+            allow_rechunk=self.allow_rechunk,
+            kwargs=self.kwargs,
+        )
+        if not needs_trim:
+            return new_expr
+        # Cut the extra halo cells back off the output
+        return SliceSlicesIntegers(new_expr, tuple(output_trim_index), parent.allow_getitem_optimization)
+    def _lower(self):
+        """Expand to the full overlap pipeline.
+        This expands to: rechunk -> boundaries -> overlap_internal -> map_blocks -> trim
+        """
+        # Apply overlap to each input array
+        overlapped = [
+            overlap(new_collection(arr), depth=d, boundary=b, allow_rechunk=self.allow_rechunk).expr
+            for arr, d, b in zip(self.arrays, self.depth, self.boundary)
+        ]
+        # Build map_blocks expression
+        result = map_blocks(self.func, *[new_collection(a) for a in overlapped], **self._kwargs)
+        if self.trim_output:
+            # The highest-rank array (first if tied) decides the trim settings
+            i = max(enumerate(overlapped), key=lambda v: (v[1].ndim, -v[0]))[0]
+            trim_depth = dict(self.depth[i])
+            trim_boundary = dict(self.boundary[i])
+            result = trim_internal(result, trim_depth, trim_boundary)
+        return result.expr
+def trim_overlap(x, depth, boundary=None):
+    """Remove the overlapping cells from the sides of every block.
+    Pairs with ``map_overlap``, which may leave excess data on each block.
+    Parameters
+    ----------
+    x: da.Array
+        Array whose blocks still carry overlap cells.
+    depth:
+        Overlap depth; passed through ``coerce_depth`` together with
+        ``x.ndim`` before trimming.
+    boundary: optional
+        Boundary specification, forwarded unchanged to ``trim_internal``.
+    See also
+    --------
+    dask.array.overlap.map_overlap
+    """
+    # trim_internal expects the coerced form of the depth.
+    coerced_depth = coerce_depth(x.ndim, depth)
+    return trim_internal(x, axes=coerced_depth, boundary=boundary)
+def trim_internal(x, axes, boundary=None):
+    """Cut the overlap cells off each block of ``x``.
+    Pairs with the overlap operation, which may leave excess data on each
+    block. The output chunk sizes are computed here and the per-block
+    slicing is done by ``_trim`` through ``map_blocks``.
+    Parameters
+    ----------
+    x: da.Array
+        Array whose blocks carry overlap cells.
+    axes: dict
+        Overlap depth per axis; a number or a ``(front, back)`` tuple.
+        Missing axes count as depth 0.
+    boundary: optional
+        Boundary specification; coerced with ``coerce_boundary``.
+    See also
+    --------
+    dask.array.chunk.trim
+    dask.array.map_blocks
+    """
+    boundary = coerce_boundary(x.ndim, boundary)
+    trimmed_chunks = []
+    for axis, sizes in enumerate(x.chunks):
+        kind = boundary.get(axis, "none")
+        depth = axes.get(axis, 0)
+        is_pair = isinstance(depth, tuple)
+        last = len(sizes) - 1
+        new_sizes = []
+        for position, size in enumerate(sizes):
+            if kind != "none":
+                # With a boundary every block, edge blocks included, loses
+                # cells on both sides.
+                size = size - (sum(depth) if is_pair else depth * 2)
+            else:
+                # Without a boundary the outer face of the first and last
+                # block is left untouched.
+                front, back = (depth[0], depth[1]) if is_pair else (depth, depth)
+                if position != 0:
+                    size = size - front
+                if position != last:
+                    size = size - back
+            new_sizes.append(size)
+        trimmed_chunks.append(tuple(new_sizes))
+    return map_blocks(
+        partial(_trim, axes=axes, boundary=boundary),
+        x,
+        chunks=tuple(trimmed_chunks),
+        dtype=x.dtype,
+        meta=x._meta,
+    )
+def _trim(x, axes, boundary, _overlap_trim_info):
+    """Slice the overlap cells off a single block.
+    Similar to dask.array.chunk.trim but the boundary condition must be
+    given. ``axes`` and ``boundary`` are assumed to have been coerced.
+    Parameters
+    ----------
+    x:
+        The block to trim.
+    axes: dict
+        Overlap depth per axis; a number or a ``(front, back)`` tuple.
+    boundary: dict
+        Boundary kind per axis; missing axes count as ``"none"``.
+    _overlap_trim_info: sequence
+        Element 0 is the block's location per axis, element 1 the number of
+        blocks per axis.
+    """
+    location, block_counts = _overlap_trim_info[0], _overlap_trim_info[1]
+    depths = [axes.get(dim, 0) for dim in range(x.ndim)]
+    index = []
+    for dim, (position, count, depth) in enumerate(zip(location, block_counts, depths)):
+        if isinstance(depth, tuple):
+            front = depth[0]
+            back = -depth[1] if depth[1] else None
+        else:
+            front = depth
+            # A zero depth must become None: slice(..., -0) would be empty.
+            back = -depth if isinstance(depth, Integral) and depth else None
+        if boundary.get(dim, "none") == "none":
+            # No boundary cells were added, so the outer face of the first
+            # and last block along this axis has nothing to trim.
+            if position == 0:
+                front = 0
+            if position == count - 1:
+                back = None
+        index.append(slice(front, back))
+    return x[tuple(index)]
+def periodic(x, axis, depth):
+    """Wrap an array around along one axis.
+    The first ``depth`` cells along ``axis`` are appended after the end and
+    the last ``depth`` cells are prepended before the start, which gives
+    periodic boundary conditions for overlap.
+    """
+    everything = slice(None, None, None)
+    leading = (everything,) * axis
+    trailing = (everything,) * (x.ndim - axis - 1)
+    head = x[leading + (slice(0, depth),) + trailing]
+    tail = x[leading + (slice(-depth, None),) + trailing]
+    # Each border piece is rechunked to a single chunk along ``axis``.
+    head, tail = _remove_overlap_boundaries(head, tail, axis, depth)
+    return concatenate([tail, x, head], axis=axis)
+def reflect(x, axis, depth):
+    """Mirror the edges of an array outwards along one axis.
+    Each side is extended with a reversed copy of the ``depth`` cells next
+    to it. This is the converse of ``periodic``.
+    """
+    everything = slice(None, None, None)
+    leading = (everything,) * axis
+    trailing = (everything,) * (x.ndim - axis - 1)
+    # Depth 1 selects the single first cell with a forward slice; larger
+    # depths walk backwards from cell ``depth - 1`` down to cell 0.
+    near_start = slice(0, 1) if depth == 1 else slice(depth - 1, None, -1)
+    # The last ``depth`` cells, in reversed order.
+    near_end = slice(-1, -depth - 1, -1)
+    before = x[leading + (near_start,) + trailing]
+    after = x[leading + (near_end,) + trailing]
+    before, after = _remove_overlap_boundaries(before, after, axis, depth)
+    return concatenate([before, x, after], axis=axis)
+def nearest(x, axis, depth):
+    """Extend an array by repeating its edge values outwards along one axis.
+    This mimics what the skimage.filters.gaussian_filter(... mode="nearest")
+    does.
+    """
+    everything = slice(None, None, None)
+    leading = (everything,) * axis
+    trailing = (everything,) * (x.ndim - axis - 1)
+    first_cell = leading + (slice(0, 1),) + trailing
+    last_cell = leading + (slice(-1, -2, -1),) + trailing
+    # Repeat each single edge cell ``depth`` times to build the padding.
+    before = repeat(x[first_cell], depth, axis=axis)
+    after = repeat(x[last_cell], depth, axis=axis)
+    before, after = _remove_overlap_boundaries(before, after, axis, depth)
+    return concatenate([before, x, after], axis=axis)
+def constant(x, axis, depth, value):
+    """Pad both ends of ``axis`` with ``depth`` cells holding ``value``."""
+    # The padding has the same chunks as ``x`` except for one chunk of
+    # length ``depth`` along the padded axis.
+    pad_chunks = list(x.chunks)
+    pad_chunks[axis] = (depth,)
+    pad_shape = tuple(sum(sizes) for sizes in pad_chunks)
+    padding = full_like(
+        x,
+        value,
+        shape=pad_shape,
+        chunks=tuple(pad_chunks),
+        dtype=x.dtype,
+    )
+    return concatenate([padding, x, padding], axis=axis)
+def _remove_overlap_boundaries(l, r, axis, depth):
+    """Rechunk both border pieces to one chunk of ``depth`` along ``axis``.
+    Returns the rechunked ``(l, r)`` pair; chunks on other axes are kept.
+    """
+    def _single_chunk(piece):
+        # Keep every axis as it is except ``axis``, which becomes (depth,).
+        target = list(piece.chunks)
+        target[axis] = (depth,)
+        return piece.rechunk(tuple(target))
+    return _single_chunk(l), _single_chunk(r)
+def boundaries(x, depth=None, kind=None):
+    """Pad an array with boundary cells before its blocks are overlapped.
+    Parameters
+    ----------
+    x: da.Array
+        The array to pad.
+    depth: dict or scalar
+        Number of boundary cells per axis. A non-dict value is applied to
+        every axis; axes with depth 0 are left alone.
+    kind: dict or scalar
+        Boundary kind per axis: ``"none"``, ``"periodic"``, ``"reflect"``,
+        ``"nearest"``, or any other value, which is used as a constant fill.
+        A non-dict value is applied to every axis.
+    See Also
+    --------
+    periodic
+    constant
+    """
+    if not isinstance(depth, dict):
+        depth = dict.fromkeys(range(x.ndim), depth)
+    if not isinstance(kind, dict):
+        kind = dict.fromkeys(range(x.ndim), kind)
+    for axis in range(x.ndim):
+        cells = depth.get(axis, 0)
+        if cells == 0:
+            continue
+        mode = kind.get(axis, "none")
+        if mode == "none":
+            continue
+        if mode == "periodic":
+            x = periodic(x, axis, cells)
+        elif mode == "reflect":
+            x = reflect(x, axis, cells)
+        elif mode == "nearest":
+            x = nearest(x, axis, cells)
+        elif axis in kind:
+            # Anything else is a fill value for constant padding.
+            x = constant(x, axis, cells, kind[axis])
+    return x
+def ensure_minimum_chunksize(size, chunks):
+    """Determine new chunks so that every chunk is at least ``size`` long.
+    Parameters
+    ----------
+    size: int
+        The minimum size every returned chunk must have.
+    chunks: tuple
+        Chunks along one axis, e.g. ``(3, 3, 2)``
+    Returns
+    -------
+    tuple
+        ``chunks`` itself when it already satisfies the minimum, otherwise
+        a new tuple with the same total length.
+    Raises
+    ------
+    ValueError
+        If the chunks together are shorter than ``size``.
+    Examples
+    --------
+    >>> ensure_minimum_chunksize(10, (20, 20, 1))
+    (20, 11, 10)
+    >>> ensure_minimum_chunksize(3, (1, 1, 3))
+    (5,)
+    See Also
+    --------
+    overlap
+    """
+    if min(chunks) >= size:
+        return chunks
+    merged = []
+    pending = 0  # length accumulated for the chunk currently being built
+    for width in chunks:
+        if width < size:
+            shortfall = size - width
+            if pending > size + shortfall:
+                # The pending chunk can give up ``shortfall`` cells and stay
+                # large enough: emit it shortened and let the small chunk
+                # grow to exactly ``size``.
+                merged.append(pending - shortfall)
+                pending = size
+            else:
+                # Otherwise fold the small chunk into the pending one.
+                pending += width
+        if pending >= size:
+            merged.append(pending)
+            pending = 0
+        if width >= size:
+            pending += width
+    if pending >= size:
+        merged.append(pending)
+    elif merged:
+        # A too-small remainder is absorbed by the last emitted chunk.
+        merged[-1] += pending
+    else:
+        raise ValueError(f"The overlapping depth {size} is larger than your array {sum(chunks)}.")
+    return tuple(merged)
+def _get_overlap_rechunked_chunks(x, depth2):
+    """Return chunks for ``x`` in which every chunk can hold the overlap depth.
+    Parameters
+    ----------
+    x: da.Array
+        Array whose ``chunks`` are inspected.
+    depth2: dict
+        Overlap depth keyed by axis number; a value is a number or a
+        ``(left, right)`` tuple, of which the larger side is used. Axes
+        missing from the dict need no minimum and keep their chunks.
+    Returns
+    -------
+    tuple
+        One chunk tuple per axis of ``x``.
+    """
+    new_chunks = []
+    for axis, sizes in enumerate(x.chunks):
+        # Look the depth up by axis key rather than relying on the dict's
+        # iteration order, so partial or unordered dicts stay aligned with
+        # the axes of ``x``.
+        d = depth2.get(axis, 0)
+        needed = max(d) if isinstance(d, tuple) else d
+        # rechunk if new chunks are needed to fit depth in every chunk
+        new_chunks.append(ensure_minimum_chunksize(needed, sizes))
+    return tuple(new_chunks)
+def overlap(x, depth, boundary, *, allow_rechunk=True):
+    """Share boundaries between neighboring blocks
+    Parameters
+    ----------
+    x: da.Array
+        A dask array
+    depth: dict
+        The size of the shared boundary per axis
+    boundary: dict
+        The boundary condition on each axis. Options are 'reflect', 'periodic',
+        'nearest', 'none', or an array value.  Such a value will fill the
+        boundary with that value.
+    allow_rechunk: bool, keyword only
+        If True, ``x`` is rechunked so that every chunk can hold the
+        requested depth. If False, a ``ValueError`` is raised when any
+        chunk is smaller than the depth along its axis.
+    The depth input informs how many cells to overlap between neighboring
+    blocks ``{0: 2, 2: 5}`` means share two cells in 0 axis, 5 cells in 2 axis.
+    Axes missing from this input will not be overlapped.
+    Any axis containing chunks smaller than depth will be rechunked if
+    possible, provided the keyword ``allow_rechunk`` is True (recommended).
+    Examples
+    --------
+    >>> import numpy as np
+    >>> import dask_array as da
+    >>> x = np.arange(64).reshape((8, 8))
+    >>> d = da.from_array(x, chunks=(4, 4))
+    >>> d.chunks
+    ((4, 4), (4, 4))
+    >>> g = da.overlap.overlap(d, depth={0: 2, 1: 1},
+    ...                       boundary={0: 100, 1: 'reflect'})
+    >>> g.chunks
+    ((8, 8), (6, 6))
+    >>> np.array(g)
+    array([[100, 100, 100, 100, 100, 100, 100, 100, 100, 100, 100, 100],
+           [100, 100, 100, 100, 100, 100, 100, 100, 100, 100, 100, 100],
+           [  0,   0,   1,   2,   3,   4,   3,   4,   5,   6,   7,   7],
+           [  8,   8,   9,  10,  11,  12,  11,  12,  13,  14,  15,  15],
+           [ 16,  16,  17,  18,  19,  20,  19,  20,  21,  22,  23,  23],
+           [ 24,  24,  25,  26,  27,  28,  27,  28,  29,  30,  31,  31],
+           [ 32,  32,  33,  34,  35,  36,  35,  36,  37,  38,  39,  39],
+           [ 40,  40,  41,  42,  43,  44,  43,  44,  45,  46,  47,  47],
+           [ 16,  16,  17,  18,  19,  20,  19,  20,  21,  22,  23,  23],
+           [ 24,  24,  25,  26,  27,  28,  27,  28,  29,  30,  31,  31],
+           [ 32,  32,  33,  34,  35,  36,  35,  36,  37,  38,  39,  39],
+           [ 40,  40,  41,  42,  43,  44,  43,  44,  45,  46,  47,  47],
+           [ 48,  48,  49,  50,  51,  52,  51,  52,  53,  54,  55,  55],
+           [ 56,  56,  57,  58,  59,  60,  59,  60,  61,  62,  63,  63],
+           [100, 100, 100, 100, 100, 100, 100, 100, 100, 100, 100, 100],
+           [100, 100, 100, 100, 100, 100, 100, 100, 100, 100, 100, 100]])
+    """
+    depth2 = coerce_depth(x.ndim, depth)
+    boundary2 = coerce_boundary(x.ndim, boundary)
+    # For asymmetric depths the larger side decides the minimum chunk size.
+    depths = [max(d) if isinstance(d, tuple) else d for d in depth2.values()]
+    if not allow_rechunk:
+        if any(min(c) < d for d, c in zip(depths, x.chunks)):
+            raise ValueError(
+                "Overlap depth is larger than smallest chunksize.\n"
+                "Please set allow_rechunk=True to rechunk automatically.\n"
+                f"Overlap depths required: {depths}\n"
+                f"Input chunks: {x.chunks}\n"
+            )
+        sized = x
+    else:
+        # rechunk if new chunks are needed to fit depth in every chunk
+        sized = x.rechunk(_get_overlap_rechunked_chunks(x, depth2))
+    padded = boundaries(sized, depth2, boundary2)
+    shared = overlap_internal(padded, depth2)
+    # Axes that received boundary cells are trimmed by twice their depth;
+    # axes with the "none" boundary are not trimmed here.
+    trim = {}
+    for axis, d in depth2.items():
+        trim[axis] = d * 2 if boundary2.get(axis, "none") != "none" else 0
+    return chunk.trim(shared, trim)
+def add_dummy_padding(x, depth, boundary):
+    """
+    Pads an array which has 'none' as the boundary type.
+    Used to simplify trimming arrays which use 'none'.
+    The padding is created with ``empty_like`` and merged into the first and
+    last chunk of each padded axis.
+    >>> import dask_array as da
+    >>> x = da.arange(6, chunks=3)
+    >>> add_dummy_padding(x, {0: 1}, {0: 'none'}).compute()  # doctest: +NORMALIZE_WHITESPACE
+    array([..., 0, 1, 2, 3, 4, 5, ...])
+    """
+    for axis, kind in boundary.items():
+        cells = depth.get(axis, 0)
+        if not (kind == "none" and cells > 0):
+            continue
+        # Target chunks: the original ones with the first and last chunk
+        # along ``axis`` each grown by the padding.
+        target_chunks = list(x.chunks)
+        along_axis = list(target_chunks[axis])
+        along_axis[0] += cells
+        along_axis[-1] += cells
+        target_chunks[axis] = tuple(along_axis)
+        # The padding block is ``cells`` long along ``axis`` and matches
+        # ``x`` on every other axis.
+        pad_shape = list(x.shape)
+        pad_shape[axis] = cells
+        pad_chunks = list(x.chunks)
+        pad_chunks[axis] = (cells,)
+        padding = empty_like(
+            getattr(x, "_meta", x),
+            shape=pad_shape,
+            chunks=pad_chunks,
+            dtype=x.dtype,
+        )
+        x = concatenate([padding, x, padding], axis=axis).rechunk(target_chunks)
+    return x
+def _map_overlap_direct(func, args, depth, boundary, trim, allow_rechunk, kwargs):
+    """Direct implementation of map_overlap without MapOverlap.
+    Used for cases with new_axis/drop_axis where MapOverlap doesn't apply.
+    Parameters
+    ----------
+    func: callable
+        Function applied to the overlapped blocks through ``map_blocks``.
+    args: sequence of arrays
+        Input arrays.
+    depth, boundary: sequences of dict
+        One depth dict and one boundary dict per input array.
+    trim: bool
+        Whether to trim the overlap from the result.
+    allow_rechunk: bool
+        Forwarded to ``overlap``.
+    kwargs: dict
+        Keyword arguments for ``map_blocks``; ``drop_axis`` and ``new_axis``
+        are also read here to remap the trim settings onto the output axes.
+    """
+    # Apply overlap to each input array
+    overlapped = [
+        overlap(x, depth=d, boundary=b, allow_rechunk=allow_rechunk) for x, d, b in zip(args, depth, boundary)
+    ]
+    # Apply the function via map_blocks
+    result = map_blocks(func, *overlapped, **kwargs)
+    if not trim:
+        return result
+    # Find highest-rank array (first if tied) for trim settings
+    i = sorted(enumerate(overlapped), key=lambda v: (v[1].ndim, -v[0]))[-1][0]
+    trim_depth = dict(depth[i])
+    trim_boundary = dict(boundary[i])
+    ndim_in = max(a.ndim for a in overlapped)
+    kept_ndim = overlapped[i].ndim
+    # Handle drop_axis: renumber the surviving input axes from 0
+    drop_axis = kwargs.get("drop_axis")
+    if drop_axis is not None:
+        if isinstance(drop_axis, Number):
+            drop_axis = [drop_axis]
+        drop_axis = [d % ndim_in for d in drop_axis]
+        kept_axes = tuple(ax for ax in range(overlapped[i].ndim) if ax not in drop_axis)
+        trim_depth = {n: trim_depth[ax] for n, ax in enumerate(kept_axes)}
+        trim_boundary = {n: trim_boundary[ax] for n, ax in enumerate(kept_axes)}
+        kept_ndim = len(kept_axes)
+    # Handle new_axis: open a gap with no overlap at each inserted position
+    new_axis = kwargs.get("new_axis")
+    if new_axis is not None:
+        if isinstance(new_axis, Number):
+            new_axis = [new_axis]
+        # new_axis positions refer to the output array, so normalise
+        # against the output rank; using the input rank would wrap an
+        # appended axis (position == input rank) around to 0.
+        ndim_out = kept_ndim + len(new_axis)
+        # Insert in ascending order so every position is final when used.
+        for axis in sorted(d % ndim_out for d in new_axis):
+            # Shift from the highest axis down; shifting upwards would
+            # overwrite an entry before it had been moved itself.
+            for existing_axis in sorted(trim_depth, reverse=True):
+                if existing_axis >= axis:
+                    trim_depth[existing_axis + 1] = trim_depth[existing_axis]
+                    trim_boundary[existing_axis + 1] = trim_boundary[existing_axis]
+            trim_depth[axis] = 0
+            trim_boundary[axis] = "none"
+    return trim_internal(result, trim_depth, trim_boundary)
def map_overlap(
    func,
    *args,
    depth=None,
    boundary=None,
    trim=True,
    align_arrays=True,
    allow_rechunk=True,
    **kwargs,
):
    """Map a function over blocks of arrays with some overlap

    We share neighboring zones between blocks of the array, map a
    function, and then trim away the neighboring strips. If depth is
    larger than any chunk along a particular axis, then the array is
    rechunked.

    Note that this function will attempt to automatically determine the output
    array type before computing it, please refer to the ``meta`` keyword argument
    in ``map_blocks`` if you expect that the function will not succeed when
    operating on 0-d arrays.

    Parameters
    ----------
    func: function
        The function to apply to each extended block.
        If multiple arrays are provided, then the function should expect to
        receive chunks of each array in the same order.
    args : dask arrays
    depth: int, tuple, dict or list, keyword only
        The number of elements that each block should share with its neighbors
        If a tuple or dict then this can be different per axis.
        If a list then each element of that list must be an int, tuple or dict
        defining depth for the corresponding array in `args`.
        Asymmetric depths may be specified using a dict value of (-/+) tuples.
        Note that asymmetric depths are currently only supported when
        ``boundary`` is 'none'.
        The default value is 0.
    boundary: str, tuple, dict or list, keyword only
        How to handle the boundaries.
        Values include 'reflect', 'periodic', 'nearest', 'none',
        or any constant value like 0 or np.nan.
        If a list then each element must be a str, tuple or dict defining the
        boundary for the corresponding array in `args`.
        The default value is 'none'.
    trim: bool, keyword only
        Whether or not to trim ``depth`` elements from each block after
        calling the map function.
        Set this to False if your mapping function already does this for you
    align_arrays: bool, keyword only
        Whether or not to align chunks along equally sized dimensions when
        multiple arrays are provided.  This allows for larger chunks in some
        arrays to be broken into smaller ones that match chunk sizes in other
        arrays such that they are compatible for block function mapping. If
        this is false, then an error will be thrown if arrays do not already
        have the same number of blocks in each dimension.
    allow_rechunk: bool, keyword only
        If False, a ``ValueError`` is raised when the requested overlap depth
        is larger than the smallest chunk along an axis, instead of the
        array being rechunked automatically.
    **kwargs:
        Other keyword arguments valid in ``map_blocks``

    Raises
    ------
    TypeError
        If ``func`` is not callable or any positional argument after it is
        not an array.
    NotImplementedError
        If an asymmetric (tuple) depth is combined with a boundary other
        than 'none' on the same axis.
    ValueError
        If ``allow_rechunk`` is False and a depth exceeds the smallest chunk
        size of the corresponding axis.

    Examples
    --------
    >>> import numpy as np
    >>> import dask_array as da

    >>> x = np.array([1, 1, 2, 3, 3, 3, 2, 1, 1])
    >>> x = da.from_array(x, chunks=5)
    >>> def derivative(x):
    ...     return x - np.roll(x, 1)

    >>> y = x.map_overlap(derivative, depth=1, boundary=0)
    >>> y.compute()
    array([ 1,  0,  1,  1,  0,  0, -1, -1,  0])

    >>> x = np.arange(16).reshape((4, 4))
    >>> d = da.from_array(x, chunks=(2, 2))
    >>> d.map_overlap(lambda x: x + x.size, depth=1, boundary='reflect').compute()
    array([[16, 17, 18, 19],
           [20, 21, 22, 23],
           [24, 25, 26, 27],
           [28, 29, 30, 31]])

    >>> func = lambda x: x + x.size
    >>> depth = {0: 1, 1: 1}
    >>> boundary = {0: 'reflect', 1: 'none'}
    >>> d.map_overlap(func, depth, boundary).compute()  # doctest: +NORMALIZE_WHITESPACE
    array([[12,  13,  14,  15],
           [16,  17,  18,  19],
           [20,  21,  22,  23],
           [24,  25,  26,  27]])

    The ``da.map_overlap`` function can also accept multiple arrays.

    >>> func = lambda x, y: x + y
    >>> x = da.arange(8).reshape(2, 4).rechunk((1, 2))
    >>> y = da.arange(4).rechunk(2)
    >>> da.map_overlap(func, x, y, depth=1, boundary='reflect').compute() # doctest: +NORMALIZE_WHITESPACE
    array([[ 0,  2,  4,  6],
           [ 4,  6,  8,  10]])

    When multiple arrays are given, they do not need to have the
    same number of dimensions but they must broadcast together.
    Arrays are aligned block by block (just as in ``da.map_blocks``)
    so the blocks must have a common chunk size.  This common chunking
    is determined automatically as long as ``align_arrays`` is True.

    >>> x = da.arange(8, chunks=4)
    >>> y = da.arange(8, chunks=2)
    >>> r = da.map_overlap(func, x, y, depth=1, boundary='reflect', align_arrays=True)
    >>> len(r.to_delayed())
    4

    >>> da.map_overlap(func, x, y, depth=1, boundary='reflect', align_arrays=False).compute()
    Traceback (most recent call last):
        ...
    ValueError: Shapes do not align {'.0': {2, 4}}

    Note also that this function is equivalent to ``map_blocks``
    by default.  A non-zero ``depth`` must be defined for any
    overlap to appear in the arrays provided to ``func``.

    >>> func = lambda x: x.sum()
    >>> x = da.ones(10, dtype='int')
    >>> block_args = dict(chunks=(), drop_axis=0)
    >>> da.map_blocks(func, x, **block_args).compute()
    np.int64(10)
    >>> da.map_overlap(func, x, **block_args, boundary='reflect').compute()
    np.int64(10)
    >>> da.map_overlap(func, x, **block_args, depth=1, boundary='reflect').compute()
    np.int64(12)

    For functions that may not handle 0-d arrays, it's also possible to specify
    ``meta`` with an empty array matching the type of the expected result. In
    the example below, ``func`` will result in an ``IndexError`` when computing
    ``meta``:

    >>> x = np.arange(16).reshape((4, 4))
    >>> d = da.from_array(x, chunks=(2, 2))
    >>> y = d.map_overlap(lambda x: x + x[2], depth=1, boundary='reflect', meta=np.array(()))
    >>> y
    dask.array<_trim, shape=(4, 4), dtype=float64, chunksize=(2, 2), chunktype=numpy.ndarray>
    >>> y.compute()
    array([[ 4,  6,  8, 10],
           [ 8, 10, 12, 14],
           [20, 22, 24, 26],
           [24, 26, 28, 30]])

    Similarly, it's possible to specify a non-NumPy array to ``meta``:

    >>> import cupy  # doctest: +SKIP
    >>> x = cupy.arange(16).reshape((4, 4))  # doctest: +SKIP
    >>> d = da.from_array(x, chunks=(2, 2))  # doctest: +SKIP
    >>> y = d.map_overlap(lambda x: x + x[2], depth=1, boundary='reflect', meta=cupy.array(()))  # doctest: +SKIP
    >>> y  # doctest: +SKIP
    dask.array<_trim, shape=(4, 4), dtype=float64, chunksize=(2, 2), chunktype=cupy.ndarray>
    >>> y.compute()  # doctest: +SKIP
    array([[ 4,  6,  8, 10],
           [ 8, 10, 12, 14],
           [20, 22, 24, 26],
           [24, 26, 28, 30]])
    """
    # Look for invocation using deprecated single-array signature
    # map_overlap(x, func, depth, boundary=None, trim=True, **kwargs)
    # ``args`` may be empty (e.g. ``map_overlap(x)``); check it before indexing
    # so that call falls through to the TypeError below rather than raising
    # an IndexError.
    if isinstance(func, Array) and args and callable(args[0]):
        warnings.warn(
            "The use of map_overlap(array, func, **kwargs) is deprecated since dask 2.17.0 "
            "and will be an error in a future release. To silence this warning, use the syntax "
            "map_overlap(func, array0,[ array1, ...,] **kwargs) instead.",
            FutureWarning,
            stacklevel=2,  # attribute the warning to the caller's line
        )
        # Positional layout of the deprecated signature after the array.
        sig = ["func", "depth", "boundary", "trim"]
        depth = get(sig.index("depth"), args, depth)
        boundary = get(sig.index("boundary"), args, boundary)
        trim = get(sig.index("trim"), args, trim)
        func, args = args[0], [func]

    if not callable(func):
        raise TypeError(
            f"First argument must be callable function, not {type(func).__name__}\n"
            "Usage:   da.map_overlap(function, x)\n"
            "   or:   da.map_overlap(function, x, y, z)"
        )
    if not all(isinstance(x, Array) for x in args):
        raise TypeError(
            f"All variadic arguments must be arrays, not {[type(x).__name__ for x in args]}\n"
            "Usage:   da.map_overlap(function, x)\n"
            "   or:   da.map_overlap(function, x, y, z)"
        )

    # Coerce depth and boundary arguments to lists of individual
    # specifications for each array argument
    def coerce(xs, arg, fn):
        if not isinstance(arg, list):
            arg = [arg] * len(xs)
        return [fn(x.ndim, a) for x, a in zip(xs, arg)]

    depth = coerce(args, depth, coerce_depth)
    boundary = coerce(args, boundary, coerce_boundary)

    # Align chunks in each array to a common size
    if align_arrays:
        # Reverse unification order to allow block broadcasting
        inds = [list(reversed(range(x.ndim))) for x in args]
        args = [a.expr for a in args]
        _, args, _ = unify_chunks_expr(*list(concat(zip(args, inds))))
        args = [new_collection(a) for a in args]

    # Escape to map_blocks if depth is zero (a more efficient computation)
    if all(all(depth_val == 0 for depth_val in d.values()) for d in depth):
        return map_blocks(func, *args, **kwargs)

    for i, x in enumerate(args):
        for j in range(x.ndim):
            if isinstance(depth[i][j], tuple) and boundary[i][j] != "none":
                raise NotImplementedError(
                    "Asymmetric overlap is currently only implemented "
                    "for boundary='none', however boundary for dimension "
                    f"{j} in array argument {i} is {boundary[i][j]}"
                )

    def assert_int_chunksize(xs):
        # Internal invariant: every chunk size must be a plain ``int``.
        assert all(type(c) is int for x in xs for cc in x.chunks for c in cc)

    assert_int_chunksize(args)

    # Validate chunk sizes if rechunking is not allowed
    if not allow_rechunk:
        for x, d in zip(args, depth):
            # For asymmetric (tuple) depths the larger side is the one that matters.
            depths = [max(dd) if isinstance(dd, tuple) else dd for dd in d.values()]
            original_chunks_too_small = any(min(c) < dd for dd, c in zip(depths, x.chunks))
            if original_chunks_too_small:
                raise ValueError(
                    "Overlap depth is larger than smallest chunksize.\n"
                    "Please set allow_rechunk=True to rechunk automatically.\n"
                    f"Overlap depths required: {depths}\n"
                    f"Input chunks: {x.chunks}\n"
                )

    # Fall back to direct implementation for complex cases:
    # - new_axis/drop_axis: change dimensionality
    # - explicit chunks: change output shape/chunks
    if (
        kwargs.get("new_axis") is not None
        or kwargs.get("drop_axis") is not None
        or kwargs.get("chunks") is not None
    ):
        return _map_overlap_direct(func, args, depth, boundary, trim, allow_rechunk, kwargs)

    # Create the logical MapOverlap
    # It will be lowered to the full pipeline during optimization
    return new_collection(
        MapOverlap(
            arrays=tuple(a.expr for a in args),
            func=func,
            depth=depth,
            boundary=boundary,
            trim_output=trim,
            allow_rechunk=allow_rechunk,
            kwargs=kwargs if kwargs else None,
        )
    )
def coerce_depth(ndim, depth):
    """Expand a depth specification into a ``{axis: depth}`` mapping.

    ``None`` is treated as 0. An integer is applied to every axis, a tuple
    is read positionally, and a dict is read by axis key; axes that a tuple
    or dict does not cover get 0. Any other kind of value is handed to
    ``coerce_depth_type`` unchanged. The result of ``coerce_depth_type`` is
    returned.
    """
    fallback = 0
    if depth is None:
        depth = fallback

    axes = range(ndim)
    if isinstance(depth, Integral):
        # One scalar depth shared by every axis.
        per_axis = {ax: depth for ax in axes}
    elif isinstance(depth, tuple):
        # Positional depths; trailing axes without an entry use the fallback.
        positional = dict(zip(axes, depth))
        per_axis = {ax: positional.get(ax, fallback) for ax in axes}
    elif isinstance(depth, dict):
        # Keyed depths; missing axes use the fallback.
        per_axis = {ax: depth.get(ax, fallback) for ax in axes}
    else:
        per_axis = depth
    return coerce_depth_type(ndim, per_axis)
def coerce_depth_type(ndim, depth):
    """Convert the depth entries for axes ``0..ndim-1`` to built-in ``int``.

    Tuple entries are converted element by element and stay tuples; any
    other entry is passed through ``int``. ``depth`` is modified in place
    and the same object is returned.
    """
    for axis in range(ndim):
        entry = depth[axis]
        if isinstance(entry, tuple):
            depth[axis] = tuple(map(int, entry))
        else:
            depth[axis] = int(entry)
    return depth
def coerce_boundary(ndim, boundary):
    """Expand a boundary specification into a ``{axis: boundary}`` mapping.

    ``None`` is treated as ``"none"``. A dict is read by axis key and a
    tuple positionally; any other value is applied to every axis. Axes a
    tuple or dict does not cover get ``"none"``. A new dict with exactly
    the keys ``0..ndim-1`` is returned.
    """
    fallback = "none"
    if boundary is None:
        boundary = fallback

    axes = range(ndim)
    if isinstance(boundary, dict):
        spec = boundary
    elif isinstance(boundary, tuple):
        spec = dict(zip(axes, boundary))
    else:
        # A single value shared by every axis.
        spec = dict.fromkeys(axes, boundary)
    return {ax: spec.get(ax, fallback) for ax in axes}
@derived_from(np.lib.stride_tricks)
def sliding_window_view(x, window_shape, axis=None, automatic_rechunk=True):
    # NOTE: no docstring here on purpose; ``derived_from`` is applied to this
    # function with ``np.lib.stride_tricks`` as its argument.

    # Accept a scalar window as well as any iterable of window sizes.
    if np.iterable(window_shape):
        window_shape = tuple(window_shape)
    else:
        window_shape = (window_shape,)

    if np.any(np.array(window_shape) <= 0):
        raise ValueError("`window_shape` must contain values > 0")

    n_windows = len(window_shape)
    if axis is None:
        axis = tuple(range(x.ndim))
        if n_windows != len(axis):
            raise ValueError(
                f"Since axis is `None`, must provide "
                f"window_shape for all dimensions of `x`; "
                f"got {len(window_shape)} window_shape elements "
                f"and `x.ndim` is {x.ndim}."
            )
    else:
        axis = normalize_axis_tuple(axis, x.ndim, allow_duplicate=True)
        if n_windows != len(axis):
            raise ValueError(
                f"Must provide matching length window_shape and "
                f"axis; got {len(window_shape)} window_shape "
                f"elements and {len(axis)} axes elements."
            )

    # Accumulate the overlap needed per input axis; an axis may be listed
    # more than once, in which case its windows add up.
    depths = [0] * x.ndim
    for target_axis, window in zip(axis, window_shape):
        depths[target_axis] += window - 1

    # Ensure that each chunk is big enough to leave at least a size-1 chunk
    # after windowing (this is only really necessary for the last chunk).
    safe_chunks = [
        ensure_minimum_chunksize(overlap + 1, axis_chunks)
        for overlap, axis_chunks in zip(depths, x.chunks)
    ]

    if not automatic_rechunk:
        x = x.rechunk(tuple(safe_chunks))
    else:
        # Axes without a window keep their original chunking.
        safe_chunks = [
            axis_chunks if overlap == 0 else adjusted
            for overlap, axis_chunks, adjusted in zip(depths, x.chunks, safe_chunks)
        ]
        # safe chunks is our output chunks, so add the new dimensions
        safe_chunks.extend((window,) for window in window_shape)
        largest_block = reduce(mul, map(max, x.chunks))
        unwindowed_axes = {idx for idx, overlap in enumerate(depths) if overlap == 0}
        rechunked = _calculate_new_chunksizes(
            x.chunks,
            list(safe_chunks),
            unwindowed_axes,
            largest_block,
        )
        x = x.rechunk(tuple(rechunked))

    # result.shape = x_shape_trimmed + window_shape,
    # where x_shape_trimmed is x.shape with every entry
    # reduced by one less than the corresponding window size.
    # trim chunks to match x_shape_trimmed
    trimmed_chunks = tuple(
        axis_chunks[:-1] + (axis_chunks[-1] - overlap,)
        for overlap, axis_chunks in zip(depths, x.chunks)
    )
    window_chunks = tuple((window,) for window in window_shape)
    newchunks = trimmed_chunks + window_chunks

    return map_overlap(
        np.lib.stride_tricks.sliding_window_view,
        x,
        depth=tuple((0, overlap) for overlap in depths),  # Overlap on +ve side only
        boundary="none",
        meta=x._meta,
        new_axis=range(x.ndim, x.ndim + len(axis)),
        chunks=newchunks,
        trim=False,
        align_arrays=False,
        window_shape=window_shape,
        axis=axis,
    )
+def _fill_with_last_one(a, b):
+    """Fill NaN values in b with values from a."""
+    return np.where(~np.isnan(b), b, a)
def _push(array, n=None, axis=-1):
    """Call ``bottleneck.push`` on one chunk.

    When ``n`` is None the length of ``array`` along ``axis`` is passed as
    the limit instead.
    """
    import bottleneck as bn

    if n is None:
        n = array.shape[axis]
    return bn.push(array, n, axis)
def push(array, n, axis):
    """
    Dask-version of bottleneck.push

    Forward fill NaN values along an axis.

    .. note::

        Requires bottleneck to be installed.

    Parameters
    ----------
    array : dask array
        Array whose NaN values are filled.
    n : int or None
        Fill limit. It is only applied when ``0 < n < array.shape[axis] - 1``:
        a position is then filled only if it lies at most ``n`` steps after
        the last non-null position along ``axis``, and is NaN otherwise.
        For ``None`` or any value outside that range the fill is unlimited.
    axis : int
        Axis to fill along. Negative values count from the last axis.
    """
    import dask_array as da
    from dask._compatibility import import_optional_dependency

    import_optional_dependency("bottleneck", min_version="1.3.7")

    if n is not None and 0 < n < array.shape[axis] - 1:
        # ``enumerate`` below yields non-negative indices only, so a negative
        # ``axis`` has to be normalised before it is compared against them.
        # ``array.shape[axis]`` above has already rejected out-of-range axes.
        axis_index = axis % len(array.shape)
        # Position index along ``axis``, broadcast to the full array shape.
        arr = da.broadcast_to(
            da.arange(array.shape[axis], chunks=array.chunks[axis], dtype=array.dtype).reshape(
                tuple(size if i == axis_index else 1 for i, size in enumerate(array.shape))
            ),
            array.shape,
            array.chunks,
        )
        # Forward-filling the positions of non-null entries gives, for every
        # element, the position of the last non-null entry before it.
        valid_arange = da.where(da.notnull(array), arr, np.nan)
        valid_limits = (arr - push(valid_arange, None, axis)) <= n
        # omit the forward fill that violate the limit
        return da.where(valid_limits, push(array, None, axis), np.nan)

    from dask_array.reductions import cumreduction

    # Unlimited fill: push within each chunk, then carry the last value
    # across chunk boundaries with ``_fill_with_last_one``.
    return cumreduction(
        func=_push,
        binop=_fill_with_last_one,
        ident=np.nan,
        x=array,
        axis=axis,
        dtype=array.dtype,
    )