effectful 0.0.1-py3-none-any.whl → 0.2.0-py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
@@ -1,35 +1,46 @@
+import functools
 import typing
-import warnings
-from typing import Any, Collection, List, Mapping, Optional, Tuple
+from collections.abc import Collection, Mapping
+from typing import Any
+
+import pyro.poutine.subsample_messenger

 try:
     import pyro
 except ImportError:
     raise ImportError("Pyro is required to use effectful.handlers.pyro.")

+import pyro.distributions as dist
+from pyro.distributions.torch_distribution import (
+    TorchDistribution,
+    TorchDistributionMixin,
+)
+
 try:
     import torch
 except ImportError:
     raise ImportError("PyTorch is required to use effectful.handlers.pyro.")

-from typing_extensions import ParamSpec
-
-from effectful.handlers.torch import Indexable, sizesof, to_tensor
-from effectful.ops.syntax import defop
-from effectful.ops.types import Operation
-
-P = ParamSpec("P")
+from effectful.handlers.torch import (
+    bind_dims,
+    sizesof,
+    unbind_dims,
+)
+from effectful.internals.runtime import interpreter
+from effectful.ops.semantics import apply, runner, typeof
+from effectful.ops.syntax import defdata, defop, defterm
+from effectful.ops.types import NotHandled, Operation, Term


 @defop
 def pyro_sample(
     name: str,
-    fn: pyro.distributions.torch_distribution.TorchDistributionMixin,
+    fn: TorchDistributionMixin,
     *args,
-    obs: Optional[torch.Tensor] = None,
-    obs_mask: Optional[torch.BoolTensor] = None,
-    mask: Optional[torch.BoolTensor] = None,
-    infer: Optional[pyro.poutine.runtime.InferDict] = None,
+    obs: torch.Tensor | None = None,
+    obs_mask: torch.BoolTensor | None = None,
+    mask: torch.BoolTensor | None = None,
+    infer: pyro.poutine.runtime.InferDict | None = None,
     **kwargs,
 ) -> torch.Tensor:
     """
@@ -41,6 +52,39 @@ def pyro_sample(
     )


+class Naming:
+    """
+    A mapping from dimensions (indexed from the right) to names.
+    """
+
+    def __init__(self, name_to_dim: Mapping[Operation[[], torch.Tensor], int]):
+        assert all(v < 0 for v in name_to_dim.values())
+        self.name_to_dim = name_to_dim
+
+    @staticmethod
+    def from_shape(
+        names: Collection[Operation[[], torch.Tensor]], event_dims: int
+    ) -> "Naming":
+        """Create a naming from a set of indices and the number of event dimensions.
+
+        The resulting naming converts tensors of shape
+        ``| batch_shape | named | event_shape |``
+        to tensors of shape ``| batch_shape | event_shape |, | named |``.
+
+        """
+        assert event_dims >= 0
+        return Naming({n: -event_dims - len(names) + i for i, n in enumerate(names)})
+
+    def apply(self, value: torch.Tensor) -> torch.Tensor:
+        indexes: list[Any] = [slice(None)] * (len(value.shape))
+        for n, d in self.name_to_dim.items():
+            indexes[len(value.shape) + d] = n()
+        return value[tuple(indexes)]
+
+    def __repr__(self):
+        return f"Naming({self.name_to_dim})"
+
+
 class PyroShim(pyro.poutine.messenger.Messenger):
     """Pyro handler that wraps all sample sites in a custom effectful type.

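The `Naming` helper added in this hunk maps free index variables to dimensions counted from the right. A minimal sketch of its behaviour (not part of the diff, and assuming an index variable created with `defop` as elsewhere in this module):

import torch

from effectful.handlers.pyro import Naming
from effectful.handlers.torch import sizesof
from effectful.ops.syntax import defop

i = defop(torch.Tensor)  # a free index variable standing for a named dimension

# With one name and one event dimension, the name is assigned to dim -2.
naming = Naming.from_shape([i], event_dims=1)

t = torch.randn(3, 2)      # | named (3) | event_shape (2) |
named_t = naming.apply(t)  # indexes dim -2 with i(), leaving the event dim positional

# The size of the named dimension is now reported by sizesof rather than by the shape.
assert sizesof(named_t) == {i: 3}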
@@ -81,17 +125,24 @@ class PyroShim(pyro.poutine.messenger.Messenger):
     Sampled y
     """

-    _current_site: Optional[str]
+    # Tracks the named dimensions on any sample site that we have handled.
+    # Ideally, this information would be carried on the sample message itself.
+    # However, when using guides, sample sites are completely replaced by fresh
+    # guide sample sites that do not carry the same infer dict.
+    #
+    # We can only restore the named dimensions on samples that we have handled
+    # at least once in the shim.
+    _index_naming: dict[str, Naming]

-    def __enter__(self):
-        if any(isinstance(m, PyroShim) for m in pyro.poutine.runtime._PYRO_STACK):
-            warnings.warn("PyroShim should be installed at most once.")
-        return super().__enter__()
+    def __init__(self):
+        self._index_naming = {}

     @staticmethod
     def _broadcast_to_named(
-        t: torch.Tensor, shape: torch.Size, indices: Mapping[Operation[[], int], int]
-    ) -> Tuple[torch.Tensor, "Naming"]:
+        t: torch.Tensor,
+        shape: torch.Size,
+        indices: Mapping[Operation[[], torch.Tensor], int],
+    ) -> tuple[torch.Tensor, "Naming"]:
         """Convert a tensor `t` to a fully positional tensor that is
         broadcastable with the positional representation of tensors of shape
         |shape|, |indices|.
@@ -99,6 +150,9 @@ class PyroShim(pyro.poutine.messenger.Messenger):
         """
         t_indices = sizesof(t)

+        if not isinstance(t, torch.Tensor):
+            t = torch.tensor(t)
+
         if len(t.shape) < len(shape):
             t = t.expand(shape)

@@ -106,7 +160,7 @@ class PyroShim(pyro.poutine.messenger.Messenger):
         name_to_dim = {}
         for i, (k, v) in enumerate(reversed(list(indices.items()))):
             if k in t_indices:
-                t = to_tensor(t, [k])
+                t = bind_dims(t, k)
             else:
                 t = t.expand((v,) + t.shape)
             name_to_dim[k] = -len(shape) - i - 1
@@ -114,7 +168,7 @@ class PyroShim(pyro.poutine.messenger.Messenger):
         # create a positional dimension for every remaining named index in `t`
         n_batch_and_dist_named = len(t.shape)
         for i, k in enumerate(reversed(list(sizesof(t).keys()))):
-            t = to_tensor(t, [k])
+            t = bind_dims(t, k)
             name_to_dim[k] = -n_batch_and_dist_named - i - 1

         return t, Naming(name_to_dim)
@@ -124,26 +178,47 @@ class PyroShim(pyro.poutine.messenger.Messenger):
         assert msg["type"] == "sample"
         assert msg["name"] is not None
         assert msg["infer"] is not None
-        assert isinstance(
-            msg["fn"], pyro.distributions.torch_distribution.TorchDistributionMixin
-        )
+        assert isinstance(msg["fn"], TorchDistributionMixin)

         if pyro.poutine.util.site_is_subsample(msg) or pyro.poutine.util.site_is_factor(
             msg
         ):
             return

-        if getattr(self, "_current_site", None) == msg["name"]:
-            if "_markov_scope" in msg["infer"] and self._current_site:
-                msg["infer"]["_markov_scope"].pop(self._current_site, None)
+        if "pyro_shim_status" in msg["infer"]:
+            handler_id, handler_stage = msg["infer"]["pyro_shim_status"]  # type: ignore
+        else:
+            handler_id = id(self)
+            handler_stage = 0
+            msg["infer"]["pyro_shim_status"] = (handler_id, handler_stage)  # type: ignore
+
+        if handler_id != id(self):  # Never handle a message that is not ours.
+            return
+
+        assert handler_stage in (0, 1)
+
+        # PyroShim turns each call to pyro.sample into two calls. The first
+        # dispatches to pyro_sample and the effectful stack. The effectful stack
+        # eventually calls pyro.sample again. We use state in PyroShim to
+        # recognize that we've been called twice, and we dispatch to the pyro
+        # stack.
+        #
+        # This branch handles the second call, so it massages the message to be
+        # compatible with Pyro. In particular, it removes all named dimensions
+        # and stores naming information in the message. Names are replaced by
+        # _pyro_post_sample.
+        if handler_stage == 1:
+            if "_markov_scope" in msg["infer"]:
+                msg["infer"]["_markov_scope"].pop(msg["name"], None)

             dist = msg["fn"]
             obs = msg["value"] if msg["is_observed"] else None

             # pdist shape: | named1 | batch_shape | event_shape |
             # obs shape: | batch_shape | event_shape |, | named2 | where named2 may overlap named1
-            pdist = PositionalDistribution(dist)
-            naming = pdist.naming
+            indices = sizesof(dist)
+            naming = Naming.from_shape(indices, len(dist.shape()))
+            pdist = bind_dims(dist, *indices.keys())

             if msg["mask"] is None:
                 mask = torch.tensor(True)
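The comments in this hunk describe the two-stage dispatch that replaces the old `_current_site` flag: the first time a site is seen it is routed through the `pyro_sample` operation, and the second time (tagged in `infer["pyro_shim_status"]`) it is handed to Pyro's own stack with named dimensions bound to positional ones. A minimal usage sketch, not taken from the package but using only names defined in this module:

import pyro
import pyro.distributions as dist
import torch

from effectful.handlers.pyro import PyroShim

def model():
    # Under PyroShim, this statement is dispatched to the pyro_sample
    # operation first and only then to Pyro's handler stack.
    return pyro.sample("x", dist.Normal(torch.tensor(0.0), torch.tensor(1.0)))

with PyroShim():
    x = model()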
@@ -152,290 +227,566 @@ class PyroShim(pyro.poutine.messenger.Messenger):
             else:
                 mask = msg["mask"]

-            pos_mask, _ = PyroShim._broadcast_to_named(
-                mask, dist.batch_shape, pdist.indices
+            assert set(sizesof(mask).keys()) <= (
+                set(indices.keys()) | set(sizesof(obs).keys())
             )
+            pos_mask, _ = PyroShim._broadcast_to_named(mask, dist.batch_shape, indices)

-            pos_obs: Optional[torch.Tensor] = None
+            pos_obs: torch.Tensor | None = None
             if obs is not None:
                 pos_obs, naming = PyroShim._broadcast_to_named(
-                    obs, dist.shape(), pdist.indices
+                    obs, dist.shape(), indices
                 )

+            # Each of the batch dimensions on the distribution gets a
+            # cond_indep_stack frame.
             for var, dim in naming.name_to_dim.items():
-                frame = pyro.poutine.indep_messenger.CondIndepStackFrame(
-                    name=str(var), dim=dim, size=-1, counter=0
-                )
-                msg["cond_indep_stack"] = (frame,) + msg["cond_indep_stack"]
+                # There can be additional batch dimensions on the observation
+                # that do not get frames, so only consider dimensions on the
+                # distribution.
+                if var in indices:
+                    frame = pyro.poutine.indep_messenger.CondIndepStackFrame(
+                        name=f"__index_plate_{var}",
+                        # dims are indexed from the right of the batch shape
+                        dim=dim + len(pdist.event_shape),
+                        size=indices[var],
+                        counter=0,
+                    )
+                    msg["cond_indep_stack"] = (frame,) + msg["cond_indep_stack"]

             msg["fn"] = pdist
             msg["value"] = pos_obs
             msg["mask"] = pos_mask
-            msg["infer"]["_index_naming"] = naming  # type: ignore
+
+            # stash the index naming on the sample message so that future
+            # consumers of the trace can get at it
+            msg["_index_naming"] = naming  # type: ignore
+
+            self._index_naming[msg["name"]] = naming

             assert sizesof(msg["value"]) == {}
             assert sizesof(msg["mask"]) == {}

-            return
+        # This branch handles the first call to pyro.sample by calling pyro_sample.
+        else:
+            infer = msg["infer"].copy()
+            infer["pyro_shim_status"] = (handler_id, 1)  # type: ignore

-        try:
-            self._current_site = msg["name"]
             msg["value"] = pyro_sample(
                 msg["name"],
                 msg["fn"],
                 obs=msg["value"] if msg["is_observed"] else None,
-                infer=msg["infer"].copy(),
+                infer=infer,
             )
-        finally:
-            self._current_site = None

-        # flags to guarantee commutativity of condition, intervene, trace
-        msg["stop"] = True
-        msg["done"] = True
-        msg["mask"] = False
-        msg["is_observed"] = True
-        msg["infer"]["is_auxiliary"] = True
-        msg["infer"]["_do_not_trace"] = True
+            # flags to guarantee commutativity of condition, intervene, trace
+            msg["stop"] = True
+            msg["done"] = True
+            msg["mask"] = False
+            msg["is_observed"] = True
+            msg["infer"]["is_auxiliary"] = True
+            msg["infer"]["_do_not_trace"] = True

     def _pyro_post_sample(self, msg: pyro.poutine.runtime.Message) -> None:
-        infer = msg.get("infer")
-        if infer is None or "_index_naming" not in infer:
-            return
+        if typing.TYPE_CHECKING:
+            assert msg["name"] is not None
+            assert msg["value"] is not None
+            assert msg["infer"] is not None

-        # note: Pyro uses a TypedDict for infer, so it doesn't know we've stored this key
-        naming = infer["_index_naming"]  # type: ignore
+        # If there is no shim status, assume that we are looking at a guide sample.
+        # In this case, we should handle the sample and claim it as ours if we have naming
+        # information for it.
+        if "pyro_shim_status" not in msg["infer"]:
+            # Except, of course, for subsample messages, which we should ignore.
+            if (
+                pyro.poutine.util.site_is_subsample(msg)
+                or msg["name"] not in self._index_naming
+            ):
+                return
+            msg["infer"]["pyro_shim_status"] = (id(self), 1)  # type: ignore
+
+        # If this message has been handled already by a different pyro shim, ignore.
+        handler_id, handler_stage = msg["infer"]["pyro_shim_status"]  # type: ignore
+        if handler_id != id(self) or handler_stage < 1:
+            return

         value = msg["value"]

-        if value is not None:
-            # note: is it safe to assume that msg['fn'] is a distribution?
-            assert isinstance(
-                msg["fn"], pyro.distributions.torch_distribution.TorchDistribution
-            )
-            dist_shape: tuple[int, ...] = msg["fn"].batch_shape + msg["fn"].event_shape
-            if len(value.shape) < len(dist_shape):
-                value = value.broadcast_to(
-                    torch.broadcast_shapes(value.shape, dist_shape)
-                )
-            value = naming.apply(value)
-            msg["value"] = value
+        naming = self._index_naming.get(msg["name"], Naming({}))
+        infer = msg["infer"] if msg["infer"] is not None else {}
+        assert "enumerate" not in infer or len(naming.name_to_dim) == 0, (
+            "Enumeration is not currently supported in PyroShim."
+        )

+        # note: is it safe to assume that msg['fn'] is a distribution?
+        dist_shape: tuple[int, ...] = msg["fn"].batch_shape + msg["fn"].event_shape  # type: ignore
+        if len(value.shape) < len(dist_shape):
+            value = value.broadcast_to(torch.broadcast_shapes(value.shape, dist_shape))

-class Naming:
-    """
-    A mapping from dimensions (indexed from the right) to names.
-    """
+        value = naming.apply(value)
+        msg["value"] = value

-    def __init__(self, name_to_dim: Mapping[Operation[[], int], int]):
-        assert all(v < 0 for v in name_to_dim.values())
-        self.name_to_dim = name_to_dim

-    @staticmethod
-    def from_shape(names: Collection[Operation[[], int]], event_dims: int) -> "Naming":
-        """Create a naming from a set of indices and the number of event dimensions.
+PyroDistribution = (
+    pyro.distributions.torch_distribution.TorchDistribution
+    | pyro.distributions.torch_distribution.TorchDistributionMixin
+)

-        The resulting naming converts tensors of shape
-        ``| batch_shape | named | event_shape |``
-        to tensors of shape ``| batch_shape | event_shape |, | named |``.

-        """
-        assert event_dims >= 0
-        return Naming({n: -event_dims - len(names) + i for i, n in enumerate(names)})
+@unbind_dims.register(pyro.distributions.torch_distribution.TorchDistribution)  # type: ignore
+@unbind_dims.register(pyro.distributions.torch_distribution.TorchDistributionMixin)  # type: ignore
+def _unbind_dims_distribution(
+    value: pyro.distributions.torch_distribution.TorchDistribution,
+    *names: Operation[[], torch.Tensor],
+) -> pyro.distributions.torch_distribution.TorchDistribution:
+    d = value
+    batch_shape = None

-    def apply(self, value: torch.Tensor) -> torch.Tensor:
-        indexes: List[Any] = [slice(None)] * (len(value.shape))
-        for n, d in self.name_to_dim.items():
-            indexes[len(value.shape) + d] = n()
-        return Indexable(value)[tuple(indexes)]
+    def _validate_batch_shape(t):
+        nonlocal batch_shape
+        if len(t.shape) < len(names):
+            raise ValueError(
+                "All tensors must have at least as many dimensions as names"
+            )

-    def __repr__(self):
-        return f"Naming({self.name_to_dim})"
+        if batch_shape is None:
+            batch_shape = t.shape[: len(names)]

+        if (
+            len(t.shape) < len(batch_shape)
+            or t.shape[: len(batch_shape)] != batch_shape
+        ):
+            raise ValueError("All tensors must have the same batch shape.")
+
+    def _to_named(a):
+        nonlocal batch_shape
+        if isinstance(a, torch.Tensor):
+            _validate_batch_shape(a)
+            return typing.cast(torch.Tensor, a)[tuple(n() for n in names)]
+        elif isinstance(a, TorchDistribution):
+            return unbind_dims(a, *names)
+        else:
+            return a
+
+    # Convert to a term in a context that does not evaluate distribution constructors.
+    def _apply(op, *args, **kwargs):
+        typ = op.__type_rule__(*args, **kwargs)
+        if issubclass(
+            typ, pyro.distributions.torch_distribution.TorchDistribution
+        ) or issubclass(
+            typ, pyro.distributions.torch_distribution.TorchDistributionMixin
+        ):
+            return defdata(op, *args, **kwargs)
+        return op.__default_rule__(*args, **kwargs)
+
+    with runner({apply: _apply}):
+        d = defterm(d)
+
+    if not (isinstance(d, Term) and typeof(d) is TorchDistribution):
+        raise NotHandled
+
+    new_d = d.op(
+        *[_to_named(a) for a in d.args],
+        **{k: _to_named(v) for (k, v) in d.kwargs.items()},
+    )
+    assert new_d.event_shape == d.event_shape
+    return new_d
+
+
+@bind_dims.register(pyro.distributions.torch_distribution.TorchDistribution)  # type: ignore
+@bind_dims.register(pyro.distributions.torch_distribution.TorchDistributionMixin)  # type: ignore
+def _bind_dims_distribution(
+    value: pyro.distributions.torch_distribution.TorchDistribution,
+    *names: Operation[[], torch.Tensor],
+) -> pyro.distributions.torch_distribution.TorchDistribution:
+    d = value
+
+    def _to_positional(a, indices):
+        if isinstance(a, torch.Tensor):
+            # broadcast to full indexed shape
+            existing_dims = set(sizesof(a).keys())
+            missing_dims = set(indices) - existing_dims
+
+            a_indexed = torch.broadcast_to(
+                a, torch.Size([indices[dim] for dim in missing_dims]) + a.shape
+            )[tuple(n() for n in missing_dims)]
+            return bind_dims(a_indexed, *names)
+        elif isinstance(a, TorchDistribution):
+            return bind_dims(a, *names)
+        else:
+            return a
+
+    # Convert to a term in a context that does not evaluate distribution constructors.
+    def _apply(op, *args, **kwargs):
+        typ = op.__type_rule__(*args, **kwargs)
+        if issubclass(
+            typ, pyro.distributions.torch_distribution.TorchDistribution
+        ) or issubclass(
+            typ, pyro.distributions.torch_distribution.TorchDistributionMixin
+        ):
+            return defdata(op, *args, **kwargs)
+        return op.__default_rule__(*args, **kwargs)

-class PositionalDistribution(pyro.distributions.torch_distribution.TorchDistribution):
-    """A distribution wrapper that lazily converts indexed dimensions to
-    positional.
+    with runner({apply: _apply}):
+        d = defterm(d)

-    """
+    if not (isinstance(d, Term) and typeof(d) is TorchDistribution):
+        raise NotHandled

-    indices: Mapping[Operation[[], int], int]
+    sizes = sizesof(d)
+    indices = {k: sizes[k] for k in names}

-    def __init__(
-        self, base_dist: pyro.distributions.torch_distribution.TorchDistribution
-    ):
-        self.base_dist = base_dist
-        self.indices = sizesof(base_dist.sample())
+    pos_args = [_to_positional(a, indices) for a in d.args]
+    pos_kwargs = {k: _to_positional(v, indices) for (k, v) in d.kwargs.items()}
+    new_d = d.op(*pos_args, **pos_kwargs)

-        n_base = len(base_dist.batch_shape) + len(base_dist.event_shape)
-        self.naming = Naming.from_shape(self.indices.keys(), n_base)
+    assert new_d.event_shape == d.event_shape
+    return new_d

-        super().__init__()

-    def _to_positional(self, value: torch.Tensor) -> torch.Tensor:
-        # self.base_dist has shape: | batch_shape | event_shape | & named
-        # assume value comes from base_dist with shape:
-        # | sample_shape | batch_shape | event_shape | & named
-        # return a tensor of shape | sample_shape | named | batch_shape | event_shape |
-        n_named = len(self.indices)
-        dims = list(range(n_named + len(value.shape)))
+@functools.cache
+def _register_distribution_op(
+    dist_constr: type[TorchDistribution],
+) -> Operation[Any, TorchDistribution]:
+    # introduce a wrapper so that we can control type annotations
+    def wrapper(*args, **kwargs) -> TorchDistribution:
+        return dist_constr(*args, **kwargs)

-        n_base = len(self.event_shape) + len(self.base_dist.batch_shape)
-        n_sample = len(value.shape) - n_base
+    return defop(wrapper)

-        base_dims = dims[len(dims) - n_base :]
-        named_dims = dims[:n_named]
-        sample_dims = dims[n_named : n_named + n_sample]

-        # shape: | named | sample_shape | batch_shape | event_shape |
-        # TODO: replace with something more efficient
-        pos_tensor = to_tensor(value, self.indices.keys())
+@defdata.register(pyro.distributions.torch_distribution.TorchDistribution)
+@defdata.register(pyro.distributions.torch_distribution.TorchDistributionMixin)
+class _DistributionTerm(Term[TorchDistribution], TorchDistribution):
+    """A distribution wrapper that satisfies the Term interface.

-        # shape: | sample_shape | named | batch_shape | event_shape |
-        pos_tensor_r = torch.permute(pos_tensor, sample_dims + named_dims + base_dims)
+    Represented as a term of the form call(D, *args, **kwargs) where D is the
+    distribution constructor.

-        return pos_tensor_r
+    Note: When we construct instances of this class, we put distribution
+    parameters that can be expanded in the args list and those that cannot in
+    the kwargs list.

-    def _from_positional(self, value: torch.Tensor) -> torch.Tensor:
-        # maximal value shape: | sample_shape | named | batch_shape | event_shape |
-        return self.naming.apply(value)
+    """
+
+    _op: Operation[Any, TorchDistribution]
+    _args: tuple
+    _kwargs: dict
+
+    def __init__(self, op: Operation[Any, TorchDistribution], *args, **kwargs):
+        self._op = op
+        self._args = tuple(defterm(a) for a in args)
+        self._kwargs = {k: defterm(v) for (k, v) in kwargs.items()}
+
+    @property
+    def op(self):
+        return self._op
+
+    @property
+    def args(self):
+        return self._args
+
+    @property
+    def kwargs(self):
+        return self._kwargs
+
+    @property
+    def _base_dist(self):
+        return self._op(*self.args, **self.kwargs)

     @property
     def has_rsample(self):
-        return self.base_dist.has_rsample
+        return self._base_dist.has_rsample

     @property
     def batch_shape(self):
-        return (
-            torch.Size([s for s in self.indices.values()]) + self.base_dist.batch_shape
-        )
+        return self._base_dist.batch_shape

     @property
     def event_shape(self):
-        return self.base_dist.event_shape
+        return self._base_dist.event_shape

     @property
     def has_enumerate_support(self):
-        return self.base_dist.has_enumerate_support
+        return self._base_dist.has_enumerate_support

     @property
     def arg_constraints(self):
-        return self.base_dist.arg_constraints
+        return self._base_dist.arg_constraints

     @property
     def support(self):
-        return self.base_dist.support
-
-    def __repr__(self):
-        return f"PositionalDistribution({self.base_dist})"
+        return self._base_dist.support

     def sample(self, sample_shape=torch.Size()):
-        return self._to_positional(self.base_dist.sample(sample_shape))
+        return self._base_dist.sample(sample_shape)

     def rsample(self, sample_shape=torch.Size()):
-        return self._to_positional(self.base_dist.rsample(sample_shape))
+        return self._base_dist.rsample(sample_shape)

     def log_prob(self, value):
-        return self._to_positional(
-            self.base_dist.log_prob(self._from_positional(value))
-        )
+        return self._base_dist.log_prob(value)

     def enumerate_support(self, expand=True):
-        return self._to_positional(self.base_dist.enumerate_support(expand))
+        return self._base_dist.enumerate_support(expand)


-class NamedDistribution(pyro.distributions.torch_distribution.TorchDistribution):
-    """A distribution wrapper that lazily names leftmost dimensions."""
+@defterm.register(TorchDistribution)
+@defterm.register(TorchDistributionMixin)
+def _embed_distribution(dist: TorchDistribution) -> Term[TorchDistribution]:
+    raise ValueError(
+        f"No embedding provided for distribution of type {type(dist).__name__}."
+    )

-    def __init__(
-        self,
-        base_dist: pyro.distributions.torch_distribution.TorchDistribution,
-        names: Collection[Operation[[], int]],
-    ):
-        """
-        :param base_dist: A distribution with batch dimensions.

-        :param names: A list of names.
+@defterm.register
+def _embed_expanded(d: dist.ExpandedDistribution) -> Term[TorchDistribution]:
+    with interpreter({}):
+        batch_shape = d._batch_shape
+        base_dist = d.base_dist
+        base_batch_shape = base_dist.batch_shape
+        if batch_shape == base_batch_shape:
+            return base_dist

-        """
-        self.base_dist = base_dist
-        self.names = names
+    raise ValueError("Nontrivial ExpandedDistribution not implemented.")

-        assert 1 <= len(names) <= len(base_dist.batch_shape)
-        base_indices = sizesof(base_dist.sample())
-        assert not any(n in base_indices for n in names)

-        n_base = len(base_dist.batch_shape) + len(base_dist.event_shape)
-        self.naming = Naming.from_shape(names, n_base - len(names))
-        super().__init__()
+@defterm.register
+def _embed_independent(d: dist.Independent) -> Term[TorchDistribution]:
+    with interpreter({}):
+        base_dist = d.base_dist
+        reinterpreted_batch_ndims = d.reinterpreted_batch_ndims

-    def _to_named(self, value: torch.Tensor, offset=0) -> torch.Tensor:
-        return self.naming.apply(value)
+    return _register_distribution_op(type(d))(base_dist, reinterpreted_batch_ndims)

-    def _from_named(self, value: torch.Tensor) -> torch.Tensor:
-        pos_value = to_tensor(value, self.names)

-        dims = list(range(len(pos_value.shape)))
+@defterm.register
+def _embed_folded(d: dist.FoldedDistribution) -> Term[TorchDistribution]:
+    with interpreter({}):
+        base_dist = d.base_dist

-        n_base = len(self.event_shape) + len(self.batch_shape)
-        n_named = len(self.names)
-        n_sample = len(pos_value.shape) - n_base - n_named
+    return _register_distribution_op(type(d))(base_dist)  # type: ignore

-        base_dims = dims[len(dims) - n_base :]
-        named_dims = dims[:n_named]
-        sample_dims = dims[n_named : n_named + n_sample]

-        pos_tensor_r = torch.permute(pos_value, sample_dims + named_dims + base_dims)
+@defterm.register
+def _embed_masked(d: dist.MaskedDistribution) -> Term[TorchDistribution]:
+    with interpreter({}):
+        base_dist = d.base_dist
+        mask = d._mask

-        return pos_tensor_r
+    return _register_distribution_op(type(d))(base_dist, mask)

-    @property
-    def has_rsample(self):
-        return self.base_dist.has_rsample

-    @property
-    def batch_shape(self):
-        return self.base_dist.batch_shape[len(self.names) :]
+@defterm.register(dist.Cauchy)
+@defterm.register(dist.Gumbel)
+@defterm.register(dist.Laplace)
+@defterm.register(dist.LogNormal)
+@defterm.register(dist.Logistic)
+@defterm.register(dist.LogisticNormal)
+@defterm.register(dist.Normal)
+@defterm.register(dist.StudentT)
+def _embed_loc_scale(d: TorchDistribution) -> Term[TorchDistribution]:
+    with interpreter({}):
+        loc = d.loc
+        scale = d.scale

-    @property
-    def event_shape(self):
-        return self.base_dist.event_shape
+    return _register_distribution_op(type(d))(loc, scale)

-    @property
-    def has_enumerate_support(self):
-        return self.base_dist.has_enumerate_support

-    @property
-    def arg_constraints(self):
-        return self.base_dist.arg_constraints
+@defterm.register(dist.Bernoulli)
+@defterm.register(dist.Categorical)
+@defterm.register(dist.ContinuousBernoulli)
+@defterm.register(dist.Geometric)
+@defterm.register(dist.OneHotCategorical)
+@defterm.register(dist.OneHotCategoricalStraightThrough)
+def _embed_probs(d: TorchDistribution) -> Term[TorchDistribution]:
+    with interpreter({}):
+        probs = d.probs

-    @property
-    def support(self):
-        return self.base_dist.support
+    return _register_distribution_op(type(d))(probs)

-    def __repr__(self):
-        return f"NamedDistribution({self.base_dist}, {self.names})"

-    def sample(self, sample_shape=torch.Size()):
-        t = self._to_named(
-            self.base_dist.sample(sample_shape), offset=len(sample_shape)
-        )
-        assert set(sizesof(t).keys()) == set(self.names)
-        assert t.shape == self.shape() + sample_shape
-        return t
+@defterm.register(dist.Beta)
+@defterm.register(dist.Kumaraswamy)
+def _embed_beta(d: TorchDistribution) -> Term[TorchDistribution]:
+    with interpreter({}):
+        concentration1 = d.concentration1
+        concentration0 = d.concentration0

-    def rsample(self, sample_shape=torch.Size()):
-        return self._to_named(
-            self.base_dist.rsample(sample_shape), offset=len(sample_shape)
-        )
+    return _register_distribution_op(type(d))(concentration1, concentration0)

-    def log_prob(self, value):
-        v1 = self._from_named(value)
-        v2 = self.base_dist.log_prob(v1)
-        v3 = self._to_named(v2)
-        return v3

-    def enumerate_support(self, expand=True):
-        return self._to_named(self.base_dist.enumerate_support(expand))
+@defterm.register
+def _embed_binomial(d: dist.Binomial) -> Term[TorchDistribution]:
+    with interpreter({}):
+        total_count = d.total_count
+        probs = d.probs
+
+    return _register_distribution_op(dist.Binomial)(total_count, probs)
+
+
+@defterm.register
+def _embed_chi2(d: dist.Chi2) -> Term[TorchDistribution]:
+    with interpreter({}):
+        df = d.df
+
+    return _register_distribution_op(dist.Chi2)(df)
+
+
+@defterm.register
+def _embed_dirichlet(d: dist.Dirichlet) -> Term[TorchDistribution]:
+    with interpreter({}):
+        concentration = d.concentration
+
+    return _register_distribution_op(dist.Dirichlet)(concentration)
+
+
+@defterm.register
+def _embed_exponential(d: dist.Exponential) -> Term[TorchDistribution]:
+    with interpreter({}):
+        rate = d.rate
+
+    return _register_distribution_op(dist.Exponential)(rate)
+
+
+@defterm.register
+def _embed_fisher_snedecor(d: dist.FisherSnedecor) -> Term[TorchDistribution]:
+    with interpreter({}):
+        df1 = d.df1
+        df2 = d.df2
+
+    return _register_distribution_op(dist.FisherSnedecor)(df1, df2)
+
+
+@defterm.register
+def _embed_gamma(d: dist.Gamma) -> Term[TorchDistribution]:
+    with interpreter({}):
+        concentration = d.concentration
+        rate = d.rate
+
+    return _register_distribution_op(dist.Gamma)(concentration, rate)
+
+
+@defterm.register(dist.HalfCauchy)
+@defterm.register(dist.HalfNormal)
+def _embed_half_cauchy(d: TorchDistribution) -> Term[TorchDistribution]:
+    with interpreter({}):
+        scale = d.scale
+
+    return _register_distribution_op(type(d))(scale)
+
+
+@defterm.register
+def _embed_lkj_cholesky(d: dist.LKJCholesky) -> Term[TorchDistribution]:
+    with interpreter({}):
+        dim = d.dim
+        concentration = d.concentration
+
+    return _register_distribution_op(dist.LKJCholesky)(dim, concentration=concentration)
+
+
+@defterm.register
+def _embed_multinomial(d: dist.Multinomial) -> Term[TorchDistribution]:
+    with interpreter({}):
+        total_count = d.total_count
+        probs = d.probs
+
+    return _register_distribution_op(dist.Multinomial)(total_count, probs)
+
+
+@defterm.register
+def _embed_multivariate_normal(d: dist.MultivariateNormal) -> Term[TorchDistribution]:
+    with interpreter({}):
+        loc = d.loc
+        scale_tril = d.scale_tril
+
+    return _register_distribution_op(dist.MultivariateNormal)(
+        loc, scale_tril=scale_tril
+    )
+
+
+@defterm.register
+def _embed_negative_binomial(d: dist.NegativeBinomial) -> Term[TorchDistribution]:
+    with interpreter({}):
+        total_count = d.total_count
+        probs = d.probs
+
+    return _register_distribution_op(dist.NegativeBinomial)(total_count, probs)
+
+
+@defterm.register
+def _embed_pareto(d: dist.Pareto) -> Term[TorchDistribution]:
+    with interpreter({}):
+        scale = d.scale
+        alpha = d.alpha
+
+    return _register_distribution_op(dist.Pareto)(scale, alpha)
+
+
+@defterm.register
+def _embed_poisson(d: dist.Poisson) -> Term[TorchDistribution]:
+    with interpreter({}):
+        rate = d.rate
+
+    return _register_distribution_op(dist.Poisson)(rate)
+
+
+@defterm.register(dist.RelaxedBernoulli)
+@defterm.register(dist.RelaxedOneHotCategorical)
+def _embed_relaxed(d: TorchDistribution) -> Term[TorchDistribution]:
+    with interpreter({}):
+        temperature = d.temperature
+        probs = d.probs
+
+    return _register_distribution_op(type(d))(temperature, probs)
+
+
+@defterm.register
+def _embed_uniform(d: dist.Uniform) -> Term[TorchDistribution]:
+    with interpreter({}):
+        low = d.low
+        high = d.high
+
+    return _register_distribution_op(dist.Uniform)(low, high)
+
+
+@defterm.register
+def _embed_von_mises(d: dist.VonMises) -> Term[TorchDistribution]:
+    with interpreter({}):
+        loc = d.loc
+        concentration = d.concentration
+
+    return _register_distribution_op(dist.VonMises)(loc, concentration)
+
+
+@defterm.register
+def _embed_weibull(d: dist.Weibull) -> Term[TorchDistribution]:
+    with interpreter({}):
+        scale = d.scale
+        concentration = d.concentration
+
+    return _register_distribution_op(dist.Weibull)(scale, concentration)
+
+
+@defterm.register
+def _embed_wishart(d: dist.Wishart) -> Term[TorchDistribution]:
+    with interpreter({}):
+        df = d.df
+        scale_tril = d.scale_tril
+
+    return _register_distribution_op(dist.Wishart)(df, scale_tril)
+
+
+@defterm.register
+def _embed_delta(d: dist.Delta) -> Term[TorchDistribution]:
+    with interpreter({}):
+        v = d.v
+        log_density = d.log_density
+        event_dim = d.event_dim
+
+    return _register_distribution_op(dist.Delta)(
+        v, log_density=log_density, event_dim=event_dim
+    )


 def pyro_module_shim(
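Taken together, the `bind_dims`/`unbind_dims` registrations and the `defterm` embeddings above replace the old `PositionalDistribution` and `NamedDistribution` wrappers: a distribution is converted by rebuilding it from its constructor term with renamed or repositioned parameters. A minimal round-trip sketch (an assumption about intended usage, not taken from the package's documentation):

import pyro.distributions as dist
import torch

import effectful.handlers.pyro  # noqa: F401  (importing the module installs the registrations in this diff)
from effectful.handlers.torch import bind_dims, sizesof, unbind_dims
from effectful.ops.syntax import defop

i = defop(torch.Tensor)  # index variable naming the batch dimension of size 3

d_pos = dist.Normal(torch.zeros(3), torch.ones(3))
d_named = unbind_dims(d_pos, i)  # batch dimension 0 becomes the free index i
# sizesof(d_named) == {i: 3}; the positional batch_shape no longer includes it

d_back = bind_dims(d_named, i)   # the named dimension is bound back to a positional one
# d_back.batch_shape == torch.Size([3])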