qpytorch-0.1-py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- qpytorch/__init__.py +327 -0
- qpytorch/constraints/__init__.py +3 -0
- qpytorch/distributions/__init__.py +21 -0
- qpytorch/distributions/delta.py +86 -0
- qpytorch/distributions/multitask_multivariate_qexponential.py +435 -0
- qpytorch/distributions/multivariate_qexponential.py +581 -0
- qpytorch/distributions/power.py +113 -0
- qpytorch/distributions/qexponential.py +153 -0
- qpytorch/functions/__init__.py +58 -0
- qpytorch/kernels/__init__.py +80 -0
- qpytorch/kernels/grid_interpolation_kernel.py +213 -0
- qpytorch/kernels/inducing_point_kernel.py +151 -0
- qpytorch/kernels/kernel.py +695 -0
- qpytorch/kernels/matern32_kernel_grad.py +155 -0
- qpytorch/kernels/matern52_kernel_grad.py +194 -0
- qpytorch/kernels/matern52_kernel_gradgrad.py +248 -0
- qpytorch/kernels/polynomial_kernel_grad.py +88 -0
- qpytorch/kernels/qexponential_symmetrized_kl_kernel.py +61 -0
- qpytorch/kernels/rbf_kernel_grad.py +125 -0
- qpytorch/kernels/rbf_kernel_gradgrad.py +186 -0
- qpytorch/kernels/rff_kernel.py +153 -0
- qpytorch/lazy/__init__.py +9 -0
- qpytorch/likelihoods/__init__.py +66 -0
- qpytorch/likelihoods/bernoulli_likelihood.py +75 -0
- qpytorch/likelihoods/beta_likelihood.py +76 -0
- qpytorch/likelihoods/gaussian_likelihood.py +472 -0
- qpytorch/likelihoods/laplace_likelihood.py +59 -0
- qpytorch/likelihoods/likelihood.py +437 -0
- qpytorch/likelihoods/likelihood_list.py +60 -0
- qpytorch/likelihoods/multitask_gaussian_likelihood.py +542 -0
- qpytorch/likelihoods/multitask_qexponential_likelihood.py +545 -0
- qpytorch/likelihoods/noise_models.py +184 -0
- qpytorch/likelihoods/qexponential_likelihood.py +494 -0
- qpytorch/likelihoods/softmax_likelihood.py +97 -0
- qpytorch/likelihoods/student_t_likelihood.py +90 -0
- qpytorch/means/__init__.py +23 -0
- qpytorch/metrics/__init__.py +17 -0
- qpytorch/mlls/__init__.py +53 -0
- qpytorch/mlls/_approximate_mll.py +79 -0
- qpytorch/mlls/deep_approximate_mll.py +30 -0
- qpytorch/mlls/deep_predictive_log_likelihood.py +32 -0
- qpytorch/mlls/exact_marginal_log_likelihood.py +96 -0
- qpytorch/mlls/gamma_robust_variational_elbo.py +106 -0
- qpytorch/mlls/inducing_point_kernel_added_loss_term.py +69 -0
- qpytorch/mlls/kl_qexponential_added_loss_term.py +41 -0
- qpytorch/mlls/leave_one_out_pseudo_likelihood.py +73 -0
- qpytorch/mlls/marginal_log_likelihood.py +48 -0
- qpytorch/mlls/predictive_log_likelihood.py +76 -0
- qpytorch/mlls/sum_marginal_log_likelihood.py +40 -0
- qpytorch/mlls/variational_elbo.py +77 -0
- qpytorch/models/__init__.py +72 -0
- qpytorch/models/approximate_qep.py +115 -0
- qpytorch/models/deep_qeps/__init__.py +22 -0
- qpytorch/models/deep_qeps/deep_qep.py +155 -0
- qpytorch/models/deep_qeps/dspp.py +114 -0
- qpytorch/models/exact_prediction_strategies.py +880 -0
- qpytorch/models/exact_qep.py +349 -0
- qpytorch/models/model_list.py +100 -0
- qpytorch/models/pyro/__init__.py +28 -0
- qpytorch/models/pyro/_pyro_mixin.py +57 -0
- qpytorch/models/pyro/distributions/__init__.py +5 -0
- qpytorch/models/pyro/pyro_qep.py +105 -0
- qpytorch/models/qep.py +7 -0
- qpytorch/models/qeplvm/__init__.py +6 -0
- qpytorch/models/qeplvm/bayesian_qeplvm.py +40 -0
- qpytorch/models/qeplvm/latent_variable.py +102 -0
- qpytorch/module.py +30 -0
- qpytorch/optim/__init__.py +5 -0
- qpytorch/priors/__init__.py +42 -0
- qpytorch/priors/qep_priors.py +81 -0
- qpytorch/test/__init__.py +22 -0
- qpytorch/test/base_likelihood_test_case.py +106 -0
- qpytorch/test/model_test_case.py +150 -0
- qpytorch/test/variational_test_case.py +400 -0
- qpytorch/utils/__init__.py +38 -0
- qpytorch/utils/warnings.py +37 -0
- qpytorch/variational/__init__.py +47 -0
- qpytorch/variational/_variational_distribution.py +61 -0
- qpytorch/variational/_variational_strategy.py +391 -0
- qpytorch/variational/additive_grid_interpolation_variational_strategy.py +90 -0
- qpytorch/variational/batch_decoupled_variational_strategy.py +256 -0
- qpytorch/variational/cholesky_variational_distribution.py +65 -0
- qpytorch/variational/ciq_variational_strategy.py +352 -0
- qpytorch/variational/delta_variational_distribution.py +41 -0
- qpytorch/variational/grid_interpolation_variational_strategy.py +113 -0
- qpytorch/variational/independent_multitask_variational_strategy.py +114 -0
- qpytorch/variational/lmc_variational_strategy.py +248 -0
- qpytorch/variational/mean_field_variational_distribution.py +58 -0
- qpytorch/variational/multitask_variational_strategy.py +317 -0
- qpytorch/variational/natural_variational_distribution.py +152 -0
- qpytorch/variational/nearest_neighbor_variational_strategy.py +487 -0
- qpytorch/variational/orthogonally_decoupled_variational_strategy.py +128 -0
- qpytorch/variational/tril_natural_variational_distribution.py +130 -0
- qpytorch/variational/uncorrelated_multitask_variational_strategy.py +114 -0
- qpytorch/variational/unwhitened_variational_strategy.py +225 -0
- qpytorch/variational/variational_strategy.py +280 -0
- qpytorch/version.py +4 -0
- qpytorch-0.1.dist-info/LICENSE +21 -0
- qpytorch-0.1.dist-info/METADATA +177 -0
- qpytorch-0.1.dist-info/RECORD +102 -0
- qpytorch-0.1.dist-info/WHEEL +5 -0
- qpytorch-0.1.dist-info/top_level.txt +1 -0
qpytorch/__init__.py
ADDED
@@ -0,0 +1,327 @@
#!/usr/bin/env python3

from typing import Optional, Tuple, Union

import linear_operator
import torch
from linear_operator import LinearOperator
from torch import Tensor

from gpytorch import (
    beta_features,
    settings,
)
from . import (
    distributions,
    kernels,
    lazy,
    likelihoods,
    means,
    metrics,
    mlls,
    models,
    optim,
    priors,
    utils,
    variational,
)
from .functions import inv_matmul, log_normal_cdf, logdet, matmul  # Deprecated
from .mlls import ExactMarginalLogLikelihood
from gpytorch.module import Module

Anysor = Union[LinearOperator, Tensor]


def add_diagonal(input: Anysor, diag: Tensor) -> LinearOperator:
    r"""
    Adds an element to the diagonal of the matrix :math:`\mathbf A`.

    :param input: The matrix (or batch of matrices) :math:`\mathbf A` (... x N x N).
    :param diag: Diagonal to add
    :return: :math:`\mathbf A + \text{diag}(\mathbf d)`, where :math:`\mathbf A` is the linear operator
        and :math:`\mathbf d` is the diagonal component
    """
    return linear_operator.add_diagonal(input=input, diag=diag)


def add_jitter(input: Anysor, jitter_val: float = 1e-3) -> Anysor:
    r"""
    Adds jitter (i.e., a small diagonal component) to the matrix :math:`\mathbf A`.
    This is equivalent to calling :meth:`~linear_operator.operators.LinearOperator.add_diagonal`
    with a scalar tensor.

    :param input: The matrix (or batch of matrices) :math:`\mathbf A` (... x N x N).
    :param jitter_val: The diagonal component to add
    :return: :math:`\mathbf A + \alpha \mathbf I`, where :math:`\mathbf A` is the linear operator
        and :math:`\alpha` is :attr:`jitter_val`.
    """
    return linear_operator.add_jitter(input=input, jitter_val=jitter_val)


def diagonalization(input: Anysor, method: Optional[str] = None) -> Tuple[Tensor, Tensor]:
    r"""
    Returns a (usually partial) diagonalization of a symmetric positive definite matrix
    (or batch of matrices) :math:`\mathbf A`.
    Options are either "lanczos" or "symeig". "lanczos" runs Lanczos, while
    "symeig" runs LinearOperator.symeig.

    :param input: The matrix (or batch of matrices) :math:`\mathbf A` (... x N x N).
    :param method: Specify the method to use ("lanczos" or "symeig"). The method will be determined
        based on size if not specified.
    :return: eigenvalues and eigenvectors representing the diagonalization.
    """
    return linear_operator.diagonalization(input=input, method=method)


def dsmm(
    sparse_mat: Union[torch.sparse.HalfTensor, torch.sparse.FloatTensor, torch.sparse.DoubleTensor],
    dense_mat: Tensor,
) -> Tensor:
    r"""
    Performs the (batch) matrix multiplication :math:`\mathbf{SD}`,
    where :math:`\mathbf S` is a sparse matrix and :math:`\mathbf D` is a dense matrix.

    :param sparse_mat: Sparse matrix :math:`\mathbf S` (... x M x N)
    :param dense_mat: Dense matrix :math:`\mathbf D` (... x N x O)
    :return: :math:`\mathbf S \mathbf D` (... x M x O)
    """
    return linear_operator.dsmm(sparse_mat=sparse_mat, dense_mat=dense_mat)


def inv_quad(input: Anysor, inv_quad_rhs: Tensor, reduce_inv_quad: bool = True) -> Tensor:
    r"""
    Computes an inverse quadratic form (w.r.t. :math:`\mathbf A`) with several right hand sides, i.e.:

    .. math::
        \text{tr}\left( \mathbf R^\top \mathbf A^{-1} \mathbf R \right),

    where :math:`\mathbf A` is a positive definite matrix (or batch of matrices) and :math:`\mathbf R`
    represents the right hand sides (:attr:`inv_quad_rhs`).

    If :attr:`reduce_inv_quad` is set to false (and :attr:`inv_quad_rhs` is supplied),
    the function instead computes

    .. math::
        \text{diag}\left( \mathbf R^\top \mathbf A^{-1} \mathbf R \right).

    :param input: :math:`\mathbf A` - the positive definite matrix (... x N x N)
    :param inv_quad_rhs: :math:`\mathbf R` - the right hand sides of the inverse quadratic term (... x N x M)
    :param reduce_inv_quad: Whether to compute
        :math:`\text{tr}\left( \mathbf R^\top \mathbf A^{-1} \mathbf R \right)`
        or :math:`\text{diag}\left( \mathbf R^\top \mathbf A^{-1} \mathbf R \right)`.
    :returns: The inverse quadratic term.
        If `reduce_inv_quad=True`, the inverse quadratic term is of shape (...). Otherwise, it is (... x M).
    """
    return linear_operator.inv_quad(input=input, inv_quad_rhs=inv_quad_rhs, reduce_inv_quad=reduce_inv_quad)


def inv_quad_logdet(
    input: Anysor,
    inv_quad_rhs: Optional[Tensor] = None,
    logdet: bool = False,
    reduce_inv_quad: bool = True,
) -> Tuple[Tensor, Tensor]:
    r"""
    Calls both :func:`inv_quad` and :func:`logdet` on a positive definite matrix (or batch) :math:`\mathbf A`.
    However, calling this method is far more efficient and stable than calling each method independently.

    :param input: :math:`\mathbf A` - the positive definite matrix (... x N x N)
    :param inv_quad_rhs: :math:`\mathbf R` - the right hand sides of the inverse quadratic term (... x N x M)
    :param logdet: Whether or not to compute the
        logdet term :math:`\log \vert \mathbf A \vert`.
    :param reduce_inv_quad: Whether to compute
        :math:`\text{tr}\left( \mathbf R^\top \mathbf A^{-1} \mathbf R \right)`
        or :math:`\text{diag}\left( \mathbf R^\top \mathbf A^{-1} \mathbf R \right)`.
    :returns: The inverse quadratic term (or None), and the logdet term (or None).
        If `reduce_inv_quad=True`, the inverse quadratic term is of shape (...). Otherwise, it is (... x M).
    """
    return linear_operator.inv_quad_logdet(
        input=input,
        inv_quad_rhs=inv_quad_rhs,
        logdet=logdet,
        reduce_inv_quad=reduce_inv_quad,
    )


def pivoted_cholesky(
    input: Anysor,
    rank: int,
    error_tol: Optional[float] = None,
    return_pivots: bool = False,
) -> Union[Tensor, Tuple[Tensor, Tensor]]:
    r"""
    Performs a partial pivoted Cholesky factorization of a positive definite matrix
    (or batch of matrices): :math:`\mathbf L \mathbf L^\top = \mathbf A`.
    The partial pivoted Cholesky factor :math:`\mathbf L \in \mathbb R^{N \times \text{rank}}`
    forms a low rank approximation to the LinearOperator.

    The pivots are selected greedily, corresponding to the maximum diagonal element in the
    residual after each Cholesky iteration. See `Harbrecht et al., 2012`_.

    :param input: The matrix (or batch of matrices) :math:`\mathbf A` (... x N x N).
    :param rank: The size of the partial pivoted Cholesky factor.
    :param error_tol: Defines an optional stopping criterion.
        If the residual of the factorization is less than :attr:`error_tol`, then the
        factorization will exit early. This will result in a :math:`\leq \text{rank}` factor.
    :param return_pivots: Whether or not to return the pivots alongside
        the partial pivoted Cholesky factor.
    :return: The `... x N x rank` factor (and optionally the `... x N` pivots if :attr:`return_pivots` is True).

    .. _Harbrecht et al., 2012:
        https://www.sciencedirect.com/science/article/pii/S0168927411001814
    """
    return linear_operator.pivoted_cholesky(input=input, rank=rank, error_tol=error_tol, return_pivots=return_pivots)


def root_decomposition(input: Anysor, method: Optional[str] = None) -> LinearOperator:
    r"""
    Returns a (usually low-rank) root decomposition linear operator of the
    positive definite matrix (or batch of matrices) :math:`\mathbf A`.
    This can be used for sampling from a Gaussian distribution, or for obtaining a
    low-rank version of a matrix.

    :param input: The matrix (or batch of matrices) :math:`\mathbf A` (... x N x N).
    :param method: Which method to use to perform the root decomposition. Choices are:
        "cholesky", "lanczos", "symeig", "pivoted_cholesky", or "svd".
    :return: A tensor :math:`\mathbf R` such that :math:`\mathbf R \mathbf R^\top \approx \mathbf A`.
    """
    return linear_operator.root_decomposition(input=input, method=method)


def root_inv_decomposition(
    input: Anysor,
    initial_vectors: Optional[Tensor] = None,
    test_vectors: Optional[Tensor] = None,
    method: Optional[str] = None,
) -> LinearOperator:
    r"""
    Returns a (usually low-rank) inverse root decomposition linear operator
    of the PSD LinearOperator :math:`\mathbf A`.
    This can be used for sampling from a Gaussian distribution, or for obtaining a
    low-rank version of a matrix.

    The root_inv_decomposition is performed using a partial Lanczos tridiagonalization.

    :param input: The matrix (or batch of matrices) :math:`\mathbf A` (... x N x N).
    :param initial_vectors: Vectors used to initialize the Lanczos decomposition.
        The best initialization vector (determined by :attr:`test_vectors`) will be chosen.
    :param test_vectors: Vectors used to test the accuracy of the decomposition.
    :param method: Root decomposition method to use (symeig, diagonalization, lanczos, or cholesky).
    :return: A tensor :math:`\mathbf R` such that :math:`\mathbf R \mathbf R^\top \approx \mathbf A^{-1}`.
    """
    return linear_operator.root_inv_decomposition(
        input=input,
        initial_vectors=initial_vectors,
        test_vectors=test_vectors,
        method=method,
    )


def solve(input: Anysor, rhs: Tensor, lhs: Optional[Tensor] = None) -> Tensor:
    r"""
    Given a positive definite matrix (or batch of matrices) :math:`\mathbf A`,
    computes a linear solve with right hand side :math:`\mathbf R`:

    .. math::
        \begin{equation}
            \mathbf A^{-1} \mathbf R,
        \end{equation}

    where :math:`\mathbf R` is :attr:`rhs` and :math:`\mathbf A` is the LinearOperator.

    .. note::
        Unlike :func:`torch.linalg.solve`, this function can take an optional :attr:`lhs` argument.
        If this is supplied, the function computes

        .. math::
            \begin{equation}
                \mathbf L \mathbf A^{-1} \mathbf R,
            \end{equation}

        where :math:`\mathbf L` is :attr:`lhs`.
        Supplying this can reduce the number of solver calls required in the backward pass.

    :param input: The matrix (or batch of matrices) :math:`\mathbf A` (... x N x N).
    :param rhs: :math:`\mathbf R` - the right hand side
    :param lhs: :math:`\mathbf L` - the left hand side
    :return: :math:`\mathbf A^{-1} \mathbf R` or :math:`\mathbf L \mathbf A^{-1} \mathbf R`.
    """
    return linear_operator.solve(input=input, rhs=rhs, lhs=lhs)


def sqrt_inv_matmul(input: Anysor, rhs: Tensor, lhs: Optional[Tensor] = None) -> Tensor:
    r"""
    Given a positive definite matrix (or batch of matrices) :math:`\mathbf A`
    and a right hand side :math:`\mathbf R`,
    computes

    .. math::
        \begin{equation}
            \mathbf A^{-1/2} \mathbf R.
        \end{equation}

    If :attr:`lhs` is supplied, computes

    .. math::
        \begin{equation}
            \mathbf L \mathbf A^{-1/2} \mathbf R,
        \end{equation}

    where :math:`\mathbf L` is :attr:`lhs`.
    (Supplying :attr:`lhs` can reduce the number of solver calls required in the backward pass.)

    :param input: The matrix (or batch of matrices) :math:`\mathbf A` (... x N x N).
    :param rhs: :math:`\mathbf R` - the right hand side
    :param lhs: :math:`\mathbf L` - the left hand side
    :return: :math:`\mathbf A^{-1/2} \mathbf R` or :math:`\mathbf L \mathbf A^{-1/2} \mathbf R`.
    """
    return linear_operator.sqrt_inv_matmul(input=input, rhs=rhs, lhs=lhs)


# Read version number as written by setuptools_scm
try:
    from qpytorch.version import version as __version__
except Exception:  # pragma: no cover
    __version__ = "Unknown"  # pragma: no cover


__all__ = [
    # Submodules
    "distributions",
    "kernels",
    "lazy",
    "likelihoods",
    "means",
    "metrics",
    "mlls",
    "models",
    "optim",
    "priors",
    "utils",
    "variational",
    # Classes
    "Module",
    "ExactMarginalLogLikelihood",
    # Functions
    "add_diagonal",
    "add_jitter",
    "dsmm",
    "inv_quad",
    "inv_quad_logdet",
    "pivoted_cholesky",
    "root_decomposition",
    "root_inv_decomposition",
    "solve",
    "sqrt_inv_matmul",
    # Context managers
    "beta_features",
    "settings",
    # Other
    "__version__",
    # Deprecated
    "inv_matmul",
    "logdet",
    "log_normal_cdf",
    "matmul",
]
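The functions above are thin functional wrappers that keep a gpytorch-style API while delegating the numerics to linear_operator, so each accepts either a plain Tensor or a LinearOperator. A minimal usage sketch (not part of the package; it assumes the wheel installs an importable qpytorch module, and the matrix and shapes are illustrative only):

import torch
import qpytorch

# Build a small synthetic symmetric positive definite matrix
A = torch.randn(5, 5)
A = A @ A.T + 0.1 * torch.eye(5)
rhs = torch.randn(5, 3)

A_jittered = qpytorch.add_jitter(A, jitter_val=1e-3)  # A + 1e-3 * I
solution = qpytorch.solve(A_jittered, rhs)            # A^{-1} R
inv_quad_term, logdet_term = qpytorch.inv_quad_logdet(
    A_jittered, inv_quad_rhs=rhs, logdet=True
)                                                     # tr(R^T A^{-1} R) and log|A|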
qpytorch/distributions/__init__.py
ADDED
@@ -0,0 +1,21 @@
#!/usr/bin/env python3

from .delta import Delta
from gpytorch.distributions.distribution import Distribution
from .qexponential import QExponential
from gpytorch.distributions.multivariate_normal import MultivariateNormal
from gpytorch.distributions.multitask_multivariate_normal import MultitaskMultivariateNormal
from .multivariate_qexponential import MultivariateQExponential
from .multitask_multivariate_qexponential import MultitaskMultivariateQExponential
from .power import Power

# Get the set of distributions from either PyTorch or Pyro
try:
    # If pyro is installed, use that set of base distributions
    import pyro.distributions as base_distributions
except ImportError:
    # Otherwise, use PyTorch
    import torch.distributions as base_distributions


__all__ = ["Delta", "QExponential", "Distribution", "MultivariateNormal", "MultitaskMultivariateNormal", "MultivariateQExponential", "MultitaskMultivariateQExponential", "Power", "base_distributions"]
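The base_distributions alias resolves to pyro.distributions when pyro is importable and falls back to torch.distributions otherwise; the core distribution classes exist under both backends, so downstream code can stay backend-agnostic. A small sketch under the same installed-package assumption as above:

from qpytorch.distributions import base_distributions

noise = base_distributions.Normal(0.0, 1.0)  # available from either backend
samples = noise.sample((4,))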
qpytorch/distributions/delta.py
ADDED
@@ -0,0 +1,86 @@
#!/usr/bin/env python3

import numbers

import torch
from torch.distributions import constraints
from torch.distributions.kl import register_kl

from gpytorch.distributions.distribution import Distribution
from gpytorch.distributions.multivariate_normal import MultivariateNormal
from .multivariate_qexponential import MultivariateQExponential

try:
    from pyro.distributions import Delta

except ImportError:
    # Mostly copied from https://github.com/pyro-ppl/pyro/blob/dev/pyro/distributions/delta.py
    class Delta(Distribution):
        """
        Degenerate discrete distribution (a single point).

        Discrete distribution that assigns probability one to the single element in
        its support. A Delta distribution parameterized by a random choice should not
        be used with MCMC based inference, as doing so produces incorrect results.

        :param torch.Tensor v: The single support element.
        :param torch.Tensor log_density: An optional density for this Delta. This
            is useful to keep the class of :class:`Delta` distributions closed
            under differentiable transformation.
        :param int event_dim: Optional event dimension, defaults to zero.
        """

        arg_constraints = {"v": constraints.real, "log_density": constraints.real}
        has_rsample = True

        def __init__(self, v, log_density=0.0, event_dim=0, validate_args=None):
            if event_dim > v.dim():
                raise ValueError("Expected event_dim <= v.dim(), actual {} vs {}".format(event_dim, v.dim()))
            batch_dim = v.dim() - event_dim
            batch_shape = v.shape[:batch_dim]
            event_shape = v.shape[batch_dim:]
            if isinstance(log_density, numbers.Number):
                log_density = torch.full(batch_shape, log_density, dtype=v.dtype, device=v.device)
            elif validate_args and log_density.shape != batch_shape:
                raise ValueError("Expected log_density.shape = {}, actual {}".format(batch_shape, log_density.shape))
            self.v = v
            self.log_density = log_density
            super().__init__(batch_shape, event_shape, validate_args=validate_args)

        def expand(self, batch_shape, _instance=None):
            new = self._get_checked_instance(Delta, _instance)
            batch_shape = torch.Size(batch_shape)
            new.v = self.v.expand(batch_shape + self.event_shape)
            new.log_density = self.log_density.expand(batch_shape)
            # Initialize the new (expanded) instance, not self
            super(Delta, new).__init__(batch_shape, self.event_shape, validate_args=False)
            new._validate_args = self._validate_args
            return new

        def rsample(self, sample_shape=torch.Size()):
            shape = sample_shape + self.v.shape
            return self.v.expand(shape)

        def log_prob(self, x):
            v = self.v.expand(self.batch_shape + self.event_shape)
            log_prob = (x == v).type(x.dtype).log()
            if len(self.event_shape):
                log_prob = log_prob.sum(list(range(-1, -len(self.event_shape) - 1, -1)))
            return log_prob + self.log_density

        @property
        def mean(self):
            return self.v

        @property
        def variance(self):
            return torch.zeros_like(self.v)


@register_kl(Delta, MultivariateNormal)
def kl_mvn_mvn(p_dist, q_dist):
    return -q_dist.log_prob(p_dist.mean)


@register_kl(Delta, MultivariateQExponential)
def kl_qep_qep(p_dist, q_dist):
    return -q_dist.log_prob(p_dist.mean)
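A quick sketch of the fallback Delta defined above (pyro's own Delta, used when pyro is installed, behaves the same way); again assuming an importable qpytorch package:

import torch
from qpytorch.distributions import Delta

d = Delta(torch.tensor([1.0, 2.0]), event_dim=1)  # a single 2-d support point
print(d.mean)                                     # tensor([1., 2.])
print(d.rsample(torch.Size([3])).shape)           # torch.Size([3, 2])
print(d.log_prob(torch.tensor([1.0, 2.0])))      # tensor(0.): log(1) summed over the event dim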