PyPI - google-meridian - Versions diffs - 1.2.0__py3-none-any.whl → 1.3.0__py3-none-any.whl - Mend

google-meridian 1.2.0__py3-none-any.whl → 1.3.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (45) hide show

{google_meridian-1.2.0.dist-info → google_meridian-1.3.0.dist-info}/METADATA +10 -10
google_meridian-1.3.0.dist-info/RECORD +62 -0
meridian/analysis/__init__.py +2 -0
meridian/analysis/analyzer.py +280 -142
meridian/analysis/formatter.py +2 -2
meridian/analysis/optimizer.py +353 -169
meridian/analysis/review/__init__.py +20 -0
meridian/analysis/review/checks.py +721 -0
meridian/analysis/review/configs.py +110 -0
meridian/analysis/review/constants.py +40 -0
meridian/analysis/review/results.py +544 -0
meridian/analysis/review/reviewer.py +186 -0
meridian/analysis/summarizer.py +14 -12
meridian/analysis/templates/chips.html.jinja +12 -0
meridian/analysis/test_utils.py +27 -5
meridian/analysis/visualizer.py +45 -50
meridian/backend/__init__.py +698 -55
meridian/backend/config.py +75 -16
meridian/backend/test_utils.py +127 -1
meridian/constants.py +52 -11
meridian/data/input_data.py +7 -2
meridian/data/test_utils.py +5 -3
meridian/mlflow/autolog.py +2 -2
meridian/model/__init__.py +1 -0
meridian/model/adstock_hill.py +10 -9
meridian/model/eda/__init__.py +3 -0
meridian/model/eda/constants.py +21 -0
meridian/model/eda/eda_engine.py +1580 -84
meridian/model/eda/eda_outcome.py +200 -0
meridian/model/eda/eda_spec.py +84 -0
meridian/model/eda/meridian_eda.py +220 -0
meridian/model/knots.py +56 -50
meridian/model/media.py +10 -8
meridian/model/model.py +79 -16
meridian/model/model_test_data.py +53 -9
meridian/model/posterior_sampler.py +398 -391
meridian/model/prior_distribution.py +114 -39
meridian/model/prior_sampler.py +146 -90
meridian/model/spec.py +7 -8
meridian/model/transformers.py +16 -8
meridian/version.py +1 -1
google_meridian-1.2.0.dist-info/RECORD +0 -52
{google_meridian-1.2.0.dist-info → google_meridian-1.3.0.dist-info}/WHEEL +0 -0
{google_meridian-1.2.0.dist-info → google_meridian-1.3.0.dist-info}/licenses/LICENSE +0 -0
{google_meridian-1.2.0.dist-info → google_meridian-1.3.0.dist-info}/top_level.txt +0 -0

meridian/model/prior_distribution.py CHANGED Viewed

@@ -19,6 +19,7 @@ used by the Meridian model object.
 """
 from __future__ import annotations
 from collections.abc import MutableMapping, Sequence
 import dataclasses
 from typing import Any
@@ -26,7 +27,6 @@ import warnings
 from meridian import backend
 from meridian import constants
 import numpy as np
@@ -34,6 +34,8 @@ __all__ = [
     'IndependentMultivariateDistribution',
     'PriorDistribution',
     'distributions_are_equal',
+    'lognormal_dist_from_mean_std',
+    'lognormal_dist_from_range',
 ]
@@ -175,14 +177,14 @@ class PriorDistribution:
     xi_n: Prior distribution on the hierarchical standard deviation of
       `gamma_gn` which is the coefficient on non-media channel `n` for geo `g`.
       Hierarchy is defined over geos. Default distribution is `HalfNormal(5.0)`.
-    alpha_m: Prior distribution on the `geometric decay` Adstock parameter for
+    alpha_m: Prior distribution on the Adstock decay parameter for media input.
+      Default distribution is `Uniform(0.0, 1.0)`.
+    alpha_rf: Prior distribution on the Adstock decay parameter for RF input.
+      Default distribution is `Uniform(0.0, 1.0)`.
+    alpha_om: Prior distribution on the Adstock decay parameter for organic
       media input. Default distribution is `Uniform(0.0, 1.0)`.
-    alpha_rf: Prior distribution on the `geometric decay` Adstock parameter for
-      RF input. Default distribution is `Uniform(0.0, 1.0)`.
-    alpha_om: Prior distribution on the `geometric decay` Adstock parameter for
-      organic media input. Default distribution is `Uniform(0.0, 1.0)`.
-    alpha_orf: Prior distribution on the `geometric decay` Adstock parameter for
-      organic RF input. Default distribution is `Uniform(0.0, 1.0)`.
+    alpha_orf: Prior distribution on the Adstock decay parameter for organic RF
+      input. Default distribution is `Uniform(0.0, 1.0)`.
     ec_m: Prior distribution on the `half-saturation` Hill parameter for media
       input. Default distribution is `TruncatedNormal(0.8, 0.8, 0.1, 10)`.
     ec_rf: Prior distribution on the `half-saturation` Hill parameter for RF
@@ -772,7 +774,7 @@ class PriorDistribution:
     )
     if (
         not isinstance(self.slope_m, backend.tfd.Deterministic)
-        or (np.isscalar(self.slope_m.loc.numpy()) and self.slope_m.loc != 1.0)
+        or (backend.rank(self.slope_m.loc) == 0 and self.slope_m.loc != 1.0)
         or (
             self.slope_m.batch_shape.as_list()
             and any(x != 1.0 for x in self.slope_m.loc)
@@ -791,7 +793,7 @@ class PriorDistribution:
     )
     if (
         not isinstance(self.slope_om, backend.tfd.Deterministic)
-        or (np.isscalar(self.slope_om.loc.numpy()) and self.slope_om.loc != 1.0)
+        or (backend.rank(self.slope_om.loc) == 0 and self.slope_om.loc != 1.0)
         or (
             self.slope_om.batch_shape.as_list()
             and any(x != 1.0 for x in self.slope_om.loc)
@@ -1000,8 +1002,7 @@ class IndependentMultivariateDistribution(backend.tfd.Distribution):
     """Check for deterministic distributions and raise an error if found."""
     if any(
-        isinstance(dist, backend.tfd.Deterministic)
-        for dist in distributions
+        isinstance(dist, backend.tfd.Deterministic) for dist in distributions
     ):
       raise ValueError(
           f'{self.__class__.__name__} cannot contain `Deterministic` '
@@ -1029,9 +1030,7 @@ class IndependentMultivariateDistribution(backend.tfd.Distribution):
         [dist.batch_shape_tensor() for dist in self._distributions],
         axis=0,
     )
-    return backend.reduce_sum(
-        distribution_batch_shape_tensors, keepdims=True
-    )
+    return backend.reduce_sum(distribution_batch_shape_tensors, keepdims=True)
   def _batch_shape(self):
     return backend.TensorShape(sum(self._distribution_batch_shapes))
@@ -1043,10 +1042,7 @@ class IndependentMultivariateDistribution(backend.tfd.Distribution):
   def _quantile(self, value):
     value = self._broadcast_value(value)
-    split_value = backend.split(
-        value,
-        self._distribution_batch_shapes, axis=-1
-        )
+    split_value = backend.split(value, self._distribution_batch_shapes, axis=-1)
     quantiles = [
         dist.quantile(sv) for dist, sv in zip(self._distributions, split_value)
     ]
@@ -1055,11 +1051,7 @@ class IndependentMultivariateDistribution(backend.tfd.Distribution):
   def _log_prob(self, value):
     value = self._broadcast_value(value)
-    split_value = backend.split(
-        value,
-        self._distribution_batch_shapes,
-        axis=-1
-        )
+    split_value = backend.split(value, self._distribution_batch_shapes, axis=-1)
     log_probs = [
         dist.log_prob(sv) for dist, sv in zip(self._distributions, split_value)
     ]
@@ -1068,11 +1060,7 @@ class IndependentMultivariateDistribution(backend.tfd.Distribution):
   def _log_cdf(self, value):
     value = self._broadcast_value(value)
-    split_value = backend.split(
-        value,
-        self._distribution_batch_shapes,
-        axis=-1
-        )
+    split_value = backend.split(value, self._distribution_batch_shapes, axis=-1)
     log_cdfs = [
         dist.log_cdf(sv) for dist, sv in zip(self._distributions, split_value)
@@ -1173,6 +1161,87 @@ def distributions_are_equal(
   return True
+def lognormal_dist_from_mean_std(
+    mean: float | Sequence[float], std: float | Sequence[float]
+) -> backend.tfd.LogNormal:
+  """Define a lognormal distribution from its mean and standard deviation.
+  This function parameterizes lognormal distributions by their mean and
+  standard deviation.
+  Args:
+    mean: A float or array-like object defining the distribution mean. Must be
+      positive.
+    std: A float or array-like object defining the distribution standard
+      deviation. Must be non-negative.
+  Returns:
+    A `backend.tfd.LogNormal` object with the input mean and standard deviation.
+  """
+  mean = np.asarray(mean)
+  std = np.asarray(std)
+  mu = np.log(mean) - 0.5 * np.log((std / mean) ** 2 + 1)
+  sigma = np.sqrt(np.log((std / mean) ** 2 + 1))
+  return backend.tfd.LogNormal(mu, sigma)
+def lognormal_dist_from_range(
+    low: float | Sequence[float],
+    high: float | Sequence[float],
+    mass_percent: float | Sequence[float] = 0.95,
+) -> backend.tfd.LogNormal:
+  """Define a LogNormal distribution from a specified range.
+  This function parameterizes lognormal distributions by the bounds of a range,
+  so that the specified probability mass falls within the bounds defined by
+  `low` and `high`. The probability mass is symmetric about the median. For
+  example, to define a lognormal distribution with a 95% probability mass of
+  (1, 10), use:
+  ```python
+  lognormal = lognormal_dist_from_range(1.0, 10.0, mass_percent=0.95)
+  ```
+  Args:
+    low: Float or array-like denoting the lower bound of the range. Values must
+      be non-negative.
+    high: Float or array-like denoting the upper bound of range. Values must be
+      non-negative.
+    mass_percent: Float or array-like denoting the probability mass. Values must
+      be between 0 and 1 (exclusive). Default: 0.95.
+  Returns:
+    A `backend.tfd.LogNormal` object with the input percentage mass falling
+      within the given range.
+  """
+  low = np.asarray(low)
+  high = np.asarray(high)
+  mass_percent = np.asarray(mass_percent)
+  if not ((0.0 < low).all() and (low < high).all()):  # pytype: disable=attribute-error
+    raise ValueError("'low' and 'high' values must be non-negative and satisfy "
+                     "high > low.")
+  if not ((0.0 < mass_percent).all() and (mass_percent < 1.0).all()):  # pytype: disable=attribute-error
+    raise ValueError(
+        "'mass_percent' values must be between 0 and 1, exclusive."
+        )
+  normal = backend.tfd.Normal(0, 1)
+  mass_lower = 0.5 - (mass_percent / 2)
+  mass_upper = 0.5 + (mass_percent / 2)
+  sigma = np.log(high / low) / (
+      normal.quantile(mass_upper) - normal.quantile(mass_lower)
+  )
+  mu = np.log(high) - normal.quantile(mass_upper) * sigma
+  return backend.tfd.LogNormal(mu, sigma)
 def _convert_to_deterministic_0_distribution(
     distribution: backend.tfd.Distribution,
 ) -> backend.tfd.Distribution:
@@ -1257,26 +1326,31 @@ def _validate_support(
   """
   # Note that `tfp.distributions.BatchBroadcast` objects have a `distribution`
   # attribute that points to a `tfp.distributions.Distribution` object.
-  if isinstance(tfp_dist, backend.tfp.distributions.BatchBroadcast):
+  if isinstance(tfp_dist, backend.tfd.BatchBroadcast):
     tfp_dist = tfp_dist.distribution
   # Note that `tfp.distributions.Deterministic` does not have a `quantile`
   # method implemented, so the min and max values must be extracted from the
   # `loc` attribute instead.
-  if isinstance(
-      tfp_dist,
-      backend.tfp.python.distributions.deterministic.Deterministic
-  ):
+  if isinstance(tfp_dist, backend.tfd.Deterministic):
     support_min_vals = tfp_dist.loc
     support_max_vals = tfp_dist.loc
     for i in (0, 1):
-      if (
-          prevent_deterministic_prior_at_bounds[i]
-          and np.any(tfp_dist.loc == bounds[i])
+      if prevent_deterministic_prior_at_bounds[i] and np.any(
+          tfp_dist.loc == bounds[i]
       ):
         raise ValueError(
             f'{parameter_name} was assigned a point mass (deterministic) prior'
             f' at {bounds[i]}, which is not allowed.'
         )
+  elif isinstance(tfp_dist, backend.tfd.TruncatedNormal):
+    # TruncatedNormal quantile method is not reliable, particularly when the
+    # `low` or `high` value falls into extreme percentile of the untruncated
+    # distribution. Note that
+    # `TruncatedNormal.experimental_default_event_space_bijector()([-inf, inf])`
+    # returns the correct support range, so this method could be used if the
+    # `quantile` method is found to be unreliable for other distributions.
+    support_min_vals = tfp_dist.low
+    support_max_vals = tfp_dist.high
   else:
     try:
       support_min_vals = tfp_dist.quantile(0)
@@ -1284,9 +1358,9 @@ def _validate_support(
     except (AttributeError, NotImplementedError):
       warnings.warn(
           f'The prior distribution for {parameter_name} does not have a'
-          f' `quantile` method implemented, so the support range validation'
+          ' `quantile` method implemented, so the support range validation'
           f' was skipped. Confirm that your prior for {parameter_name} is'
-          f' appropriate.'
+          ' appropriate.'
       )
       return
   if np.any(support_min_vals < bounds[0]):
@@ -1300,6 +1374,7 @@ def _validate_support(
         f' greater than the parameter maximum {bounds[1]}.'
     )
 # Dictionary of parameters that have a limited parameter space. The tuple
 # contains the lower and upper bounds, respectively.
 _parameter_space_bounds = {

google-meridian 1.2.0__py3-none-any.whl → 1.3.0__py3-none-any.whl

google-meridian 1.2.0__py3-none-any.whl → 1.3.0__py3-none-any.whl