PyPI - pymc-extras - Versions diffs - 0.3.1__py3-none-any.whl → 0.4.1__py3-none-any.whl - Mend

pymc-extras 0.3.1__py3-none-any.whl → 0.4.1__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (35) hide show

pymc_extras/distributions/__init__.py +5 -5
pymc_extras/distributions/histogram_utils.py +1 -1
pymc_extras/inference/__init__.py +1 -1
pymc_extras/inference/laplace_approx/find_map.py +12 -5
pymc_extras/inference/laplace_approx/idata.py +4 -3
pymc_extras/inference/laplace_approx/laplace.py +6 -4
pymc_extras/inference/pathfinder/pathfinder.py +1 -2
pymc_extras/printing.py +1 -1
pymc_extras/statespace/__init__.py +4 -4
pymc_extras/statespace/core/__init__.py +1 -1
pymc_extras/statespace/core/representation.py +8 -8
pymc_extras/statespace/core/statespace.py +94 -23
pymc_extras/statespace/filters/__init__.py +3 -3
pymc_extras/statespace/filters/kalman_filter.py +16 -11
pymc_extras/statespace/models/SARIMAX.py +138 -74
pymc_extras/statespace/models/VARMAX.py +248 -57
pymc_extras/statespace/models/__init__.py +2 -2
pymc_extras/statespace/models/structural/__init__.py +21 -0
pymc_extras/statespace/models/structural/components/__init__.py +0 -0
pymc_extras/statespace/models/structural/components/autoregressive.py +213 -0
pymc_extras/statespace/models/structural/components/cycle.py +325 -0
pymc_extras/statespace/models/structural/components/level_trend.py +289 -0
pymc_extras/statespace/models/structural/components/measurement_error.py +154 -0
pymc_extras/statespace/models/structural/components/regression.py +257 -0
pymc_extras/statespace/models/structural/components/seasonality.py +628 -0
pymc_extras/statespace/models/structural/core.py +919 -0
pymc_extras/statespace/models/structural/utils.py +16 -0
pymc_extras/statespace/models/utilities.py +285 -0
pymc_extras/statespace/utils/constants.py +21 -18
pymc_extras/statespace/utils/data_tools.py +4 -3
{pymc_extras-0.3.1.dist-info → pymc_extras-0.4.1.dist-info}/METADATA +5 -4
{pymc_extras-0.3.1.dist-info → pymc_extras-0.4.1.dist-info}/RECORD +34 -25
pymc_extras/statespace/models/structural.py +0 -1679
{pymc_extras-0.3.1.dist-info → pymc_extras-0.4.1.dist-info}/WHEEL +0 -0
{pymc_extras-0.3.1.dist-info → pymc_extras-0.4.1.dist-info}/licenses/LICENSE +0 -0

pymc_extras/statespace/models/structural/components/measurement_error.py ADDED Viewed

@@ -0,0 +1,154 @@
+import numpy as np
+from pymc_extras.statespace.models.structural.core import Component
+class MeasurementError(Component):
+    r"""
+    Measurement error component for structural time series models.
+    This component adds observation noise to the model by introducing a variance parameter
+    that affects the observation covariance matrix H. Unlike other components, it has no
+    hidden states and should only be used in combination with other components.
+    Parameters
+    ----------
+    name : str, optional
+        Name of the measurement error component. Default is "MeasurementError".
+    observed_state_names : list[str] | None, optional
+        Names of the observed variables. If None, defaults to ["data"].
+    share_states: bool, default False
+        Whether latent states are shared across the observed states. If True, there will be only one set of latent
+        states, which are observed by all observed states. If False, each observed state has its own set of
+        latent states. This argument has no effect if `k_endog` is 1.
+    Notes
+    -----
+    The measurement error component models observation noise as:
+    .. math::
+        y_t = \text{signal}_t + \varepsilon_t, \quad \varepsilon_t \sim N(0, \sigma^2)
+    Where :math:`\text{signal}_t` is the true signal from other components and
+    :math:`\sigma^2` is the measurement error variance.
+    This component:
+        - Has no hidden states (k_states = 0)
+        - Has no innovations (k_posdef = 0)
+        - Adds a single parameter: sigma_{name}
+        - Modifies the observation covariance matrix H
+    Examples
+    --------
+    **Basic usage with trend component:**
+    .. code:: python
+        from pymc_extras.statespace import structural as st
+        import pymc as pm
+        import pytensor.tensor as pt
+        trend = st.LevelTrendComponent(order=2, innovations_order=1)
+        error = st.MeasurementError()
+        ss_mod = (trend + error).build()
+        # Use with PyMC
+        with pm.Model(coords=ss_mod.coords) as model:
+            P0 = pm.Deterministic('P0', pt.eye(ss_mod.k_states) * 10, dims=ss_mod.param_dims['P0'])
+            initial_trend = pm.Normal('initial_trend', sigma=10, dims=ss_mod.param_dims['initial_trend'])
+            sigma_obs = pm.Exponential('sigma_obs', 1, dims=ss_mod.param_dims['sigma_obs'])
+            ss_mod.build_statespace_graph(data)
+            idata = pm.sample()
+    **Multivariate measurement error:**
+    .. code:: python
+        # For multiple observed variables
+        # This creates separate measurement error variances for each variable
+        # sigma_obs_error will have shape (3,) for the three variables
+        error = st.MeasurementError(
+            name="obs_error",
+            observed_state_names=["gdp", "unemployment", "inflation"]
+        )
+    **Complete model example:**
+    .. code:: python
+        trend = st.LevelTrendComponent(order=2, innovations_order=1)
+        seasonal = st.TimeSeasonality(season_length=12, innovations=True)
+        error = st.MeasurementError()
+        model = (trend + seasonal + error).build()
+        # The model now includes:
+        # - Trend parameters: level_trend, sigma_trend
+        # - Seasonal parameters: seasonal_coefs, sigma_seasonal
+        # - Measurement error parameter: sigma_obs
+    See Also
+    --------
+    Component : Base class for all structural components.
+    StructuralTimeSeries : Complete model class.
+    """
+    def __init__(
+        self,
+        name: str = "MeasurementError",
+        observed_state_names: list[str] | None = None,
+        share_states: bool = False,
+    ):
+        if observed_state_names is None:
+            observed_state_names = ["data"]
+        self.share_states = share_states
+        k_endog = len(observed_state_names)
+        k_states = 0
+        k_posdef = 0
+        super().__init__(
+            name,
+            k_endog,
+            k_states,
+            k_posdef,
+            measurement_error=True,
+            combine_hidden_states=False,
+            observed_state_names=observed_state_names,
+            share_states=share_states,
+        )
+    def populate_component_properties(self):
+        k_endog = self.k_endog
+        k_endog_effective = 1 if self.share_states else k_endog
+        self.param_names = [f"sigma_{self.name}"]
+        self.param_dims = {}
+        self.coords = {}
+        if k_endog_effective > 1:
+            self.param_dims[f"sigma_{self.name}"] = (f"endog_{self.name}",)
+            self.coords[f"endog_{self.name}"] = self.observed_state_names
+        self.param_info = {
+            f"sigma_{self.name}": {
+                "shape": (k_endog_effective,) if k_endog_effective > 1 else (),
+                "constraints": "Positive",
+                "dims": (f"endog_{self.name}",) if k_endog_effective > 1 else None,
+            }
+        }
+    def make_symbolic_graph(self) -> None:
+        k_endog = self.k_endog
+        k_endog_effective = 1 if self.share_states else k_endog
+        sigma_shape = () if k_endog_effective == 1 else (k_endog_effective,)
+        error_sigma = self.make_and_register_variable(f"sigma_{self.name}", shape=sigma_shape)
+        diag_idx = np.diag_indices(self.k_endog)
+        idx = np.s_["obs_cov", diag_idx[0], diag_idx[1]]
+        self.ssm[idx] = error_sigma**2

pymc_extras/statespace/models/structural/components/regression.py ADDED Viewed

@@ -0,0 +1,257 @@
+import numpy as np
+from pytensor import tensor as pt
+from pymc_extras.statespace.models.structural.core import Component
+from pymc_extras.statespace.utils.constants import TIME_DIM
+class RegressionComponent(Component):
+    r"""
+    Regression component for exogenous variables in a structural time series model
+    Parameters
+    ----------
+    k_exog : int | None, default None
+        Number of exogenous variables to include in the regression. Must be specified if
+        state_names is not provided.
+    name : str | None, default "regression"
+        A name for this regression component. Used to label dimensions and coordinates.
+    state_names : list[str] | None, default None
+        List of strings for regression coefficient labels. If provided, must be of length
+        k_exog. If None and k_exog is provided, coefficients will be named
+        "{name}_1, {name}_2, ...".
+    observed_state_names : list[str] | None, default None
+        List of strings for observed state labels. If None, defaults to ["data"].
+    innovations : bool, default False
+        Whether to include stochastic innovations in the regression coefficients,
+        allowing them to vary over time. If True, coefficients follow a random walk.
+    share_states: bool, default False
+        Whether latent states are shared across the observed states. If True, there will be only one set of latent
+        states, which are observed by all observed states. If False, each observed state has its own set of
+        latent states.
+    Notes
+    -----
+    This component implements regression with exogenous variables in a structural time series
+    model. The regression component can be expressed as:
+    .. math::
+        y_t = \beta_t^T x_t + \epsilon_t
+    Where :math:`y_t` is the dependent variable, :math:`x_t` is the vector of exogenous
+    variables, :math:`\beta_t` is the vector of regression coefficients, and :math:`\epsilon_t`
+    is the error term.
+    When ``innovations=False`` (default), the coefficients are constant over time:
+    :math:`\beta_t = \beta_0` for all t.
+    When ``innovations=True``, the coefficients follow a random walk:
+    :math:`\beta_{t+1} = \beta_t + \eta_t`, where :math:`\eta_t \sim N(0, \Sigma_\beta)`.
+    The component supports both univariate and multivariate regression. In the multivariate
+    case, separate coefficients are estimated for each endogenous variable (i.e time series).
+    Examples
+    --------
+    Simple regression with constant coefficients:
+    .. code:: python
+        from pymc_extras.statespace import structural as st
+        import pymc as pm
+        import pytensor.tensor as pt
+        trend = st.LevelTrendComponent(order=1, innovations_order=1)
+        regression = st.RegressionComponent(k_exog=2, state_names=['intercept', 'slope'])
+        ss_mod = (trend + regression).build()
+        with pm.Model(coords=ss_mod.coords) as model:
+            # Prior for regression coefficients
+            betas = pm.Normal('betas', dims=ss_mod.param_dims['beta_regression'])
+            # Prior for trend innovations
+            sigma_trend = pm.Exponential('sigma_trend', 1)
+            ss_mod.build_statespace_graph(data)
+            idata = pm.sample()
+    Multivariate regression with time-varying coefficients:
+    - There are 2 exogenous variables (price and income effects)
+    - There are 2 endogenous variables (sales and revenue)
+    - The regression coefficients are allowed to vary over time (`innovations=True`)
+    .. code:: python
+        regression = st.RegressionComponent(
+            k_exog=2,
+            state_names=['price_effect', 'income_effect'],
+            observed_state_names=['sales', 'revenue'],
+            innovations=True
+        )
+        with pm.Model(coords=ss_mod.coords) as model:
+            betas = pm.Normal('betas', dims=ss_mod.param_dims['beta_regression'])
+            # Innovation variance for time-varying coefficients
+            sigma_beta = pm.Exponential('sigma_beta', 1, dims=ss_mod.param_dims['sigma_beta_regression'])
+            ss_mod.build_statespace_graph(data)
+            idata = pm.sample()
+    """
+    def __init__(
+        self,
+        k_exog: int | None = None,
+        name: str | None = "regression",
+        state_names: list[str] | None = None,
+        observed_state_names: list[str] | None = None,
+        innovations=False,
+        share_states: bool = False,
+    ):
+        self.share_states = share_states
+        if observed_state_names is None:
+            observed_state_names = ["data"]
+        self.innovations = innovations
+        k_exog = self._handle_input_data(k_exog, state_names, name)
+        k_states = k_exog
+        k_endog = len(observed_state_names)
+        k_posdef = k_exog
+        super().__init__(
+            name=name,
+            k_endog=k_endog,
+            k_states=k_states * k_endog if not share_states else k_states,
+            k_posdef=k_posdef * k_endog if not share_states else k_posdef,
+            state_names=self.state_names,
+            share_states=share_states,
+            observed_state_names=observed_state_names,
+            measurement_error=False,
+            combine_hidden_states=False,
+            exog_names=[f"data_{name}"],
+            obs_state_idxs=np.ones(k_states),
+        )
+    @staticmethod
+    def _get_state_names(k_exog: int | None, state_names: list[str] | None, name: str):
+        if k_exog is None and state_names is None:
+            raise ValueError("Must specify at least one of k_exog or state_names")
+        if state_names is not None and k_exog is not None:
+            if len(state_names) != k_exog:
+                raise ValueError(f"Expected {k_exog} state names, found {len(state_names)}")
+        elif k_exog is None:
+            k_exog = len(state_names)
+        else:
+            state_names = [f"{name}_{i + 1}" for i in range(k_exog)]
+        return k_exog, state_names
+    def _handle_input_data(self, k_exog: int, state_names: list[str] | None, name) -> int:
+        k_exog, state_names = self._get_state_names(k_exog, state_names, name)
+        self.state_names = state_names
+        return k_exog
+    def make_symbolic_graph(self) -> None:
+        k_endog = self.k_endog
+        k_endog_effective = 1 if self.share_states else k_endog
+        k_states = self.k_states // k_endog_effective
+        betas = self.make_and_register_variable(
+            f"beta_{self.name}", shape=(k_endog, k_states) if k_endog_effective > 1 else (k_states,)
+        )
+        regression_data = self.make_and_register_data(f"data_{self.name}", shape=(None, k_states))
+        self.ssm["initial_state", :] = betas.ravel()
+        self.ssm["transition", :, :] = pt.eye(self.k_states)
+        self.ssm["selection", :, :] = pt.eye(self.k_states)
+        if self.share_states:
+            self.ssm["design"] = pt.specify_shape(
+                pt.join(1, *[pt.expand_dims(regression_data, 1) for _ in range(k_endog)]),
+                (None, k_endog, self.k_states),
+            )
+        else:
+            Z = pt.linalg.block_diag(*[pt.expand_dims(regression_data, 1) for _ in range(k_endog)])
+            self.ssm["design"] = pt.specify_shape(
+                Z, (None, k_endog, regression_data.type.shape[1] * k_endog)
+            )
+        if self.innovations:
+            sigma_beta = self.make_and_register_variable(
+                f"sigma_beta_{self.name}",
+                (k_states,) if k_endog_effective == 1 else (k_endog, k_states),
+            )
+            row_idx, col_idx = np.diag_indices(self.k_states)
+            self.ssm["state_cov", row_idx, col_idx] = sigma_beta.ravel() ** 2
+    def populate_component_properties(self) -> None:
+        k_endog = self.k_endog
+        k_endog_effective = 1 if self.share_states else k_endog
+        k_states = self.k_states // k_endog_effective
+        if self.share_states:
+            self.shock_names = [f"{state_name}_shared" for state_name in self.state_names]
+        else:
+            self.shock_names = self.state_names
+        self.param_names = [f"beta_{self.name}"]
+        self.data_names = [f"data_{self.name}"]
+        self.param_dims = {
+            f"beta_{self.name}": (f"endog_{self.name}", f"state_{self.name}")
+            if k_endog_effective > 1
+            else (f"state_{self.name}",)
+        }
+        base_names = self.state_names
+        if self.share_states:
+            self.state_names = [f"{name}[{self.name}_shared]" for name in base_names]
+        else:
+            self.state_names = [
+                f"{name}[{obs_name}]"
+                for obs_name in self.observed_state_names
+                for name in base_names
+            ]
+        self.param_info = {
+            f"beta_{self.name}": {
+                "shape": (k_endog_effective, k_states) if k_endog_effective > 1 else (k_states,),
+                "constraints": None,
+                "dims": (f"endog_{self.name}", f"state_{self.name}")
+                if k_endog_effective > 1
+                else (f"state_{self.name}",),
+            },
+        }
+        self.data_info = {
+            f"data_{self.name}": {
+                "shape": (None, k_states),
+                "dims": (TIME_DIM, f"state_{self.name}"),
+            },
+        }
+        self.coords = {
+            f"state_{self.name}": base_names,
+            f"endog_{self.name}": self.observed_state_names,
+        }
+        if self.innovations:
+            self.param_names += [f"sigma_beta_{self.name}"]
+            self.param_dims[f"sigma_beta_{self.name}"] = (f"state_{self.name}",)
+            self.param_info[f"sigma_beta_{self.name}"] = {
+                "shape": (k_states,),
+                "constraints": "Positive",
+                "dims": (f"state_{self.name}",)
+                if k_endog_effective == 1
+                else (f"endog_{self.name}", f"state_{self.name}"),
+            }

pymc-extras 0.3.1__py3-none-any.whl → 0.4.1__py3-none-any.whl

pymc-extras 0.3.1__py3-none-any.whl → 0.4.1__py3-none-any.whl