PyPI - diff-diff - Versions diffs - 3.0.1__cp314-cp314-win_amd64.whl - Mend

diff-diff 3.0.1__cp314-cp314-win_amd64.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (62) hide show

diff_diff/__init__.py +382 -0
diff_diff/_backend.py +134 -0
diff_diff/_rust_backend.cp314-win_amd64.pyd +0 -0
diff_diff/bacon.py +1140 -0
diff_diff/bootstrap_utils.py +730 -0
diff_diff/continuous_did.py +1626 -0
diff_diff/continuous_did_bspline.py +190 -0
diff_diff/continuous_did_results.py +374 -0
diff_diff/datasets.py +815 -0
diff_diff/diagnostics.py +882 -0
diff_diff/efficient_did.py +1770 -0
diff_diff/efficient_did_bootstrap.py +359 -0
diff_diff/efficient_did_covariates.py +899 -0
diff_diff/efficient_did_results.py +368 -0
diff_diff/efficient_did_weights.py +617 -0
diff_diff/estimators.py +1501 -0
diff_diff/honest_did.py +2585 -0
diff_diff/imputation.py +2458 -0
diff_diff/imputation_bootstrap.py +418 -0
diff_diff/imputation_results.py +448 -0
diff_diff/linalg.py +2538 -0
diff_diff/power.py +2588 -0
diff_diff/practitioner.py +869 -0
diff_diff/prep.py +1738 -0
diff_diff/prep_dgp.py +1718 -0
diff_diff/pretrends.py +1105 -0
diff_diff/results.py +918 -0
diff_diff/stacked_did.py +1049 -0
diff_diff/stacked_did_results.py +339 -0
diff_diff/staggered.py +3895 -0
diff_diff/staggered_aggregation.py +864 -0
diff_diff/staggered_bootstrap.py +752 -0
diff_diff/staggered_results.py +416 -0
diff_diff/staggered_triple_diff.py +1545 -0
diff_diff/staggered_triple_diff_results.py +416 -0
diff_diff/sun_abraham.py +1685 -0
diff_diff/survey.py +1981 -0
diff_diff/synthetic_did.py +1136 -0
diff_diff/triple_diff.py +2047 -0
diff_diff/trop.py +952 -0
diff_diff/trop_global.py +1270 -0
diff_diff/trop_local.py +1307 -0
diff_diff/trop_results.py +356 -0
diff_diff/twfe.py +542 -0
diff_diff/two_stage.py +1952 -0
diff_diff/two_stage_bootstrap.py +520 -0
diff_diff/two_stage_results.py +400 -0
diff_diff/utils.py +1902 -0
diff_diff/visualization/__init__.py +61 -0
diff_diff/visualization/_common.py +328 -0
diff_diff/visualization/_continuous.py +274 -0
diff_diff/visualization/_diagnostic.py +817 -0
diff_diff/visualization/_event_study.py +1086 -0
diff_diff/visualization/_power.py +661 -0
diff_diff/visualization/_staggered.py +833 -0
diff_diff/visualization/_synthetic.py +197 -0
diff_diff/wooldridge.py +1285 -0
diff_diff/wooldridge_results.py +349 -0
diff_diff-3.0.1.dist-info/METADATA +2997 -0
diff_diff-3.0.1.dist-info/RECORD +62 -0
diff_diff-3.0.1.dist-info/WHEEL +4 -0
diff_diff-3.0.1.dist-info/sboms/diff_diff_rust.cyclonedx.json +5843 -0

diff_diff/trop_local.py ADDED Viewed

@@ -0,0 +1,1307 @@
+"""
+Local (observation-specific) estimation method for the TROP estimator.
+Contains the TROPLocalMixin class with all methods for the local
+estimation pathway, including preprocessing, distance computation,
+per-observation weight computation, model fitting, LOOCV scoring,
+and bootstrap variance estimation.
+This module is used via mixin inheritance — see trop.py for the
+main TROP class definition.
+"""
+import logging
+import warnings
+from typing import Optional, Tuple
+import numpy as np
+import pandas as pd
+logger = logging.getLogger(__name__)
+from diff_diff._backend import (
+    HAS_RUST_BACKEND,
+    _rust_bootstrap_trop_variance,
+    _rust_unit_distance_matrix,
+)
+from diff_diff.trop_results import _PrecomputedStructures
+def _validate_and_pivot_treatment(data, time, unit, treatment, all_periods, all_units):
+    """Build the (time x unit) treatment matrix and flag structurally absent cells.
+    Observed rows whose treatment value is missing are treated as a data
+    quality error and rejected before any reshaping happens. The remaining
+    rows are pivoted and reindexed onto ``all_periods`` x ``all_units``; a
+    cell left empty by that step (an unbalanced panel) is set to 0 and
+    reported through a ``UserWarning``.
+    Parameters
+    ----------
+    data : pandas.DataFrame
+        Long-format panel holding the ``time``, ``unit`` and ``treatment`` columns.
+    time, unit, treatment : str
+        Column names used as pivot index, pivot columns and pivot values.
+    all_periods, all_units : sequence
+        Row and column labels the pivoted matrix is reindexed to.
+    Returns
+    -------
+    D : ndarray
+        Treatment matrix (n_periods x n_units), int.
+    missing_mask : ndarray
+        Boolean mask of structurally absent cells (n_periods x n_units).
+    Raises
+    ------
+    ValueError
+        If any observed row has a missing treatment value.
+    """
+    observed_nan_count = int(data[treatment].isna().sum())
+    if observed_nan_count > 0:
+        raise ValueError(
+            f"{observed_nan_count} observation(s) have missing treatment values. "
+            "TROP requires non-missing treatment indicators for all observed "
+            "rows. Remove or impute missing values before fitting."
+        )
+    wide = data.pivot(index=time, columns=unit, values=treatment)
+    wide = wide.reindex(index=all_periods, columns=all_units)
+    # Every NaN left at this point comes from a (period, unit) pair with no row.
+    missing_mask = wide.isna().to_numpy()
+    structural_gaps = int(missing_mask.sum())
+    if structural_gaps > 0:
+        warnings.warn(
+            f"{structural_gaps} missing treatment indicator(s) in the "
+            "(time x unit) panel matrix filled with 0 (assumed "
+            "untreated). This typically occurs in unbalanced panels.",
+            UserWarning,
+            stacklevel=3,
+        )
+    # Gaps count as untreated; they remain identifiable through missing_mask.
+    D = wide.fillna(0).astype(int).to_numpy()
+    return D, missing_mask
+# Default cutoff for ``_soft_threshold_svd``: a singular value that is not
+# above this level once the threshold has been subtracted is dropped from
+# the reconstruction.
+_CONVERGENCE_TOL_SVD: float = 1e-10
+def _soft_threshold_svd(
+    M: np.ndarray,
+    threshold: float,
+    convergence_tol: float = _CONVERGENCE_TOL_SVD,
+) -> np.ndarray:
+    """
+    Shrink the singular values of ``M`` by ``threshold`` and rebuild the matrix.
+    This is the proximal operator of the nuclear norm. Non-finite entries
+    of the input are zeroed before the decomposition, and every failure
+    mode (SVD error, non-finite factors, nothing left after shrinking)
+    yields a zero matrix shaped like the input.
+    Parameters
+    ----------
+    M : np.ndarray
+        Input matrix.
+    threshold : float
+        Amount subtracted from each singular value. When it is not
+        positive, ``M`` itself is returned untouched.
+    convergence_tol : float, default=1e-10
+        Shrunk singular values that do not exceed this are discarded.
+    Returns
+    -------
+    np.ndarray
+        Matrix rebuilt from the surviving, shrunk singular values.
+    """
+    if threshold <= 0:
+        return M
+    # Sanitize the input so the decomposition never sees NaN/Inf.
+    if not np.isfinite(M).all():
+        M = np.nan_to_num(M, nan=0.0, posinf=0.0, neginf=0.0)
+    try:
+        left, sigma, right_t = np.linalg.svd(M, full_matrices=False)
+    except np.linalg.LinAlgError:
+        return np.zeros_like(M)
+    if not all(np.isfinite(factor).all() for factor in (left, sigma, right_t)):
+        return np.zeros_like(M)
+    shrunk = np.maximum(sigma - threshold, 0)
+    keep = shrunk > convergence_tol
+    if not keep.any():
+        return np.zeros_like(M)
+    # Rebuild from the surviving components only; floating-point warnings
+    # from ill-conditioned inputs are expected here and silenced.
+    with np.errstate(divide="ignore", over="ignore", invalid="ignore"):
+        rebuilt = (left[:, keep] * shrunk[keep]) @ right_t[keep, :]
+    if np.isfinite(rebuilt).all():
+        return rebuilt
+    return np.nan_to_num(rebuilt, nan=0.0, posinf=0.0, neginf=0.0)
+class TROPLocalMixin:
+    """Mixin providing local (observation-specific) estimation for TROP.
+    Methods in this mixin access the following attributes from the main
+    TROP class via ``self``:
+    - Solver params: ``max_iter``, ``tol``
+    - Inference params: ``n_bootstrap``, ``seed``
+    - State: ``_precomputed``
+    """
+    # Type hints for attributes accessed from the main TROP class
+    max_iter: int
+    tol: float
+    n_bootstrap: int
+    seed: Optional[int]
+    _precomputed: Optional[_PrecomputedStructures]
+    # Convergence tolerance for SVD singular value truncation
+    CONVERGENCE_TOL_SVD: float = 1e-10
+    # =========================================================================
+    # Preprocessing and distance computation
+    # =========================================================================
+    def _precompute_structures(
+        self,
+        Y: np.ndarray,
+        D: np.ndarray,
+        control_unit_idx: np.ndarray,
+        n_units: int,
+        n_periods: int,
+    ) -> _PrecomputedStructures:
+        """
+        Assemble the quantities shared by LOOCV scoring and final estimation.
+        Everything here depends only on the panel, not on the tuning
+        parameters, so it is built once and reused:
+        - the pairwise unit distance matrix,
+        - the |t - s| time distance matrix,
+        - control/treated masks and the matching observation index lists.
+        Parameters
+        ----------
+        Y : np.ndarray
+            Outcome matrix (n_periods x n_units).
+        D : np.ndarray
+            Treatment indicator matrix (n_periods x n_units).
+        control_unit_idx : np.ndarray
+            Indices of control units; stored in the result unchanged.
+        n_units : int
+            Number of units.
+        n_periods : int
+            Number of periods.
+        Returns
+        -------
+        _PrecomputedStructures
+            Mapping with the distance matrices, masks, index lists, and the
+            inputs ``D``, ``Y``, ``n_units`` and ``n_periods``.
+        """
+        # Unit distances (Equation 3, page 7): take the Rust routine when the
+        # backend exposes one, otherwise fall back to the numpy implementation.
+        rust_available = HAS_RUST_BACKEND and _rust_unit_distance_matrix is not None
+        if rust_available:
+            unit_dist_matrix = _rust_unit_distance_matrix(Y, D.astype(np.float64))
+        else:
+            unit_dist_matrix = self._compute_all_unit_distances(Y, D, n_units, n_periods)
+        # Entry [t, s] holds |t - s|.
+        period_idx = np.arange(n_periods)
+        time_dist_matrix = np.abs(period_idx[:, np.newaxis] - period_idx[np.newaxis, :])
+        control_mask = D == 0
+        treated_mask = D == 1
+        # (period, unit) index pairs of the treated cells.
+        treated_observations = list(zip(*np.where(treated_mask)))
+        # Control cells with an observed outcome, in period-major order; these
+        # are the cells LOOCV leaves out one at a time.
+        control_obs = [
+            (t, i)
+            for t, i in np.ndindex(n_periods, n_units)
+            if control_mask[t, i] and not np.isnan(Y[t, i])
+        ]
+        return {
+            "unit_dist_matrix": unit_dist_matrix,
+            "time_dist_matrix": time_dist_matrix,
+            "control_mask": control_mask,
+            "treated_mask": treated_mask,
+            "treated_observations": treated_observations,
+            "control_obs": control_obs,
+            "control_unit_idx": control_unit_idx,
+            "D": D,
+            "Y": Y,
+            "n_units": n_units,
+            "n_periods": n_periods,
+        }
+    def _compute_all_unit_distances(
+        self,
+        Y: np.ndarray,
+        D: np.ndarray,
+        n_units: int,
+        n_periods: int,
+    ) -> np.ndarray:
+        """
+        Build the base pairwise unit distance matrix in one vectorized pass.
+        Following Equation 3 (page 7):
+        dist_unit_{-t}(j, i) = sqrt(sum_u (Y_{iu} - Y_{ju})^2 / n_valid)
+        Only cells that are untreated (D == 0) and observed (non-NaN)
+        contribute, and a period counts for a pair only when both units
+        qualify in it. No target period is excluded here, so this is the
+        base matrix rather than the per-observation distance.
+        The computation broadcasts to an intermediate array of shape
+        (n_units, n_units, n_periods).
+        Parameters
+        ----------
+        Y : np.ndarray
+            Outcome matrix (n_periods x n_units).
+        D : np.ndarray
+            Treatment indicator matrix (n_periods x n_units).
+        n_units : int
+            Number of units (not read by this method).
+        n_periods : int
+            Number of periods (not read by this method).
+        Returns
+        -------
+        np.ndarray
+            Pairwise distance matrix (n_units x n_units); ``inf`` where a
+            pair shares no usable period, 0 on the diagonal.
+        """
+        # Blank out treated or missing cells so they drop out of every pair.
+        usable = ~np.isnan(Y) & (D == 0)
+        series = np.where(usable, Y, np.nan).T  # (n_units, n_periods)
+        # gap[a, b, u] = series[a, u] - series[b, u]; NaN when either is blank.
+        gap = series[:, np.newaxis, :] - series[np.newaxis, :, :]
+        gap_sq = gap**2
+        pair_counts = (~np.isnan(gap_sq)).sum(axis=2)  # (n_units, n_units)
+        totals = np.nansum(gap_sq, axis=2)  # NaN terms contribute 0
+        # 0/0 for pairs without overlap is expected and overwritten below.
+        with np.errstate(divide="ignore", invalid="ignore"):
+            rmse = np.sqrt(totals / pair_counts)
+        rmse = np.where(pair_counts > 0, rmse, np.inf)
+        # A unit is at distance 0 from itself, even with no usable periods.
+        np.fill_diagonal(rmse, 0.0)
+        return rmse
+    def _compute_unit_distance_for_obs(
+        self,
+        Y: np.ndarray,
+        D: np.ndarray,
+        j: int,
+        i: int,
+        target_period: int,
+    ) -> float:
+        """
+        Return the RMSE distance between units ``j`` and ``i`` for one target period.
+        This is the exact Equation 3 quantity: the target period is left
+        out, and a period is used only when both units are untreated and
+        both outcomes are observed in it.
+        Parameters
+        ----------
+        Y : np.ndarray
+            Outcome matrix (n_periods x n_units).
+        D : np.ndarray
+            Treatment indicator matrix.
+        j : int
+            Control unit index.
+        i : int
+            Treated unit index.
+        target_period : int
+            Target period to exclude.
+        Returns
+        -------
+        float
+            Pairwise RMSE distance, or ``inf`` when no period qualifies.
+        """
+        both_untreated = (D[:, i] == 0) & (D[:, j] == 0)
+        both_observed = ~np.isnan(Y[:, i]) & ~np.isnan(Y[:, j])
+        usable = both_untreated & both_observed
+        # The target period never informs its own distance.
+        usable[target_period] = False
+        if not np.any(usable):
+            return np.inf
+        gap = Y[usable, i] - Y[usable, j]
+        return np.sqrt(np.mean(gap**2))
+    # =========================================================================
+    # Observation-specific estimation
+    # =========================================================================
+    def _compute_observation_weights(
+        self,
+        Y: np.ndarray,
+        D: np.ndarray,
+        i: int,
+        t: int,
+        lambda_time: float,
+        lambda_unit: float,
+        control_unit_idx: np.ndarray,
+        n_units: int,
+        n_periods: int,
+    ) -> np.ndarray:
+        """
+        Build the weight matrix attached to the (pseudo-)treated observation (i, t).
+        Following the paper's Algorithm 2 (page 27) and Equation 2 (page 7):
+        - Time weights theta_s^{i,t} = exp(-lambda_time * |t - s|)
+        - Unit weights omega_j^{i,t} = exp(-lambda_unit * dist_unit_{-t}(j, i))
+        Unit weights are given to every unit with D[t, j] == 0, which
+        includes eventually-treated units that are still untreated at
+        ``t``, not only never-treated units. Distances are the exact
+        per-observation ones (target period excluded). Unit ``i`` itself
+        always receives weight 1.
+        When ``self._precomputed`` is set, its stored ``Y``, ``D`` and time
+        distance matrix are used and the ``Y``/``D`` arguments are ignored;
+        otherwise everything is derived from the arguments.
+        Parameters
+        ----------
+        Y : np.ndarray
+            Outcome matrix (n_periods x n_units).
+        D : np.ndarray
+            Treatment indicator matrix (n_periods x n_units).
+        i : int
+            Treated unit index.
+        t : int
+            Treatment period index.
+        lambda_time : float
+            Time weight decay parameter.
+        lambda_unit : float
+            Unit weight decay parameter. A value of 0 gives weight 1 to
+            every unit untreated at ``t`` without computing distances.
+        control_unit_idx : np.ndarray
+            Indices of never-treated units. Accepted for backward
+            compatibility; not read by this method.
+        n_units : int
+            Number of units.
+        n_periods : int
+            Number of periods.
+        Returns
+        -------
+        np.ndarray
+            Weight matrix (n_periods x n_units): outer product of the time
+            weights and the unit weights.
+        """
+        cache = self._precomputed
+        if cache is not None:
+            # Row t of the stored matrix is |t - s| for every period s.
+            time_gap = cache["time_dist_matrix"][t, :]
+            D_src = cache["D"]
+            Y_src = cache["Y"]
+        else:
+            # No cache available: derive everything from the arguments.
+            time_gap = np.abs(np.arange(n_periods) - t)
+            D_src = D
+            Y_src = Y
+        time_weights = np.exp(-lambda_time * time_gap)
+        untreated_at_t = D_src[t, :] == 0
+        unit_weights = np.zeros(n_units)
+        if lambda_unit == 0:
+            # No distance decay: every unit untreated at t counts fully.
+            unit_weights[untreated_at_t] = 1.0
+        else:
+            for j in range(n_units):
+                if not untreated_at_t[j] or j == i:
+                    continue
+                dist = self._compute_unit_distance_for_obs(Y_src, D_src, j, i, t)
+                # An infinite distance means no comparable periods: weight 0.
+                unit_weights[j] = 0.0 if np.isinf(dist) else np.exp(-lambda_unit * dist)
+        # The target unit's own column always enters with weight 1.
+        unit_weights[i] = 1.0
+        return np.outer(time_weights, unit_weights)
+    def _soft_threshold_svd(
+        self,
+        M: np.ndarray,
+        threshold: float,
+    ) -> np.ndarray:
+        """Soft-threshold the singular values of ``M`` via the module-level helper.
+        The class attribute ``CONVERGENCE_TOL_SVD`` is passed as the
+        truncation tolerance.
+        """
+        return _soft_threshold_svd(
+            M,
+            threshold,
+            convergence_tol=self.CONVERGENCE_TOL_SVD,
+        )
+    def _weighted_nuclear_norm_solve(
+        self,
+        Y: np.ndarray,
+        W: np.ndarray,
+        L_init: np.ndarray,
+        alpha: np.ndarray,
+        beta: np.ndarray,
+        lambda_nn: float,
+        max_inner_iter: int = 20,
+    ) -> np.ndarray:
+        """
+        Update the low-rank component L while alpha and beta are held fixed.
+        Targets the weighted nuclear norm problem of the paper's
+        Equation 2 (page 7):
+            min_L sum W_{ti}(R_{ti} - L_{ti})^2 + lambda_nn||L||_*
+        with R = Y - alpha - beta, using proximal gradient steps with
+        FISTA/Nesterov momentum. Weights are rescaled by max(W); each
+        iteration moves from the momentum point L_m to
+            G = L_m + (W/max(W)) * (R - L_m)
+        and then soft-thresholds the singular values of G by
+        lambda_nn / (2*max(W)).
+        Cells with W == 0 get a zero step, so the data never pull L
+        towards R there; this keeps L from absorbing the treatment effect.
+        When ``lambda_nn <= 0`` no iteration runs: the result is R on
+        cells with positive weight and ``L_init`` elsewhere.
+        Parameters
+        ----------
+        Y : np.ndarray
+            Outcome matrix (n_periods x n_units).
+        W : np.ndarray
+            Weight matrix (n_periods x n_units), non-negative. W=0 marks
+            cells that must not inform the fit.
+        L_init : np.ndarray
+            Initial estimate of L matrix.
+        alpha : np.ndarray
+            Current unit fixed effects estimate.
+        beta : np.ndarray
+            Current time fixed effects estimate.
+        lambda_nn : float
+            Nuclear norm regularization parameter.
+        max_inner_iter : int, default=20
+            Maximum number of proximal iterations.
+        Returns
+        -------
+        np.ndarray
+            Updated L matrix estimate.
+        """
+        # Residual after removing the fixed effects; non-finite entries become 0.
+        resid = np.nan_to_num(
+            Y - alpha[np.newaxis, :] - beta[:, np.newaxis],
+            nan=0.0,
+            posinf=0.0,
+            neginf=0.0,
+        )
+        # Where a cell carries no weight, fall back to the incoming L value.
+        target = np.where(W > 0, resid, L_init)
+        if lambda_nn <= 0:
+            # No penalty: the masked residual is returned as-is.
+            return target
+        W_max = np.max(W)
+        has_weight = W_max > 0
+        # Rescale so the largest weight is 1 (step size stability).
+        W_norm = W / W_max if has_weight else W
+        # Step size is 1/(2*max(W)), so the proximal threshold is
+        # lambda_nn/(2*max(W)); it does not change across iterations.
+        shrink = lambda_nn / (2.0 * W_max) if has_weight else lambda_nn / 2.0
+        current = L_init.copy()
+        previous = current.copy()
+        t_fista = 1.0
+        for _ in range(max_inner_iter):
+            t_next = (1.0 + np.sqrt(1.0 + 4.0 * t_fista**2)) / 2.0
+            momentum = (t_fista - 1.0) / t_next
+            lookahead = current + momentum * (current - previous)
+            # Gradient step from the momentum point; zero-weight cells stay put.
+            candidate = lookahead + W_norm * (target - lookahead)
+            # The iterates are only ever rebound, never modified in place,
+            # so keeping a reference to the outgoing one is enough.
+            previous = current
+            current = self._soft_threshold_svd(candidate, shrink)
+            t_fista = t_next
+            if np.max(np.abs(current - previous)) < self.tol:
+                break
+        return current
+    def _estimate_model(
+        self,
+        Y: np.ndarray,
+        control_mask: np.ndarray,
+        weight_matrix: np.ndarray,
+        lambda_nn: float,
+        n_units: int,
+        n_periods: int,
+        exclude_obs: Optional[Tuple[int, int]] = None,
+    ) -> Tuple[np.ndarray, np.ndarray, np.ndarray]:
+        """
+        Fit Y = alpha + beta + L + eps on the weighted control cells.
+        Alternating minimization (Algorithm 1, page 9) of
+            sum W_{ti}(Y_{ti} - alpha_i - beta_t - L_{ti})^2 + lambda_nn||L||_*
+        Each pass (1) updates alpha, then beta, as weighted means with L
+        held fixed, and (2) updates L through the weighted nuclear norm
+        solver with alpha and beta held fixed. The loop stops once the
+        largest absolute change in alpha, beta and L drops below
+        ``self.tol``, or after ``self.max_iter`` passes.
+        Parameters
+        ----------
+        Y : np.ndarray
+            Outcome matrix (n_periods x n_units).
+        control_mask : np.ndarray
+            Boolean mask for control observations. Not modified.
+        weight_matrix : np.ndarray
+            Observation weights (n_periods x n_units).
+        lambda_nn : float
+            Nuclear norm regularization parameter.
+        n_units : int
+            Number of units.
+        n_periods : int
+            Number of periods.
+        exclude_obs : tuple, optional
+            (t, i) observation to exclude (for LOOCV).
+        Returns
+        -------
+        tuple
+            (alpha, beta, L) estimated parameters.
+        """
+        # Cells allowed to inform the fit: controls, minus the held-out cell.
+        fit_mask = control_mask.copy()
+        if exclude_obs is not None:
+            held_t, held_i = exclude_obs
+            fit_mask[held_t, held_i] = False
+        observed = ~np.isnan(Y) & fit_mask
+        # Weights are zeroed wherever a cell must not contribute.
+        W_fit = weight_matrix * observed
+        unit_mass = np.sum(W_fit, axis=0)  # (n_units,)
+        time_mass = np.sum(W_fit, axis=1)  # (n_periods,)
+        unit_seen = unit_mass > 0
+        time_seen = time_mass > 0
+        # Denominator 1 for units/periods without weight; their effect is
+        # forced to 0 by the np.where calls in the loop.
+        unit_div = np.where(unit_seen, unit_mass, 1.0)
+        time_div = np.where(time_seen, time_mass, 1.0)
+        # NaN outcomes carry zero weight; give them a finite placeholder.
+        Y_filled = np.where(np.isnan(Y), 0.0, Y)
+        alpha = np.zeros(n_units)
+        beta = np.zeros(n_periods)
+        L = np.zeros((n_periods, n_units))
+        for _ in range(self.max_iter):
+            # alpha and beta are rebound below, so references suffice for
+            # them; L passes through the solver and is copied.
+            alpha_before = alpha
+            beta_before = beta
+            L_before = L.copy()
+            resid = Y_filled - L
+            # alpha_i = sum_t W_{ti}(R_{ti} - beta_t) / sum_t W_{ti}
+            alpha_num = np.sum(W_fit * (resid - beta[:, np.newaxis]), axis=0)
+            alpha = np.where(unit_seen, alpha_num / unit_div, 0.0)
+            # beta_t = sum_i W_{ti}(R_{ti} - alpha_i) / sum_i W_{ti}
+            beta_num = np.sum(W_fit * (resid - alpha[np.newaxis, :]), axis=1)
+            beta = np.where(time_seen, beta_num / time_div, 0.0)
+            # L update under the weighted nuclear norm penalty.
+            L = self._weighted_nuclear_norm_solve(
+                Y_filled, W_fit, L, alpha, beta, lambda_nn, max_inner_iter=10
+            )
+            alpha_shift = np.max(np.abs(alpha - alpha_before))
+            beta_shift = np.max(np.abs(beta - beta_before))
+            L_shift = np.max(np.abs(L - L_before))
+            if max(alpha_shift, beta_shift, L_shift) < self.tol:
+                break
+        return alpha, beta, L
+    def _loocv_score_obs_specific(
+        self,
+        Y: np.ndarray,
+        D: np.ndarray,
+        control_mask: np.ndarray,
+        control_unit_idx: np.ndarray,
+        lambda_time: float,
+        lambda_unit: float,
+        lambda_nn: float,
+        n_units: int,
+        n_periods: int,
+    ) -> float:
+        """
+        Compute leave-one-out cross-validation score with observation-specific weights.
+        Following the paper's Equation 5 (page 8):
+        Q(lambda) = sum_{j,s: D_js=0} [tau_js^loocv(lambda)]^2
+        For each control observation (j, s), treat it as pseudo-treated,
+        compute observation-specific weights, fit model excluding (j, s),
+        and sum squared pseudo-treatment effects.
+        Uses pre-computed structures when available for efficiency.
+        Parameters
+        ----------
+        Y : np.ndarray
+            Outcome matrix (n_periods x n_units).
+        D : np.ndarray
+            Treatment indicator matrix (n_periods x n_units).
+        control_mask : np.ndarray
+            Boolean mask for control observations.
+        control_unit_idx : np.ndarray
+            Indices of control units.
+        lambda_time : float
+            Time weight decay parameter.
+        lambda_unit : float
+            Unit weight decay parameter.
+        lambda_nn : float
+            Nuclear norm regularization parameter.
+        n_units : int
+            Number of units.
+        n_periods : int
+            Number of periods.
+        Returns
+        -------
+        float
+            LOOCV score (lower is better).
+        """
+        # Use pre-computed control observations if available
+        if self._precomputed is not None:
+            control_obs = self._precomputed["control_obs"]
+        else:
+            # Get all control observations
+            control_obs = [
+                (t, i)
+                for t in range(n_periods)
+                for i in range(n_units)
+                if control_mask[t, i] and not np.isnan(Y[t, i])
+            ]
+        # Empty control set check: if no control observations, return infinity
+        # A score of 0.0 would incorrectly "win" over legitimate parameters
+        if len(control_obs) == 0:
+            warnings.warn(
+                f"LOOCV: No valid control observations for "
+                f"\u03bb=({lambda_time}, {lambda_unit}, {lambda_nn}). "
+                "Returning infinite score.",
+                UserWarning,
+            )
+            return np.inf
+        tau_squared_sum = 0.0
+        n_valid = 0
+        for t, i in control_obs:
+            try:
+                # Compute observation-specific weights for pseudo-treated (i, t)
+                # Uses pre-computed distance matrices when available
+                weight_matrix = self._compute_observation_weights(
+                    Y, D, i, t, lambda_time, lambda_unit, control_unit_idx, n_units, n_periods
+                )
+                # Estimate model excluding observation (t, i)
+                alpha, beta, L = self._estimate_model(
+                    Y,
+                    control_mask,
+                    weight_matrix,
+                    lambda_nn,
+                    n_units,
+                    n_periods,
+                    exclude_obs=(t, i),
+                )
+                # Pseudo treatment effect
+                tau_ti = Y[t, i] - alpha[i] - beta[t] - L[t, i]
+                tau_squared_sum += tau_ti**2
+                n_valid += 1
+            except (np.linalg.LinAlgError, ValueError):
+                # Per Equation 5: Q(lambda) must sum over ALL D==0 cells
+                # Any failure means this lambda cannot produce valid estimates for all cells
+                warnings.warn(
+                    f"LOOCV: Fit failed for observation ({t}, {i}) with "
+                    f"\u03bb=({lambda_time}, {lambda_unit}, {lambda_nn}). "
+                    "Returning infinite score per Equation 5.",
+                    UserWarning,
+                )
+                return np.inf
+        # Return SUM of squared pseudo-treatment effects per Equation 5 (page 8):
+        # Q(lambda) = sum_{j,s: D_js=0} [tau_js^loocv(lambda)]^2
+        return tau_squared_sum
+    def _bootstrap_variance(
+        self,
+        data: pd.DataFrame,
+        outcome: str,
+        treatment: str,
+        unit: str,
+        time: str,
+        optimal_lambda: Tuple[float, float, float],
+        Y: Optional[np.ndarray] = None,
+        D: Optional[np.ndarray] = None,
+        control_unit_idx: Optional[np.ndarray] = None,
+        survey_design=None,
+        unit_weight_arr: Optional[np.ndarray] = None,
+        resolved_survey=None,
+    ) -> Tuple[float, np.ndarray]:
+        """
+        Compute bootstrap standard error using unit-level block bootstrap.
+        When the optional Rust backend is available and the matrix parameters
+        (Y, D, control_unit_idx) are provided, uses parallelized Rust
+        implementation for 5-15x speedup. Falls back to Python implementation
+        if Rust is unavailable or if matrix parameters are not provided.
+        When a full survey design (strata/PSU/FPC) is present, uses Rao-Wu
+        rescaled bootstrap instead, which skips the Rust path.
+        Parameters
+        ----------
+        data : pd.DataFrame
+            Original data in long format with unit, time, outcome, and treatment.
+        outcome : str
+            Name of the outcome column in data.
+        treatment : str
+            Name of the treatment indicator column in data.
+        unit : str
+            Name of the unit identifier column in data.
+        time : str
+            Name of the time period column in data.
+        optimal_lambda : tuple of float
+            Optimal tuning parameters (lambda_time, lambda_unit, lambda_nn)
+            from cross-validation. Used for model estimation in each bootstrap.
+        Y : np.ndarray, optional
+            Outcome matrix of shape (n_periods, n_units). Required for Rust
+            backend acceleration. If None, falls back to Python implementation.
+        D : np.ndarray, optional
+            Treatment indicator matrix of shape (n_periods, n_units) where
+            D[t,i]=1 indicates unit i is treated at time t. Required for Rust
+            backend acceleration.
+        control_unit_idx : np.ndarray, optional
+            Array of indices for control units (never-treated). Required for
+            Rust backend acceleration.
+        survey_design : SurveyDesign, optional
+            Survey design specification.
+        unit_weight_arr : np.ndarray, optional
+            Unit-level survey weights.
+        resolved_survey : ResolvedSurveyDesign, optional
+            Resolved survey design (observation-level).
+        Returns
+        -------
+        se : float
+            Bootstrap standard error of the ATT estimate.
+        bootstrap_estimates : np.ndarray
+            Array of ATT estimates from each bootstrap iteration. Length may
+            be less than n_bootstrap if some iterations failed.
+        Notes
+        -----
+        Uses unit-level block bootstrap where entire unit time series are
+        resampled with replacement. This preserves within-unit correlation
+        structure and is appropriate for panel data.
+        """
+        lambda_time, lambda_unit, lambda_nn = optimal_lambda
+        # Check for full survey design (strata/PSU/FPC present)
+        _has_full_design = resolved_survey is not None and (
+            resolved_survey.strata is not None
+            or resolved_survey.psu is not None
+            or resolved_survey.fpc is not None
+        )
+        # Full survey design: use Python Rao-Wu rescaled bootstrap
+        if _has_full_design:
+            return self._bootstrap_rao_wu_local(
+                data,
+                outcome,
+                treatment,
+                unit,
+                time,
+                optimal_lambda,
+                resolved_survey,
+                survey_design,
+            )
+        # Try Rust backend for parallel bootstrap (5-15x speedup)
+        # Only used for pweight-only designs (no strata/PSU/FPC)
+        if (
+            HAS_RUST_BACKEND
+            and _rust_bootstrap_trop_variance is not None
+            and self._precomputed is not None
+            and Y is not None
+            and D is not None
+        ):
+            try:
+                control_mask = self._precomputed["control_mask"]
+                time_dist_matrix = self._precomputed["time_dist_matrix"].astype(np.int64)
+                bootstrap_estimates, se = _rust_bootstrap_trop_variance(
+                    Y,
+                    D.astype(np.float64),
+                    control_mask.astype(np.uint8),
+                    time_dist_matrix,
+                    lambda_time,
+                    lambda_unit,
+                    lambda_nn,
+                    self.n_bootstrap,
+                    self.max_iter,
+                    self.tol,
+                    self.seed if self.seed is not None else 0,
+                    unit_weight_arr,
+                )
+                if len(bootstrap_estimates) >= 10:
+                    return float(se), bootstrap_estimates
+                # Fall through to Python if too few bootstrap samples
+                logger.debug(
+                    "Rust bootstrap returned only %d samples, falling back to Python",
+                    len(bootstrap_estimates),
+                )
+            except Exception as e:
+                logger.debug("Rust bootstrap variance failed, falling back to Python: %s", e)
+                warnings.warn(
+                    f"Rust backend failed for bootstrap variance; "
+                    f"falling back to Python. Performance may be reduced. "
+                    f"Error: {e}",
+                    UserWarning,
+                    stacklevel=2,
+                )
+        # Python implementation (fallback)
+        rng = np.random.default_rng(self.seed)
+        # Issue D fix: Stratified bootstrap sampling
+        # Paper's Algorithm 3 (page 27) specifies sampling N_0 control rows
+        # and N_1 treated rows separately to preserve treatment ratio
+        unit_ever_treated = data.groupby(unit)[treatment].max()
+        treated_units = np.array(unit_ever_treated[unit_ever_treated == 1].index)
+        control_units = np.array(unit_ever_treated[unit_ever_treated == 0].index)
+        n_treated_units = len(treated_units)
+        n_control_units = len(control_units)
+        bootstrap_estimates_list = []
+        for _ in range(self.n_bootstrap):
+            # Stratified sampling: sample control and treated units separately
+            # This preserves the treatment ratio in each bootstrap sample
+            if n_control_units > 0:
+                sampled_control = rng.choice(control_units, size=n_control_units, replace=True)
+            else:
+                sampled_control = np.array([], dtype=control_units.dtype)
+            if n_treated_units > 0:
+                sampled_treated = rng.choice(treated_units, size=n_treated_units, replace=True)
+            else:
+                sampled_treated = np.array([], dtype=treated_units.dtype)
+            # Combine stratified samples
+            sampled_units = np.concatenate([sampled_control, sampled_treated])
+            # Create bootstrap sample with unique unit IDs
+            boot_data = pd.concat(
+                [
+                    data[data[unit] == u].assign(**{unit: f"{u}_{idx}"})
+                    for idx, u in enumerate(sampled_units)
+                ],
+                ignore_index=True,
+            )
+            try:
+                # Fit with fixed lambda (skip LOOCV for speed)
+                att = self._fit_with_fixed_lambda(
+                    boot_data,
+                    outcome,
+                    treatment,
+                    unit,
+                    time,
+                    optimal_lambda,
+                    survey_design=survey_design,
+                )
+                if np.isfinite(att):
+                    bootstrap_estimates_list.append(att)
+            except (ValueError, np.linalg.LinAlgError, KeyError):
+                continue
+        bootstrap_estimates = np.array(bootstrap_estimates_list)
+        if len(bootstrap_estimates) < 10:
+            warnings.warn(
+                f"Only {len(bootstrap_estimates)} bootstrap iterations succeeded. "
+                "Standard errors may be unreliable.",
+                UserWarning,
+            )
+            if len(bootstrap_estimates) == 0:
+                return np.nan, np.array([])
+        se = np.std(bootstrap_estimates, ddof=1)
+        return float(se), bootstrap_estimates
+    def _bootstrap_rao_wu_local(
+        self,
+        data: pd.DataFrame,
+        outcome: str,
+        treatment: str,
+        unit: str,
+        time: str,
+        optimal_lambda: Tuple[float, float, float],
+        resolved_survey,
+        survey_design,
+    ) -> Tuple[float, np.ndarray]:
+        """
+        Rao-Wu rescaled bootstrap for local method with full survey design.
+        Instead of physically resampling units, each iteration generates
+        rescaled observation weights via Rao-Wu (1988) weight perturbation.
+        Cross-classifies survey strata with treatment group to preserve
+        the stratified resampling structure.
+        Parameters
+        ----------
+        data : pd.DataFrame
+            Original data.
+        outcome, treatment, unit, time : str
+            Column names.
+        optimal_lambda : tuple
+            Optimal tuning parameters (lambda_time, lambda_unit, lambda_nn).
+        resolved_survey : ResolvedSurveyDesign
+            Resolved survey design (observation-level).
+        survey_design : SurveyDesign
+            Original survey design specification.
+        Returns
+        -------
+        Tuple[float, np.ndarray]
+            (se, bootstrap_estimates).
+        """
+        import warnings
+        from diff_diff.bootstrap_utils import generate_rao_wu_weights
+        from diff_diff.linalg import _factorize_cluster_ids
+        from diff_diff.survey import ResolvedSurveyDesign
+        rng = np.random.default_rng(self.seed)
+        # Build unit-level resolved survey with cross-classified strata
+        all_units = sorted(data[unit].unique())
+        n_units = len(all_units)
+        # Determine treatment status per unit
+        unit_ever_treated = data.groupby(unit)[treatment].max()
+        treatment_group = np.array([int(unit_ever_treated[u]) for u in all_units], dtype=np.int64)
+        # Extract unit-level survey design fields
+        first_rows = data.groupby(unit).first().loc[all_units]
+        # Weights (unit-level)
+        if survey_design.weights is not None:
+            unit_weights = first_rows[survey_design.weights].values.astype(np.float64)
+        else:
+            unit_weights = np.ones(n_units, dtype=np.float64)
+        # Strata: cross-classify survey strata x treatment group
+        if survey_design.strata is not None:
+            survey_strata = first_rows[survey_design.strata].values
+            cross_labels = np.array([f"{s}_{g}" for s, g in zip(survey_strata, treatment_group)])
+            cross_strata = _factorize_cluster_ids(cross_labels)
+        else:
+            # No survey strata: use treatment group as strata
+            cross_strata = treatment_group.copy()
+        n_strata = len(np.unique(cross_strata))
+        # PSU (unit-level)
+        psu_arr = None
+        n_psu = 0
+        if survey_design.psu is not None:
+            psu_raw = first_rows[survey_design.psu].values
+            if survey_design.nest and survey_design.strata is not None:
+                combined = np.array([f"{s}_{p}" for s, p in zip(cross_strata, psu_raw)])
+                psu_arr = _factorize_cluster_ids(combined)
+            else:
+                psu_arr = _factorize_cluster_ids(psu_raw)
+            n_psu = len(np.unique(psu_arr))
+        else:
+            # Implicit PSU: each unit is its own PSU
+            psu_arr = np.arange(n_units, dtype=np.int64)
+            n_psu = n_units
+        # FPC (unit-level)
+        fpc_arr = None
+        if survey_design.fpc is not None:
+            fpc_arr = first_rows[survey_design.fpc].values.astype(np.float64)
+        unit_resolved = ResolvedSurveyDesign(
+            weights=unit_weights,
+            weight_type=resolved_survey.weight_type,
+            strata=cross_strata,
+            psu=psu_arr,
+            fpc=fpc_arr,
+            n_strata=n_strata,
+            n_psu=n_psu,
+            lonely_psu=resolved_survey.lonely_psu,
+        )
+        # Check for unidentified variance (single unstratified PSU)
+        if (
+            survey_design.psu is not None
+            and unit_resolved.n_psu < 2
+            and survey_design.strata is None
+        ):
+            return np.nan, np.array([])
+        # Bootstrap loop: refit the full model per draw with Rao-Wu rescaled
+        # weights, mirroring the physical-resampling bootstrap but using weight
+        # perturbation instead of unit resampling.
+        bootstrap_estimates_list = []
+        for _ in range(self.n_bootstrap):
+            try:
+                # Generate Rao-Wu rescaled unit weights
+                boot_weights = generate_rao_wu_weights(unit_resolved, rng)
+                # Skip if all weights are zero
+                if boot_weights.sum() == 0:
+                    continue
+                # Refit the full local model with rescaled weights
+                att = self._fit_with_fixed_lambda(
+                    data,
+                    outcome,
+                    treatment,
+                    unit,
+                    time,
+                    optimal_lambda,
+                    survey_design=survey_design,
+                    unit_weight_arr=boot_weights,
+                )
+                if np.isfinite(att):
+                    bootstrap_estimates_list.append(att)
+            except (ValueError, np.linalg.LinAlgError, KeyError):
+                continue
+        bootstrap_estimates = np.array(bootstrap_estimates_list)
+        if len(bootstrap_estimates) < 10:
+            warnings.warn(
+                f"Only {len(bootstrap_estimates)} bootstrap iterations succeeded. "
+                "Standard errors may be unreliable.",
+                UserWarning,
+            )
+            if len(bootstrap_estimates) == 0:
+                return np.nan, np.array([])
+        se = np.std(bootstrap_estimates, ddof=1)
+        return float(se), bootstrap_estimates
+    def _fit_with_fixed_lambda(
+        self,
+        data: pd.DataFrame,
+        outcome: str,
+        treatment: str,
+        unit: str,
+        time: str,
+        fixed_lambda: Tuple[float, float, float],
+        survey_design=None,
+        unit_weight_arr: Optional[np.ndarray] = None,
+    ) -> float:
+        """
+        Fit model with fixed tuning parameters (for bootstrap).
+        Uses observation-specific weights following Algorithm 2.
+        Returns only the ATT estimate.
+        Parameters
+        ----------
+        unit_weight_arr : np.ndarray, optional
+            Pre-computed unit-level weights (e.g. Rao-Wu rescaled weights).
+            When provided, overrides weights extracted from survey_design.
+        """
+        lambda_time, lambda_unit, lambda_nn = fixed_lambda
+        # Use pre-computed weights if provided (e.g. Rao-Wu bootstrap),
+        # otherwise extract from survey_design.
+        if unit_weight_arr is not None:
+            local_weight_arr = unit_weight_arr
+        elif survey_design is not None and survey_design.weights is not None:
+            from diff_diff.survey import _extract_unit_survey_weights
+            local_all_units = sorted(data[unit].unique())
+            local_weight_arr = _extract_unit_survey_weights(
+                data, unit, survey_design, local_all_units
+            )
+        else:
+            local_weight_arr = None
+        # Setup matrices
+        all_units = sorted(data[unit].unique())
+        all_periods = sorted(data[time].unique())
+        n_units = len(all_units)
+        n_periods = len(all_periods)
+        # Vectorized: use pivot for O(1) reshaping instead of O(n) iterrows loop
+        Y = (
+            data.pivot(index=time, columns=unit, values=outcome)
+            .reindex(index=all_periods, columns=all_units)
+            .values
+        )
+        D = (
+            data.pivot(index=time, columns=unit, values=treatment)
+            .reindex(index=all_periods, columns=all_units)
+            .fillna(0)
+            .astype(int)
+            .values
+        )
+        control_mask = D == 0
+        # Get control unit indices
+        unit_ever_treated = np.any(D == 1, axis=0)
+        control_unit_idx = np.where(~unit_ever_treated)[0]
+        # Get list of treated observations
+        treated_observations = [
+            (t, i) for t in range(n_periods) for i in range(n_units) if D[t, i] == 1
+        ]
+        if not treated_observations:
+            raise ValueError("No treated observations")
+        # Compute ATT using observation-specific weights (Algorithm 2)
+        tau_values = []
+        tau_weights = []
+        for t, i in treated_observations:
+            # Skip non-finite outcomes (match main fit NaN contract)
+            if not np.isfinite(Y[t, i]):
+                continue
+            # Compute observation-specific weights for this (i, t)
+            weight_matrix = self._compute_observation_weights(
+                Y, D, i, t, lambda_time, lambda_unit, control_unit_idx, n_units, n_periods
+            )
+            # Fit model with these weights
+            alpha, beta, L = self._estimate_model(
+                Y, control_mask, weight_matrix, lambda_nn, n_units, n_periods
+            )
+            # Compute treatment effect: tau_{it} = Y_{it} - alpha_i - beta_t - L_{it}
+            tau = Y[t, i] - alpha[i] - beta[t] - L[t, i]
+            tau_values.append(tau)
+            if local_weight_arr is not None:
+                tau_weights.append(local_weight_arr[i])
+        if not tau_values:
+            return float("nan")
+        if local_weight_arr is not None:
+            return float(np.average(tau_values, weights=tau_weights))
+        return float(np.mean(tau_values))