PyPI - diff-diff - Versions diffs - 2.9.1__tar.gz → 3.0.0__tar.gz - Mend

diff-diff 2.9.1 (tar.gz) → 3.0.0 (tar.gz)

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (68) hide show

{diff_diff-2.9.1 → diff_diff-3.0.0}/PKG-INFO RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.4
 Name: diff-diff
-Version: 2.9.1
+Version: 3.0.0
 Classifier: Development Status :: 5 - Production/Stable
 Classifier: Intended Audience :: Science/Research
 Classifier: Operating System :: OS Independent

{diff_diff-2.9.1 → diff_diff-3.0.0}/diff_diff/__init__.py RENAMED Viewed

@@ -214,7 +214,7 @@ Bacon = BaconDecomposition
 EDiD = EfficientDiD
 ETWFE = WooldridgeDiD
-__version__ = "2.9.1"
+__version__ = "3.0.0"
 __all__ = [
     # Estimators
     "DifferenceInDifferences",

{diff_diff-2.9.1 → diff_diff-3.0.0}/diff_diff/linalg.py RENAMED Viewed

@@ -2372,6 +2372,7 @@ def solve_poisson(
     tol: float = 1e-8,
     init_beta: Optional[np.ndarray] = None,
     rank_deficient_action: str = "warn",
+    weights: Optional[np.ndarray] = None,
 ) -> Tuple[np.ndarray, np.ndarray]:
     """Poisson IRLS (Newton-Raphson with log link).
@@ -2389,6 +2390,9 @@ def solve_poisson(
         log(mean(y)) to improve convergence for large-scale outcomes.
     rank_deficient_action : {"warn", "error", "silent"}
         How to handle rank-deficient design matrices. Mirrors solve_ols/solve_logit.
+    weights : (n,) optional observation weights (e.g. survey sampling weights).
+        When provided, the weighted pseudo-log-likelihood is maximised:
+        score = X'(w*(y - mu)), Hessian = X'diag(w*mu)X.
     Returns
     -------
@@ -2397,6 +2401,20 @@ def solve_poisson(
     """
     n, k_orig = X.shape
+    # Validate weights (mirrors solve_logit validation)
+    if weights is not None:
+        weights = np.asarray(weights, dtype=np.float64)
+        if weights.shape != (n,):
+            raise ValueError(f"weights must have shape ({n},), got {weights.shape}")
+        if np.any(np.isnan(weights)):
+            raise ValueError("weights contain NaN values")
+        if np.any(~np.isfinite(weights)):
+            raise ValueError("weights contain Inf values")
+        if np.any(weights < 0):
+            raise ValueError("weights must be non-negative")
+        if np.sum(weights) <= 0:
+            raise ValueError("weights sum to zero — no observations have positive weight")
     # Validate rank_deficient_action (same as solve_logit/solve_ols)
     valid_actions = ("warn", "error", "silent")
     if rank_deficient_action not in valid_actions:
@@ -2425,6 +2443,46 @@ def solve_poisson(
         X = X[:, kept_cols]
     n, k = X.shape
+    # Validate effective weighted sample when weights have zeros
+    # (mirrors solve_logit's positive-weight safeguards)
+    if weights is not None and np.any(weights == 0):
+        pos_mask = weights > 0
+        n_pos = int(np.sum(pos_mask))
+        X_eff = X[pos_mask]
+        eff_rank_info = _detect_rank_deficiency(X_eff)
+        if len(eff_rank_info[1]) > 0:
+            n_dropped_eff = len(eff_rank_info[1])
+            if rank_deficient_action == "error":
+                raise ValueError(
+                    f"Effective (positive-weight) sample is rank-deficient: "
+                    f"{n_dropped_eff} linearly dependent column(s). "
+                    f"Cannot identify Poisson model on this subpopulation."
+                )
+            elif rank_deficient_action == "warn":
+                warnings.warn(
+                    f"Effective (positive-weight) sample is rank-deficient: "
+                    f"dropping {n_dropped_eff} column(s). Poisson estimates "
+                    f"may be unreliable on this subpopulation.",
+                    UserWarning,
+                    stacklevel=2,
+                )
+            eff_dropped = set(int(d) for d in eff_rank_info[1])
+            eff_kept = np.array([i for i in range(k) if i not in eff_dropped])
+            X = X[:, eff_kept]
+            if len(dropped_cols) > 0:
+                kept_cols = kept_cols[eff_kept]
+            else:
+                kept_cols = eff_kept
+                dropped_cols = list(eff_dropped)
+            n, k = X.shape
+        if n_pos <= k:
+            raise ValueError(
+                f"Only {n_pos} positive-weight observation(s) for "
+                f"{k} parameters (after rank reduction). "
+                f"Cannot identify Poisson model."
+            )
     if init_beta is not None:
         beta = init_beta[kept_cols].copy() if len(dropped_cols) > 0 else init_beta.copy()
     else:
@@ -2438,8 +2496,12 @@ def solve_poisson(
     for _ in range(max_iter):
         eta = np.clip(X @ beta, -500, 500)
         mu = np.exp(eta)
-        score = X.T @ (y - mu)  # gradient of log-likelihood
-        hess = X.T @ (mu[:, None] * X)  # -Hessian = X'WX, W=diag(mu)
+        if weights is not None:
+            score = X.T @ (weights * (y - mu))
+            hess = X.T @ ((weights * mu)[:, None] * X)
+        else:
+            score = X.T @ (y - mu)
+            hess = X.T @ (mu[:, None] * X)
         try:
             delta = np.linalg.solve(hess + 1e-12 * np.eye(k), score)
         except np.linalg.LinAlgError:

{diff_diff-2.9.1 → diff_diff-3.0.0}/diff_diff/staggered.py RENAMED Viewed

@@ -153,9 +153,6 @@ class CallawaySantAnna(
         - "rademacher": +1/-1 with equal probability (standard choice)
         - "mammen": Two-point distribution (asymptotically valid, matches skewness)
         - "webb": Six-point distribution (recommended when n_clusters < 20)
-    bootstrap_weight_type : str, optional
-        .. deprecated:: 1.0.1
-            Use ``bootstrap_weights`` instead. Will be removed in v3.0.
     seed : int, optional
         Random seed for reproducibility.
     rank_deficient_action : str, default="warn"
@@ -293,7 +290,6 @@ class CallawaySantAnna(
         cluster: Optional[str] = None,
         n_bootstrap: int = 0,
         bootstrap_weights: Optional[str] = None,
-        bootstrap_weight_type: Optional[str] = None,
         seed: Optional[int] = None,
         rank_deficient_action: str = "warn",
         base_period: str = "varying",
@@ -323,18 +319,7 @@ class CallawaySantAnna(
                 f"pscore_fallback must be 'error' or 'unconditional', " f"got '{pscore_fallback}'"
             )
-        # Handle bootstrap_weight_type deprecation
-        if bootstrap_weight_type is not None:
-            warnings.warn(
-                "bootstrap_weight_type is deprecated and will be removed in v3.0. "
-                "Use bootstrap_weights instead.",
-                DeprecationWarning,
-                stacklevel=2,
-            )
-            if bootstrap_weights is None:
-                bootstrap_weights = bootstrap_weight_type
-        # Default to rademacher if neither specified
+        # Default to rademacher if not specified
         if bootstrap_weights is None:
             bootstrap_weights = "rademacher"
@@ -362,8 +347,6 @@ class CallawaySantAnna(
         self.cluster = cluster
         self.n_bootstrap = n_bootstrap
         self.bootstrap_weights = bootstrap_weights
-        # Keep bootstrap_weight_type for backward compatibility
-        self.bootstrap_weight_type = bootstrap_weights
         self.seed = seed
         self.rank_deficient_action = rank_deficient_action
         self.base_period = base_period
@@ -3881,8 +3864,6 @@ class CallawaySantAnna(
             "cluster": self.cluster,
             "n_bootstrap": self.n_bootstrap,
             "bootstrap_weights": self.bootstrap_weights,
-            # Deprecated but kept for backward compatibility
-            "bootstrap_weight_type": self.bootstrap_weight_type,
             "seed": self.seed,
             "rank_deficient_action": self.rank_deficient_action,
             "base_period": self.base_period,

{diff_diff-2.9.1 → diff_diff-3.0.0}/diff_diff/staggered_bootstrap.py RENAMED Viewed

@@ -118,7 +118,7 @@ class CallawaySantAnnaBootstrapMixin:
     # Type hints for attributes accessed from the main class
     n_bootstrap: int
-    bootstrap_weight_type: str
+    bootstrap_weights: str
     alpha: float
     seed: Optional[int]
     anticipation: int
@@ -329,7 +329,7 @@ class CallawaySantAnnaBootstrapMixin:
         if _use_survey_bootstrap:
             # PSU-level multiplier weights
             psu_weights, psu_ids = _generate_survey_multiplier_weights_batch(
-                self.n_bootstrap, resolved_survey_unit, self.bootstrap_weight_type, rng
+                self.n_bootstrap, resolved_survey_unit, self.bootstrap_weights, rng
             )
             # Build unit → PSU column map
             if resolved_survey_unit.psu is not None:
@@ -348,7 +348,7 @@ class CallawaySantAnnaBootstrapMixin:
         else:
             # Standard unit-level weights (no survey or weights-only)
             all_bootstrap_weights = _generate_bootstrap_weights_batch(
-                self.n_bootstrap, n_units, self.bootstrap_weight_type, rng
+                self.n_bootstrap, n_units, self.bootstrap_weights, rng
             )
         # Vectorized bootstrap ATT(g,t) computation
@@ -534,7 +534,7 @@ class CallawaySantAnnaBootstrapMixin:
         return CSBootstrapResults(
             n_bootstrap=self.n_bootstrap,
-            weight_type=self.bootstrap_weight_type,
+            weight_type=self.bootstrap_weights,
             alpha=self.alpha,
             overall_att_se=overall_se,
             overall_att_ci=overall_ci,

{diff_diff-2.9.1 → diff_diff-3.0.0}/diff_diff/staggered_triple_diff.py RENAMED Viewed

@@ -147,7 +147,6 @@ class StaggeredTripleDifference(
         self.base_period = base_period
         self.n_bootstrap = n_bootstrap
         self.bootstrap_weights = bootstrap_weights
-        self.bootstrap_weight_type = bootstrap_weights
         self.seed = seed
         self.cband = cband
         self.pscore_trim = pscore_trim
@@ -186,7 +185,7 @@ class StaggeredTripleDifference(
                 raise ValueError(f"Unknown parameter: {key}")
             setattr(self, key, value)
         if "bootstrap_weights" in params:
-            self.bootstrap_weight_type = params["bootstrap_weights"]
+            self.bootstrap_weights = params["bootstrap_weights"]
         return self
     # ------------------------------------------------------------------

{diff_diff-2.9.1 → diff_diff-3.0.0}/diff_diff/synthetic_did.py RENAMED Viewed

@@ -144,14 +144,14 @@ class SyntheticDiD(DifferenceInDifferences):
             warnings.warn(
                 "lambda_reg is deprecated and ignored. Regularization is now "
                 "auto-computed from data. Use zeta_omega to override unit weight "
-                "regularization.",
+                "regularization. Will be removed in v3.1.",
                 DeprecationWarning,
                 stacklevel=2,
             )
         if zeta is not None:
             warnings.warn(
                 "zeta is deprecated and ignored. Use zeta_lambda to override "
-                "time weight regularization.",
+                "time weight regularization. Will be removed in v3.1.",
                 DeprecationWarning,
                 stacklevel=2,
             )
@@ -1124,7 +1124,8 @@ class SyntheticDiD(DifferenceInDifferences):
         for key, value in params.items():
             if key in _deprecated:
                 warnings.warn(
-                    f"{key} is deprecated and ignored. Use zeta_omega/zeta_lambda " f"instead.",
+                    f"{key} is deprecated and ignored. Use zeta_omega/zeta_lambda "
+                    f"instead. Will be removed in v3.1.",
                     DeprecationWarning,
                     stacklevel=2,
                 )

{diff_diff-2.9.1 → diff_diff-3.0.0}/diff_diff/trop.py RENAMED Viewed

@@ -77,10 +77,6 @@ class TROP(TROPLocalMixin, TROPGlobalMixin):
           ATT is the mean of these effects. For the paper's full
           per-treated-cell estimator, use ``method='local'``.
-        - 'twostep': Deprecated alias for 'local'. Will be removed in v3.0.
-        - 'joint': Deprecated alias for 'global'. Will be removed in v3.0.
     lambda_time_grid : list, optional
         Grid of time weight decay parameters. 0.0 = uniform weights (disabled).
         Must not contain inf. Default: [0, 0.1, 0.5, 1, 2, 5].
@@ -140,26 +136,9 @@ class TROP(TROPLocalMixin, TROPGlobalMixin):
         seed: Optional[int] = None,
     ):
         # Validate method parameter
-        # 'local'/'global' are preferred; 'twostep'/'joint' are deprecated aliases
-        valid_methods = ("local", "twostep", "joint", "global")
+        valid_methods = ("local", "global")
         if method not in valid_methods:
             raise ValueError(f"method must be one of {valid_methods}, got '{method}'")
-        if method == "twostep":
-            warnings.warn(
-                "method='twostep' is deprecated and will be removed in v3.0. "
-                "Use method='local' instead.",
-                FutureWarning,
-                stacklevel=2,
-            )
-            method = "local"
-        if method == "joint":
-            warnings.warn(
-                "method='joint' is deprecated and will be removed in v3.0. "
-                "Use method='global' instead.",
-                FutureWarning,
-                stacklevel=2,
-            )
-            method = "global"
         self.method = method
         # Default grids from paper
@@ -913,22 +892,10 @@ class TROP(TROPLocalMixin, TROPGlobalMixin):
     def set_params(self, **params) -> "TROP":
         """Set estimator parameters."""
         for key, value in params.items():
-            if key == "method" and value == "twostep":
-                warnings.warn(
-                    "method='twostep' is deprecated and will be removed in "
-                    "v3.0. Use method='local' instead.",
-                    FutureWarning,
-                    stacklevel=2,
-                )
-                value = "local"
-            if key == "method" and value == "joint":
-                warnings.warn(
-                    "method='joint' is deprecated and will be removed in "
-                    "v3.0. Use method='global' instead.",
-                    FutureWarning,
-                    stacklevel=2,
+            if key == "method" and value not in ("local", "global"):
+                raise ValueError(
+                    f"method must be one of ('local', 'global'), got '{value}'"
                 )
-                value = "global"
             if hasattr(self, key):
                 setattr(self, key, value)
             else:

{diff_diff-2.9.1 → diff_diff-3.0.0}/diff_diff/wooldridge.py RENAMED Viewed

@@ -42,6 +42,7 @@ def _compute_weighted_agg(
     gt_keys: List,
     gt_vcov: Optional[np.ndarray],
     alpha: float,
+    df: Optional[int] = None,
 ) -> Dict:
     """Compute simple (overall) weighted average ATT and SE via delta method."""
     post_keys = [(g, t) for (g, t) in gt_keys if t >= g]
@@ -63,10 +64,54 @@ def _compute_weighted_agg(
         else:
             se = float("nan")
-    t_stat, p_value, conf_int = safe_inference(att, se, alpha=alpha)
+    t_stat, p_value, conf_int = safe_inference(att, se, alpha=alpha, df=df)
     return {"att": att, "se": se, "t_stat": t_stat, "p_value": p_value, "conf_int": conf_int}
+def _resolve_survey_for_wooldridge(survey_design, sample, cluster_ids, cluster_name):
+    """Resolve survey design, inject cluster as PSU, recompute metadata.
+    Shared helper for all three WooldridgeDiD sub-fitters.  Matches the
+    resolution chain in DifferenceInDifferences.fit() (estimators.py:344-359).
+    """
+    from diff_diff.survey import (
+        _resolve_survey_for_fit,
+        _resolve_effective_cluster,
+        _inject_cluster_as_psu,
+        compute_survey_metadata,
+    )
+    resolved, survey_weights, survey_weight_type, survey_metadata = (
+        _resolve_survey_for_fit(survey_design, sample)
+    )
+    if resolved is not None and resolved.uses_replicate_variance:
+        raise NotImplementedError(
+            "WooldridgeDiD does not yet support replicate-weight variance. "
+            "Use TSL (strata/PSU/FPC) instead."
+        )
+    if resolved is not None and resolved.weight_type != "pweight":
+        raise ValueError(
+            f"WooldridgeDiD survey support requires weight_type='pweight', "
+            f"got '{resolved.weight_type}'. The survey variance math "
+            f"assumes probability weights (pweight)."
+        )
+    if resolved is not None:
+        effective_cluster = _resolve_effective_cluster(
+            resolved, cluster_ids, cluster_name
+        )
+        if effective_cluster is not None:
+            resolved = _inject_cluster_as_psu(resolved, effective_cluster)
+            if resolved.psu is not None and survey_metadata is not None:
+                raw_w = (
+                    sample[survey_design.weights].values.astype(np.float64)
+                    if survey_design.weights
+                    else np.ones(len(sample), dtype=np.float64)
+                )
+                survey_metadata = compute_survey_metadata(resolved, raw_w)
+    df_inf = resolved.df_survey if resolved is not None else None
+    return resolved, survey_weights, survey_weight_type, survey_metadata, df_inf
 def _filter_sample(
     data: pd.DataFrame,
     unit: str,
@@ -329,6 +374,7 @@ class WooldridgeDiD:
         exovar: Optional[List[str]] = None,
         xtvar: Optional[List[str]] = None,
         xgvar: Optional[List[str]] = None,
+        survey_design=None,
     ) -> WooldridgeDiDResults:
         """Fit the ETWFE model.  See class docstring for parameter details.
@@ -343,6 +389,11 @@ class WooldridgeDiD:
         xtvar : time-varying covariates (demeaned within cohort×period cells
                 when ``demean_covariates=True``)
         xgvar : covariates interacted with each cohort indicator
+        survey_design : SurveyDesign, optional
+            Survey design specification for complex survey data.  Supports
+            stratified, clustered, and weighted designs via Taylor Series
+            Linearization (TSL).  Replicate-weight designs raise
+            ``NotImplementedError``.
         """
         df = data.copy()
         df[cohort] = df[cohort].fillna(0)
@@ -366,6 +417,13 @@ class WooldridgeDiD:
                 f"Set n_bootstrap=0 for analytic SEs."
             )
+        # 0c. Reject bootstrap + survey (no survey-aware bootstrap variant)
+        if self.n_bootstrap > 0 and survey_design is not None:
+            raise ValueError(
+                "Bootstrap inference is not supported with survey_design. "
+                "Set n_bootstrap=0 for analytic survey SEs."
+            )
         # 1. Filter to analysis sample
         sample = _filter_sample(df, unit, time, cohort, self.control_group, self.anticipation)
@@ -502,6 +560,7 @@ class WooldridgeDiD:
                 gt_keys,
                 int_col_names,
                 groups,
+                survey_design=survey_design,
             )
         elif self.method == "logit":
             n_cov_interact = X_cov.shape[1] if X_cov is not None else 0
@@ -517,6 +576,7 @@ class WooldridgeDiD:
                 int_col_names,
                 groups,
                 n_cov_interact=n_cov_interact,
+                survey_design=survey_design,
             )
         else:  # poisson
             n_cov_interact = X_cov.shape[1] if X_cov is not None else 0
@@ -532,6 +592,7 @@ class WooldridgeDiD:
                 int_col_names,
                 groups,
                 n_cov_interact=n_cov_interact,
+                survey_design=survey_design,
             )
         self._results = results
@@ -561,8 +622,21 @@ class WooldridgeDiD:
         gt_keys: List[Tuple],
         int_col_names: List[str],
         groups: List[Any],
+        survey_design=None,
     ) -> WooldridgeDiDResults:
         """OLS path: within-transform FE, solve_ols, cluster SE."""
+        # Reset index so numpy positional indexing matches pandas groupby
+        sample = sample.reset_index(drop=True)
+        # Cluster IDs (default: unit level) — needed before survey resolution
+        cluster_col = self.cluster if self.cluster else unit
+        cluster_ids = sample[cluster_col].values
+        # Resolve survey design, inject cluster as PSU only when user explicitly set cluster=
+        survey_cluster_ids = cluster_ids if self.cluster else None
+        resolved, survey_weights, survey_weight_type, survey_metadata, df_inf = (
+            _resolve_survey_for_wooldridge(survey_design, sample, survey_cluster_ids, self.cluster)
+        )
         # 4. Within-transform: absorb unit + time FE
         all_vars = [outcome] + [f"_x{i}" for i in range(X_design.shape[1])]
         tmp = sample[[unit, time]].copy()
@@ -570,32 +644,60 @@ class WooldridgeDiD:
         for i in range(X_design.shape[1]):
             tmp[f"_x{i}"] = X_design[:, i]
-        # Use uniform weights to trigger iterative alternating projections,
-        # which is exact for both balanced and unbalanced panels.
-        # The one-pass formula (y - ȳ_i - ȳ_t + ȳ) is only exact for balanced panels.
+        # Use iterative alternating projections for demeaning (exact for
+        # both balanced and unbalanced panels).  Survey weights change the
+        # weighted FWL projection — all columns (treatment interactions +
+        # covariates) are demeaned together.
+        wt_weights = survey_weights if survey_weights is not None else np.ones(len(tmp))
+        # Guard: zero-weight unit/time groups cause 0/0 in within_transform
+        if survey_weights is not None and np.any(survey_weights == 0):
+            sw_series = pd.Series(survey_weights, index=sample.index)
+            for grp_col, grp_label in [(unit, "unit"), (time, "time period")]:
+                grp_sums = sw_series.groupby(sample[grp_col]).sum()
+                zero_grps = grp_sums[grp_sums == 0].index.tolist()
+                if zero_grps:
+                    raise ValueError(
+                        f"Survey weights sum to zero for {grp_label}(s) "
+                        f"{zero_grps[:3]}. Cannot compute weighted "
+                        f"within-transformation. Remove zero-weight "
+                        f"{grp_label}s or use non-zero weights."
+                    )
         transformed = within_transform(
             tmp, all_vars, unit=unit, time=time, suffix="_demeaned",
-            weights=np.ones(len(tmp)),
+            weights=wt_weights,
         )
         y = transformed[f"{outcome}_demeaned"].values
         X_cols = [f"_x{i}_demeaned" for i in range(X_design.shape[1])]
         X = transformed[X_cols].values
-        # 5. Cluster IDs (default: unit level)
-        cluster_col = self.cluster if self.cluster else unit
-        cluster_ids = sample[cluster_col].values
-        # 6. Solve OLS
+        # 6. Solve OLS (skip cluster-robust vcov when survey will provide TSL vcov)
         coefs, resids, vcov = solve_ols(
             X,
             y,
             cluster_ids=cluster_ids,
-            return_vcov=True,
+            return_vcov=(resolved is None),
             rank_deficient_action=self.rank_deficient_action,
             column_names=col_names,
+            weights=survey_weights,
+            weight_type=survey_weight_type,
         )
+        # Survey TSL vcov replaces cluster-robust vcov
+        if resolved is not None:
+            from diff_diff.survey import compute_survey_vcov
+            nan_mask_ols = np.isnan(coefs)
+            if np.any(nan_mask_ols):
+                kept = ~nan_mask_ols
+                vcov_kept = compute_survey_vcov(X[:, kept], resids, resolved)
+                vcov = np.full((len(coefs), len(coefs)), np.nan)
+                kept_idx = np.where(kept)[0]
+                vcov[np.ix_(kept_idx, kept_idx)] = vcov_kept
+            else:
+                vcov = compute_survey_vcov(X, resids, resolved)
         # 7. Extract β_{g,t} and build gt_effects dict
         gt_effects: Dict[Tuple, Dict] = {}
         gt_weights: Dict[Tuple, int] = {}
@@ -607,7 +709,7 @@ class WooldridgeDiD:
                 continue
             att = float(coefs[idx])
             se = float(np.sqrt(max(vcov[idx, idx], 0.0))) if vcov is not None else float("nan")
-            t_stat, p_value, conf_int = safe_inference(att, se, alpha=self.alpha)
+            t_stat, p_value, conf_int = safe_inference(att, se, alpha=self.alpha, df=df_inf)
             gt_effects[(g, t)] = {
                 "att": att,
                 "se": se,
@@ -628,7 +730,7 @@ class WooldridgeDiD:
         # 8. Simple aggregation (always computed)
         overall = _compute_weighted_agg(
-            gt_effects, gt_weights, gt_keys_ordered, gt_vcov, self.alpha
+            gt_effects, gt_weights, gt_keys_ordered, gt_vcov, self.alpha, df=df_inf
         )
         # Metadata
@@ -652,9 +754,11 @@ class WooldridgeDiD:
             n_control_units=n_control,
             alpha=self.alpha,
             anticipation=self.anticipation,
+            survey_metadata=survey_metadata,
             _gt_weights=gt_weights,
             _gt_vcov=gt_vcov,
             _gt_keys=gt_keys_ordered,
+            _df_survey=df_inf,
         )
         # 9. Optional multiplier bootstrap (overrides analytic SE for overall ATT)
@@ -723,6 +827,7 @@ class WooldridgeDiD:
         int_col_names: List[str],
         groups: List[Any],
         n_cov_interact: int = 0,
+        survey_design=None,
     ) -> WooldridgeDiDResults:
         """Logit path: cohort + time additive FEs + solve_logit + ASF ATT.
@@ -749,10 +854,18 @@ class WooldridgeDiD:
         cluster_col = self.cluster if self.cluster else unit
         cluster_ids = sample[cluster_col].values
+        # Resolve survey design, inject cluster as PSU only when user explicitly set cluster=
+        survey_cluster_ids = cluster_ids if self.cluster else None
+        resolved, survey_weights, survey_weight_type, survey_metadata, df_inf = (
+            _resolve_survey_for_wooldridge(survey_design, sample, survey_cluster_ids, self.cluster)
+        )
+        _has_survey = resolved is not None
         beta, probs = solve_logit(
             X_full,
             y,
             rank_deficient_action=self.rank_deficient_action,
+            weights=survey_weights,
         )
         # solve_logit prepends intercept — beta[0] is intercept, beta[1:] are X_full cols
         beta_int_cols = beta[1 : n_int + 1]  # treatment interaction coefficients
@@ -763,34 +876,65 @@ class WooldridgeDiD:
         beta_clean = np.where(nan_mask, 0.0, beta)
         kept_beta = ~nan_mask
-        # QMLE sandwich vcov via shared linalg backend
+        # QMLE sandwich vcov
         resids = y - probs
         X_with_intercept = np.column_stack([np.ones(len(y)), X_full])
-        if np.any(nan_mask):
-            # Compute vcov on reduced design (only identified columns)
-            X_reduced = X_with_intercept[:, kept_beta]
-            vcov_reduced = compute_robust_vcov(
-                X_reduced,
-                resids,
-                cluster_ids=cluster_ids,
-                weights=probs * (1 - probs),
-                weight_type="aweight",
-            )
-            # Expand back to full size with NaN for dropped columns
-            k_full = len(beta)
-            vcov_full = np.full((k_full, k_full), np.nan)
-            kept_idx = np.where(kept_beta)[0]
-            vcov_full[np.ix_(kept_idx, kept_idx)] = vcov_reduced
+        if _has_survey:
+            # X_tilde trick: transform design matrix so compute_survey_vcov
+            # produces the correct QMLE sandwich for nonlinear models.
+            # Bread: (X_tilde'WX_tilde)^{-1} = (X'diag(w*V)X)^{-1}
+            # Scores: w*X_tilde*r_tilde = w*X*(y-mu)
+            from diff_diff.survey import compute_survey_vcov
+            V = probs * (1 - probs)
+            sqrt_V = np.sqrt(np.clip(V, 1e-20, None))
+            X_tilde = X_with_intercept * sqrt_V[:, None]
+            r_tilde = resids / sqrt_V
+            if np.any(nan_mask):
+                X_tilde_r = X_tilde[:, kept_beta]
+                vcov_reduced = compute_survey_vcov(X_tilde_r, r_tilde, resolved)
+                k_full = len(beta)
+                vcov_full = np.full((k_full, k_full), np.nan)
+                kept_idx = np.where(kept_beta)[0]
+                vcov_full[np.ix_(kept_idx, kept_idx)] = vcov_reduced
+            else:
+                vcov_full = compute_survey_vcov(X_tilde, r_tilde, resolved)
         else:
-            vcov_full = compute_robust_vcov(
-                X_with_intercept,
-                resids,
-                cluster_ids=cluster_ids,
-                weights=probs * (1 - probs),
-                weight_type="aweight",
-            )
+            # Cluster-robust QMLE sandwich (non-survey path)
+            if np.any(nan_mask):
+                X_reduced = X_with_intercept[:, kept_beta]
+                vcov_reduced = compute_robust_vcov(
+                    X_reduced,
+                    resids,
+                    cluster_ids=cluster_ids,
+                    weights=probs * (1 - probs),
+                    weight_type="aweight",
+                )
+                k_full = len(beta)
+                vcov_full = np.full((k_full, k_full), np.nan)
+                kept_idx = np.where(kept_beta)[0]
+                vcov_full[np.ix_(kept_idx, kept_idx)] = vcov_reduced
+            else:
+                vcov_full = compute_robust_vcov(
+                    X_with_intercept,
+                    resids,
+                    cluster_ids=cluster_ids,
+                    weights=probs * (1 - probs),
+                    weight_type="aweight",
+                )
         beta = beta_clean
+        # Survey-weighted averaging helpers for ASF computation
+        def _avg(a, cell_mask):
+            if survey_weights is not None:
+                return float(np.average(a, weights=survey_weights[cell_mask]))
+            return float(np.mean(a))
+        def _avg_ax0(a, cell_mask):
+            if survey_weights is not None:
+                return np.average(a, weights=survey_weights[cell_mask], axis=0)
+            return np.mean(a, axis=0)
         # ASF ATT(g,t) for treated units in each cell
         gt_effects: Dict[Tuple, Dict] = {}
         gt_weights: Dict[Tuple, int] = {}
@@ -802,6 +946,9 @@ class WooldridgeDiD:
             if cell_mask.sum() == 0:
                 continue
             # Skip cells whose interaction coefficient was dropped (rank deficiency)
+            # Skip cells where all survey weights are zero (non-estimable)
+            if survey_weights is not None and np.sum(survey_weights[cell_mask]) == 0:
+                continue
             delta = beta_int_cols[idx]
             if np.isnan(delta):
                 continue
@@ -816,26 +963,26 @@ class WooldridgeDiD:
                     x_hat_j = X_with_intercept[cell_mask, coef_pos]
                     delta_total = delta_total + beta[coef_pos] * x_hat_j
             eta_0 = eta_base - delta_total
-            att = float(np.mean(_logistic(eta_base) - _logistic(eta_0)))
+            att = _avg(_logistic(eta_base) - _logistic(eta_0), cell_mask)
             # Delta method gradient: d(ATT)/d(β)
             #   for nuisance p: mean_i[(Λ'(η_1) - Λ'(η_0)) * X_p]
             #   for cell intercept: mean_i[Λ'(η_1)]
             #   for cell × cov j: mean_i[Λ'(η_1) * x_hat_j]
             d_diff = _logistic_deriv(eta_base) - _logistic_deriv(eta_0)
-            grad = np.mean(X_with_intercept[cell_mask] * d_diff[:, None], axis=0)
-            grad[1 + idx] = float(np.mean(_logistic_deriv(eta_base)))
+            grad = _avg_ax0(X_with_intercept[cell_mask] * d_diff[:, None], cell_mask)
+            grad[1 + idx] = _avg(_logistic_deriv(eta_base), cell_mask)
             for j in range(n_cov_interact):
                 coef_pos = 1 + n_int + idx * n_cov_interact + j
                 if coef_pos < len(beta):
                     x_hat_j = X_with_intercept[cell_mask, coef_pos]
-                    grad[coef_pos] = float(np.mean(_logistic_deriv(eta_base) * x_hat_j))
+                    grad[coef_pos] = _avg(_logistic_deriv(eta_base) * x_hat_j, cell_mask)
             # Compute SE in reduced parameter space if rank-deficient
             if np.any(nan_mask):
                 grad_r = grad[kept_beta]
                 se = float(np.sqrt(max(grad_r @ vcov_reduced @ grad_r, 0.0)))
             else:
                 se = float(np.sqrt(max(grad @ vcov_full @ grad, 0.0)))
-            t_stat, p_value, conf_int = safe_inference(att, se, alpha=self.alpha)
+            t_stat, p_value, conf_int = safe_inference(att, se, alpha=self.alpha, df=df_inf)
             gt_effects[(g, t)] = {
                 "att": att,
                 "se": se,
@@ -864,7 +1011,7 @@ class WooldridgeDiD:
             overall_att = sum(gt_weights[k] * gt_effects[k]["att"] for k in post_keys) / w_total
             agg_grad = sum((gt_weights[k] / w_total) * gt_grads[k] for k in post_keys)
             overall_se = float(np.sqrt(max(agg_grad @ _vcov_se @ agg_grad, 0.0)))
-            t_stat, p_value, conf_int = safe_inference(overall_att, overall_se, alpha=self.alpha)
+            t_stat, p_value, conf_int = safe_inference(overall_att, overall_se, alpha=self.alpha, df=df_inf)
             overall = {
                 "att": overall_att,
                 "se": overall_se,
@@ -874,7 +1021,7 @@ class WooldridgeDiD:
             }
         else:
             overall = _compute_weighted_agg(
-                gt_effects, gt_weights, gt_keys_ordered, None, self.alpha
+                gt_effects, gt_weights, gt_keys_ordered, None, self.alpha, df=df_inf
             )
         return WooldridgeDiDResults(
@@ -893,9 +1040,11 @@ class WooldridgeDiD:
             n_control_units=self._count_control_units(sample, unit, cohort, time),
             alpha=self.alpha,
             anticipation=self.anticipation,
+            survey_metadata=survey_metadata,
             _gt_weights=gt_weights,
             _gt_vcov=gt_vcov,
             _gt_keys=gt_keys_ordered,
+            _df_survey=df_inf,
         )
     def _fit_poisson(
@@ -911,6 +1060,7 @@ class WooldridgeDiD:
         int_col_names: List[str],
         groups: List[Any],
         n_cov_interact: int = 0,
+        survey_design=None,
     ) -> WooldridgeDiDResults:
         """Poisson path: cohort + time additive FEs + solve_poisson + ASF ATT.
@@ -940,7 +1090,18 @@ class WooldridgeDiD:
         cluster_col = self.cluster if self.cluster else unit
         cluster_ids = sample[cluster_col].values
-        beta, mu_hat = solve_poisson(X_full, y, rank_deficient_action=self.rank_deficient_action)
+        # Resolve survey design, inject cluster as PSU only when user explicitly set cluster=
+        survey_cluster_ids = cluster_ids if self.cluster else None
+        resolved, survey_weights, survey_weight_type, survey_metadata, df_inf = (
+            _resolve_survey_for_wooldridge(survey_design, sample, survey_cluster_ids, self.cluster)
+        )
+        _has_survey = resolved is not None
+        beta, mu_hat = solve_poisson(
+            X_full, y,
+            rank_deficient_action=self.rank_deficient_action,
+            weights=survey_weights,
+        )
         # Handle rank-deficient designs: compute vcov on reduced design.
         # Preserve raw interaction coefficients BEFORE zeroing NaN so the
@@ -950,34 +1111,63 @@ class WooldridgeDiD:
         beta_clean = np.where(nan_mask, 0.0, beta)
         kept_beta = ~nan_mask
-        # QMLE sandwich vcov via shared linalg backend
+        # QMLE sandwich vcov
         resids = y - mu_hat
-        if np.any(nan_mask):
-            X_reduced = X_full[:, kept_beta]
-            vcov_reduced = compute_robust_vcov(
-                X_reduced,
-                resids,
-                cluster_ids=cluster_ids,
-                weights=mu_hat,
-                weight_type="aweight",
-            )
-            k_full = len(beta)
-            vcov_full = np.full((k_full, k_full), np.nan)
-            kept_idx = np.where(kept_beta)[0]
-            vcov_full[np.ix_(kept_idx, kept_idx)] = vcov_reduced
+        if _has_survey:
+            # X_tilde trick for nonlinear survey vcov (V = mu for Poisson)
+            from diff_diff.survey import compute_survey_vcov
+            sqrt_V = np.sqrt(np.clip(mu_hat, 1e-20, None))
+            X_tilde = X_full * sqrt_V[:, None]
+            r_tilde = resids / sqrt_V
+            if np.any(nan_mask):
+                X_tilde_r = X_tilde[:, kept_beta]
+                vcov_reduced = compute_survey_vcov(X_tilde_r, r_tilde, resolved)
+                k_full = len(beta)
+                vcov_full = np.full((k_full, k_full), np.nan)
+                kept_idx = np.where(kept_beta)[0]
+                vcov_full[np.ix_(kept_idx, kept_idx)] = vcov_reduced
+            else:
+                vcov_full = compute_survey_vcov(X_tilde, r_tilde, resolved)
         else:
-            vcov_full = compute_robust_vcov(
-                X_full,
-                resids,
-                cluster_ids=cluster_ids,
-                weights=mu_hat,
-                weight_type="aweight",
-            )
+            # Cluster-robust QMLE sandwich (non-survey path)
+            if np.any(nan_mask):
+                X_reduced = X_full[:, kept_beta]
+                vcov_reduced = compute_robust_vcov(
+                    X_reduced,
+                    resids,
+                    cluster_ids=cluster_ids,
+                    weights=mu_hat,
+                    weight_type="aweight",
+                )
+                k_full = len(beta)
+                vcov_full = np.full((k_full, k_full), np.nan)
+                kept_idx = np.where(kept_beta)[0]
+                vcov_full[np.ix_(kept_idx, kept_idx)] = vcov_reduced
+            else:
+                vcov_full = compute_robust_vcov(
+                    X_full,
+                    resids,
+                    cluster_ids=cluster_ids,
+                    weights=mu_hat,
+                    weight_type="aweight",
+                )
         beta = beta_clean
         # Treatment interaction coefficients (from cleaned beta for computation)
         beta_int = beta[1 : 1 + n_int]
+        # Survey-weighted averaging helpers for ASF computation
+        def _avg(a, cell_mask):
+            if survey_weights is not None:
+                return float(np.average(a, weights=survey_weights[cell_mask]))
+            return float(np.mean(a))
+        def _avg_ax0(a, cell_mask):
+            if survey_weights is not None:
+                return np.average(a, weights=survey_weights[cell_mask], axis=0)
+            return np.mean(a, axis=0)
         # ASF ATT(g,t) for treated units in each cell.
         # eta_base = X_full @ beta already includes the treatment effect (D_{g,t}=1).
         # Counterfactual: eta_0 = eta_base - delta  (treatment switched off).
@@ -995,6 +1185,9 @@ class WooldridgeDiD:
             # Use raw coefficients (before NaN->0 zeroing) to detect dropped cells.
             if np.isnan(beta_int_raw[idx]):
                 continue
+            # Skip cells where all survey weights are zero (non-estimable)
+            if survey_weights is not None and np.sum(survey_weights[cell_mask]) == 0:
+                continue
             delta = beta_int[idx]
             if np.isnan(delta):
                 continue
@@ -1009,26 +1202,26 @@ class WooldridgeDiD:
             eta_0 = eta_base - delta_total
             mu_1 = np.exp(eta_base)
             mu_0 = np.exp(eta_0)
-            att = float(np.mean(mu_1 - mu_0))
+            att = _avg(mu_1 - mu_0, cell_mask)
             # Delta method gradient:
             #   for nuisance p: mean_i[(μ_1 - μ_0) * X_p]
             #   for cell intercept: mean_i[μ_1]
             #   for cell × cov j: mean_i[μ_1 * x_hat_j]
             diff_mu = mu_1 - mu_0
-            grad = np.mean(X_full[cell_mask] * diff_mu[:, None], axis=0)
-            grad[1 + idx] = float(np.mean(mu_1))
+            grad = _avg_ax0(X_full[cell_mask] * diff_mu[:, None], cell_mask)
+            grad[1 + idx] = _avg(mu_1, cell_mask)
             for j in range(n_cov_interact):
                 coef_pos = 1 + n_int + idx * n_cov_interact + j
                 if coef_pos < len(beta):
                     x_hat_j = X_full[cell_mask, coef_pos]
-                    grad[coef_pos] = float(np.mean(mu_1 * x_hat_j))
+                    grad[coef_pos] = _avg(mu_1 * x_hat_j, cell_mask)
             # Compute SE in reduced parameter space if rank-deficient
             if np.any(nan_mask):
                 grad_r = grad[kept_beta]
                 se = float(np.sqrt(max(grad_r @ vcov_reduced @ grad_r, 0.0)))
             else:
                 se = float(np.sqrt(max(grad @ vcov_full @ grad, 0.0)))
-            t_stat, p_value, conf_int = safe_inference(att, se, alpha=self.alpha)
+            t_stat, p_value, conf_int = safe_inference(att, se, alpha=self.alpha, df=df_inf)
             gt_effects[(g, t)] = {
                 "att": att,
                 "se": se,
@@ -1055,7 +1248,7 @@ class WooldridgeDiD:
             overall_att = sum(gt_weights[k] * gt_effects[k]["att"] for k in post_keys) / w_total
             agg_grad = sum((gt_weights[k] / w_total) * gt_grads[k] for k in post_keys)
             overall_se = float(np.sqrt(max(agg_grad @ _vcov_se @ agg_grad, 0.0)))
-            t_stat, p_value, conf_int = safe_inference(overall_att, overall_se, alpha=self.alpha)
+            t_stat, p_value, conf_int = safe_inference(overall_att, overall_se, alpha=self.alpha, df=df_inf)
             overall = {
                 "att": overall_att,
                 "se": overall_se,
@@ -1065,7 +1258,7 @@ class WooldridgeDiD:
             }
         else:
             overall = _compute_weighted_agg(
-                gt_effects, gt_weights, gt_keys_ordered, None, self.alpha
+                gt_effects, gt_weights, gt_keys_ordered, None, self.alpha, df=df_inf
             )
         return WooldridgeDiDResults(
@@ -1084,7 +1277,9 @@ class WooldridgeDiD:
             n_control_units=self._count_control_units(sample, unit, cohort, time),
             alpha=self.alpha,
             anticipation=self.anticipation,
+            survey_metadata=survey_metadata,
             _gt_weights=gt_weights,
             _gt_vcov=gt_vcov,
             _gt_keys=gt_keys_ordered,
+            _df_survey=df_inf,
         )

{diff_diff-2.9.1 → diff_diff-3.0.0}/diff_diff/wooldridge_results.py RENAMED Viewed

@@ -54,6 +54,7 @@ class WooldridgeDiDResults:
     n_control_units: int = 0
     alpha: float = 0.05
     anticipation: int = 0
+    survey_metadata: Optional[Any] = field(default=None, repr=False)
     # ------------------------------------------------------------------ #
     # Internal — used by aggregate() for delta-method SEs                 #
@@ -63,6 +64,8 @@ class WooldridgeDiDResults:
     """Full vcov of all β_{g,t} coefficients (ordered same as sorted group_time_effects keys)."""
     _gt_keys: List[Tuple[Any, Any]] = field(default_factory=list, repr=False)
     """Ordered list of (g,t) keys corresponding to _gt_vcov columns."""
+    _df_survey: Optional[int] = field(default=None, repr=False)
+    """Survey degrees of freedom for t-distribution inference."""
     # ------------------------------------------------------------------ #
     # Public methods                                                      #
@@ -93,7 +96,7 @@ class WooldridgeDiDResults:
             return float(np.sqrt(max(w_vec @ vcov @ w_vec, 0.0)))
         def _build_effect(att: float, se: float) -> Dict[str, Any]:
-            t_stat, p_value, conf_int = safe_inference(att, se, alpha=self.alpha)
+            t_stat, p_value, conf_int = safe_inference(att, se, alpha=self.alpha, df=self._df_survey)
             return {
                 "att": att,
                 "se": se,
@@ -181,6 +184,11 @@ class WooldridgeDiDResults:
             "-" * 70,
         ]
+        if self.survey_metadata is not None:
+            from diff_diff.results import _format_survey_block
+            lines.extend(_format_survey_block(self.survey_metadata, 70))
+            lines.append("-" * 70)
         def _fmt_row(label: str, att: float, se: float, t: float, p: float, ci: Tuple) -> str:
             from diff_diff.results import _get_significance_stars  # type: ignore

{diff_diff-2.9.1 → diff_diff-3.0.0}/pyproject.toml RENAMED Viewed

@@ -4,7 +4,7 @@ build-backend = "maturin"
 [project]
 name = "diff-diff"
-version = "2.9.1"
+version = "3.0.0"
 description = "Difference-in-Differences causal inference with sklearn-like API. Callaway-Sant'Anna, Synthetic DiD, Honest DiD, event studies, parallel trends."
 readme = "README.md"
 license = "MIT"

{diff_diff-2.9.1 → diff_diff-3.0.0}/rust/Cargo.lock RENAMED Viewed

@@ -197,7 +197,7 @@ checksum = "930c7171c8df9fb1782bdf9b918ed9ed2d33d1d22300abb754f9085bc48bf8e8"
 [[package]]
 name = "diff_diff_rust"
-version = "2.9.1"
+version = "3.0.0"
 dependencies = [
  "blas-src",
  "faer",

{diff_diff-2.9.1 → diff_diff-3.0.0}/rust/Cargo.toml RENAMED Viewed

@@ -1,6 +1,6 @@
 [package]
 name = "diff_diff_rust"
-version = "2.9.1"
+version = "3.0.0"
 edition = "2021"
 description = "Rust backend for diff-diff DiD library"
 license = "MIT"