diff-diff 2.2.0__tar.gz → 2.3.0__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (35) hide show
  1. {diff_diff-2.2.0 → diff_diff-2.3.0}/PKG-INFO +145 -23
  2. {diff_diff-2.2.0 → diff_diff-2.3.0}/README.md +142 -22
  3. {diff_diff-2.2.0 → diff_diff-2.3.0}/diff_diff/__init__.py +11 -1
  4. {diff_diff-2.2.0 → diff_diff-2.3.0}/diff_diff/diagnostics.py +3 -3
  5. {diff_diff-2.2.0 → diff_diff-2.3.0}/diff_diff/estimators.py +156 -42
  6. {diff_diff-2.2.0 → diff_diff-2.3.0}/diff_diff/honest_did.py +158 -147
  7. diff_diff-2.3.0/diff_diff/imputation.py +2480 -0
  8. {diff_diff-2.2.0 → diff_diff-2.3.0}/diff_diff/pretrends.py +89 -151
  9. {diff_diff-2.2.0 → diff_diff-2.3.0}/diff_diff/results.py +164 -88
  10. {diff_diff-2.2.0 → diff_diff-2.3.0}/diff_diff/sun_abraham.py +6 -6
  11. {diff_diff-2.2.0 → diff_diff-2.3.0}/diff_diff/triple_diff.py +2 -2
  12. {diff_diff-2.2.0 → diff_diff-2.3.0}/diff_diff/trop.py +80 -325
  13. {diff_diff-2.2.0 → diff_diff-2.3.0}/diff_diff/twfe.py +39 -8
  14. {diff_diff-2.2.0 → diff_diff-2.3.0}/diff_diff/visualization.py +209 -214
  15. {diff_diff-2.2.0 → diff_diff-2.3.0}/pyproject.toml +3 -1
  16. {diff_diff-2.2.0 → diff_diff-2.3.0}/rust/Cargo.lock +31 -31
  17. {diff_diff-2.2.0 → diff_diff-2.3.0}/rust/Cargo.toml +1 -1
  18. {diff_diff-2.2.0 → diff_diff-2.3.0}/rust/src/trop.rs +149 -136
  19. {diff_diff-2.2.0 → diff_diff-2.3.0}/diff_diff/_backend.py +0 -0
  20. {diff_diff-2.2.0 → diff_diff-2.3.0}/diff_diff/bacon.py +0 -0
  21. {diff_diff-2.2.0 → diff_diff-2.3.0}/diff_diff/datasets.py +0 -0
  22. {diff_diff-2.2.0 → diff_diff-2.3.0}/diff_diff/linalg.py +0 -0
  23. {diff_diff-2.2.0 → diff_diff-2.3.0}/diff_diff/power.py +0 -0
  24. {diff_diff-2.2.0 → diff_diff-2.3.0}/diff_diff/prep.py +0 -0
  25. {diff_diff-2.2.0 → diff_diff-2.3.0}/diff_diff/prep_dgp.py +0 -0
  26. {diff_diff-2.2.0 → diff_diff-2.3.0}/diff_diff/staggered.py +0 -0
  27. {diff_diff-2.2.0 → diff_diff-2.3.0}/diff_diff/staggered_aggregation.py +0 -0
  28. {diff_diff-2.2.0 → diff_diff-2.3.0}/diff_diff/staggered_bootstrap.py +0 -0
  29. {diff_diff-2.2.0 → diff_diff-2.3.0}/diff_diff/staggered_results.py +0 -0
  30. {diff_diff-2.2.0 → diff_diff-2.3.0}/diff_diff/synthetic_did.py +0 -0
  31. {diff_diff-2.2.0 → diff_diff-2.3.0}/diff_diff/utils.py +0 -0
  32. {diff_diff-2.2.0 → diff_diff-2.3.0}/rust/src/bootstrap.rs +0 -0
  33. {diff_diff-2.2.0 → diff_diff-2.3.0}/rust/src/lib.rs +0 -0
  34. {diff_diff-2.2.0 → diff_diff-2.3.0}/rust/src/linalg.rs +0 -0
  35. {diff_diff-2.2.0 → diff_diff-2.3.0}/rust/src/weights.rs +0 -0
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.4
2
2
  Name: diff-diff
3
- Version: 2.2.0
3
+ Version: 2.3.0
4
4
  Classifier: Development Status :: 5 - Production/Stable
5
5
  Classifier: Intended Audience :: Science/Research
6
6
  Classifier: Operating System :: OS Independent
@@ -14,10 +14,12 @@ Requires-Dist: numpy>=1.20.0
14
14
  Requires-Dist: pandas>=1.3.0
15
15
  Requires-Dist: scipy>=1.7.0
16
16
  Requires-Dist: pytest>=7.0 ; extra == 'dev'
17
+ Requires-Dist: pytest-xdist>=3.0 ; extra == 'dev'
17
18
  Requires-Dist: pytest-cov>=4.0 ; extra == 'dev'
18
19
  Requires-Dist: black>=23.0 ; extra == 'dev'
19
20
  Requires-Dist: ruff>=0.1.0 ; extra == 'dev'
20
21
  Requires-Dist: mypy>=1.0 ; extra == 'dev'
22
+ Requires-Dist: maturin>=1.4,<2.0 ; extra == 'dev'
21
23
  Requires-Dist: sphinx>=6.0 ; extra == 'docs'
22
24
  Requires-Dist: sphinx-rtd-theme>=1.0 ; extra == 'docs'
23
25
  Provides-Extra: dev
@@ -105,7 +107,7 @@ Signif. codes: '***' 0.001, '**' 0.01, '*' 0.05, '.' 0.1
105
107
  - **Wild cluster bootstrap**: Valid inference with few clusters (<50) using Rademacher, Webb, or Mammen weights
106
108
  - **Panel data support**: Two-way fixed effects estimator for panel designs
107
109
  - **Multi-period analysis**: Event-study style DiD with period-specific treatment effects
108
- - **Staggered adoption**: Callaway-Sant'Anna (2021) and Sun-Abraham (2021) estimators for heterogeneous treatment timing
110
+ - **Staggered adoption**: Callaway-Sant'Anna (2021), Sun-Abraham (2021), and Borusyak-Jaravel-Spiess (2024) imputation estimators for heterogeneous treatment timing
109
111
  - **Triple Difference (DDD)**: Ortiz-Villavicencio & Sant'Anna (2025) estimators with proper covariate handling
110
112
  - **Synthetic DiD**: Combined DiD with synthetic control for improved robustness
111
113
  - **Triply Robust Panel (TROP)**: Factor-adjusted DiD with synthetic weights (Athey et al. 2025)
@@ -596,12 +598,13 @@ results = twfe.fit(
596
598
 
597
599
  ### Multi-Period DiD (Event Study)
598
600
 
599
- For settings with multiple pre- and post-treatment periods:
601
+ For settings with multiple pre- and post-treatment periods. Estimates treatment × period
602
+ interactions for ALL periods (pre and post), enabling parallel trends assessment:
600
603
 
601
604
  ```python
602
605
  from diff_diff import MultiPeriodDiD
603
606
 
604
- # Fit with multiple time periods
607
+ # Fit full event study with pre and post period effects
605
608
  did = MultiPeriodDiD()
606
609
  results = did.fit(
607
610
  panel_data,
@@ -609,18 +612,23 @@ results = did.fit(
609
612
  treatment='treated',
610
613
  time='period',
611
614
  post_periods=[3, 4, 5], # Periods 3-5 are post-treatment
612
- reference_period=0 # Reference period for comparison
615
+ reference_period=2, # Last pre-period (e=-1 convention)
616
+ unit='unit_id', # Optional: warns if staggered adoption detected
613
617
  )
614
618
 
615
- # View period-specific treatment effects
616
- for period, effect in results.period_effects.items():
617
- print(f"Period {period}: {effect.effect:.3f} (SE: {effect.se:.3f})")
619
+ # Pre-period effects test parallel trends (should be ≈ 0)
620
+ for period, effect in results.pre_period_effects.items():
621
+ print(f"Pre {period}: {effect.effect:.3f} (SE: {effect.se:.3f})")
622
+
623
+ # Post-period effects estimate dynamic treatment effects
624
+ for period, effect in results.post_period_effects.items():
625
+ print(f"Post {period}: {effect.effect:.3f} (SE: {effect.se:.3f})")
618
626
 
619
627
  # View average treatment effect across post-periods
620
628
  print(f"Average ATT: {results.avg_att:.3f}")
621
629
  print(f"Average SE: {results.avg_se:.3f}")
622
630
 
623
- # Full summary with all period effects
631
+ # Full summary with pre and post period effects
624
632
  results.print_summary()
625
633
  ```
626
634
 
@@ -908,6 +916,54 @@ print(f"Sun-Abraham ATT: {sa_results.overall_att:.3f}")
908
916
  # If results differ substantially, investigate heterogeneity
909
917
  ```
910
918
 
919
+ ### Borusyak-Jaravel-Spiess Imputation Estimator
920
+
921
+ The Borusyak et al. (2024) imputation estimator is the **efficient** estimator for staggered DiD under parallel trends, producing ~50% shorter confidence intervals than Callaway-Sant'Anna and 2-3.5x shorter than Sun-Abraham under homogeneous treatment effects.
922
+
923
+ ```python
924
+ from diff_diff import ImputationDiD, imputation_did
925
+
926
+ # Basic usage
927
+ est = ImputationDiD()
928
+ results = est.fit(data, outcome='outcome', unit='unit',
929
+ time='period', first_treat='first_treat')
930
+ results.print_summary()
931
+
932
+ # Event study
933
+ results = est.fit(data, outcome='outcome', unit='unit',
934
+ time='period', first_treat='first_treat',
935
+ aggregate='event_study')
936
+
937
+ # Pre-trend test (Equation 9)
938
+ pt = results.pretrend_test(n_leads=3)
939
+ print(f"F-stat: {pt['f_stat']:.3f}, p-value: {pt['p_value']:.4f}")
940
+
941
+ # Convenience function
942
+ results = imputation_did(data, 'outcome', 'unit', 'period', 'first_treat',
943
+ aggregate='all')
944
+ ```
945
+
946
+ ```python
947
+ ImputationDiD(
948
+ anticipation=0, # Number of anticipation periods
949
+ alpha=0.05, # Significance level
950
+ cluster=None, # Cluster variable (defaults to unit)
951
+ n_bootstrap=0, # Bootstrap iterations (0=analytical inference)
952
+ seed=None, # Random seed
953
+ horizon_max=None, # Max event-study horizon
954
+ aux_partition="cohort_horizon", # Variance partition: "cohort_horizon", "cohort", "horizon"
955
+ )
956
+ ```
957
+
958
+ **When to use Imputation DiD vs Callaway-Sant'Anna:**
959
+
960
+ | Aspect | Imputation DiD | Callaway-Sant'Anna |
961
+ |--------|---------------|-------------------|
962
+ | Efficiency | Most efficient under homogeneous effects | Less efficient but more robust to heterogeneity |
963
+ | Control group | Always uses all untreated obs | Choice of never-treated or not-yet-treated |
964
+ | Inference | Conservative variance (Theorem 3) | Multiplier bootstrap |
965
+ | Pre-trends | Built-in F-test (Equation 9) | Separate testing |
966
+
911
967
  ### Triple Difference (DDD)
912
968
 
913
969
  Triple Difference (DDD) is used when treatment requires satisfying two criteria: belonging to a treated **group** AND being in an eligible **partition**. The `TripleDifference` class implements the methodology from Ortiz-Villavicencio & Sant'Anna (2025), which correctly handles covariate adjustment (unlike naive implementations).
@@ -986,10 +1042,10 @@ Create publication-ready event study plots:
986
1042
  ```python
987
1043
  from diff_diff import plot_event_study, MultiPeriodDiD, CallawaySantAnna, SunAbraham
988
1044
 
989
- # From MultiPeriodDiD
1045
+ # From MultiPeriodDiD (full event study with pre and post period effects)
990
1046
  did = MultiPeriodDiD()
991
1047
  results = did.fit(data, outcome='y', treatment='treated',
992
- time='period', post_periods=[3, 4, 5])
1048
+ time='period', post_periods=[3, 4, 5], reference_period=2)
993
1049
  plot_event_study(results, title="Treatment Effects Over Time")
994
1050
 
995
1051
  # From CallawaySantAnna (with event study aggregation)
@@ -1309,7 +1365,6 @@ TROP(
1309
1365
  max_iter=100, # Max iterations for factor estimation
1310
1366
  tol=1e-6, # Convergence tolerance
1311
1367
  alpha=0.05, # Significance level
1312
- variance_method='bootstrap', # 'bootstrap' or 'jackknife'
1313
1368
  n_bootstrap=200, # Bootstrap replications
1314
1369
  seed=None # Random seed
1315
1370
  )
@@ -1449,14 +1504,15 @@ Pre-trends tests have low power and can exacerbate bias. **Honest DiD** (Rambach
1449
1504
  ```python
1450
1505
  from diff_diff import HonestDiD, MultiPeriodDiD
1451
1506
 
1452
- # First, fit a standard event study
1507
+ # First, fit a full event study (pre + post period effects)
1453
1508
  did = MultiPeriodDiD()
1454
1509
  event_results = did.fit(
1455
1510
  data,
1456
1511
  outcome='outcome',
1457
1512
  treatment='treated',
1458
1513
  time='period',
1459
- post_periods=[5, 6, 7, 8, 9]
1514
+ post_periods=[5, 6, 7, 8, 9],
1515
+ reference_period=4, # Last pre-period (e=-1 convention)
1460
1516
  )
1461
1517
 
1462
1518
  # Compute honest bounds with relative magnitudes restriction
@@ -1524,14 +1580,15 @@ A passing pre-trends test doesn't mean parallel trends holds—it may just mean
1524
1580
  ```python
1525
1581
  from diff_diff import PreTrendsPower, MultiPeriodDiD
1526
1582
 
1527
- # First, fit an event study
1583
+ # First, fit a full event study
1528
1584
  did = MultiPeriodDiD()
1529
1585
  event_results = did.fit(
1530
1586
  data,
1531
1587
  outcome='outcome',
1532
1588
  treatment='treated',
1533
1589
  time='period',
1534
- post_periods=[5, 6, 7, 8, 9]
1590
+ post_periods=[5, 6, 7, 8, 9],
1591
+ reference_period=4,
1535
1592
  )
1536
1593
 
1537
1594
  # Analyze pre-trends test power
@@ -1800,7 +1857,8 @@ MultiPeriodDiD(
1800
1857
  | `covariates` | list | Linear control variables |
1801
1858
  | `fixed_effects` | list | Categorical FE columns (creates dummies) |
1802
1859
  | `absorb` | list | High-dimensional FE (within-transformation) |
1803
- | `reference_period` | any | Omitted period for time dummies |
1860
+ | `reference_period` | any | Omitted period (default: last pre-period, e=-1 convention) |
1861
+ | `unit` | str | Unit identifier column (for staggered adoption warning) |
1804
1862
 
1805
1863
  ### MultiPeriodDiDResults
1806
1864
 
@@ -1808,8 +1866,8 @@ MultiPeriodDiD(
1808
1866
 
1809
1867
  | Attribute | Description |
1810
1868
  |-----------|-------------|
1811
- | `period_effects` | Dict mapping periods to PeriodEffect objects |
1812
- | `avg_att` | Average ATT across post-treatment periods |
1869
+ | `period_effects` | Dict mapping periods to PeriodEffect objects (pre and post, excluding reference) |
1870
+ | `avg_att` | Average ATT across post-treatment periods only |
1813
1871
  | `avg_se` | Standard error of average ATT |
1814
1872
  | `avg_t_stat` | T-statistic for average ATT |
1815
1873
  | `avg_p_value` | P-value for average ATT |
@@ -1817,6 +1875,10 @@ MultiPeriodDiD(
1817
1875
  | `n_obs` | Number of observations |
1818
1876
  | `pre_periods` | List of pre-treatment periods |
1819
1877
  | `post_periods` | List of post-treatment periods |
1878
+ | `reference_period` | The omitted reference period (coefficient = 0 by construction) |
1879
+ | `interaction_indices` | Dict mapping period → column index in VCV (for sub-VCV extraction) |
1880
+ | `pre_period_effects` | Property: pre-period effects only (for parallel trends assessment) |
1881
+ | `post_period_effects` | Property: post-period effects only |
1820
1882
 
1821
1883
  **Methods:**
1822
1884
 
@@ -1909,8 +1971,7 @@ TROP(
1909
1971
  max_iter=100, # Max iterations for factor estimation
1910
1972
  tol=1e-6, # Convergence tolerance
1911
1973
  alpha=0.05, # Significance level for CIs
1912
- variance_method='bootstrap', # 'bootstrap' or 'jackknife'
1913
- n_bootstrap=200, # Bootstrap/jackknife iterations
1974
+ n_bootstrap=200, # Bootstrap replications
1914
1975
  seed=None # Random seed
1915
1976
  )
1916
1977
  ```
@@ -1934,7 +1995,7 @@ Note: TROP infers treatment periods from the treatment indicator column. The tre
1934
1995
  | Attribute | Description |
1935
1996
  |-----------|-------------|
1936
1997
  | `att` | Average treatment effect on the treated |
1937
- | `se` | Standard error (bootstrap or jackknife) |
1998
+ | `se` | Standard error (bootstrap) |
1938
1999
  | `t_stat` | T-statistic |
1939
2000
  | `p_value` | P-value |
1940
2001
  | `conf_int` | Confidence interval |
@@ -1953,7 +2014,6 @@ Note: TROP infers treatment periods from the treatment indicator column. The tre
1953
2014
  | `loocv_score` | LOOCV score for selected parameters |
1954
2015
  | `n_pre_periods` | Number of pre-treatment periods |
1955
2016
  | `n_post_periods` | Number of post-treatment periods |
1956
- | `variance_method` | Variance estimation method |
1957
2017
  | `bootstrap_distribution` | Bootstrap distribution (if bootstrap) |
1958
2018
 
1959
2019
  **Methods:**
@@ -2025,6 +2085,60 @@ SunAbraham(
2025
2085
  | `print_summary(alpha)` | Print summary to stdout |
2026
2086
  | `to_dataframe(level)` | Convert to DataFrame ('event_study' or 'cohort') |
2027
2087
 
2088
+ ### ImputationDiD
2089
+
2090
+ ```python
2091
+ ImputationDiD(
2092
+ anticipation=0, # Periods of anticipation effects
2093
+ alpha=0.05, # Significance level for CIs
2094
+ cluster=None, # Column for cluster-robust SEs
2095
+ n_bootstrap=0, # Bootstrap iterations (0 = analytical)
2096
+ seed=None, # Random seed
2097
+ rank_deficient_action='warn', # 'warn', 'error', or 'silent'
2098
+ horizon_max=None, # Max event-study horizon
2099
+ aux_partition='cohort_horizon', # Variance partition
2100
+ )
2101
+ ```
2102
+
2103
+ **fit() Parameters:**
2104
+
2105
+ | Parameter | Type | Description |
2106
+ |-----------|------|-------------|
2107
+ | `data` | DataFrame | Panel data |
2108
+ | `outcome` | str | Outcome variable column name |
2109
+ | `unit` | str | Unit identifier column |
2110
+ | `time` | str | Time period column |
2111
+ | `first_treat` | str | First treatment period column (0 for never-treated) |
2112
+ | `covariates` | list | Covariate column names |
2113
+ | `aggregate` | str | Aggregation: None, "event_study", "group", "all" |
2114
+ | `balance_e` | int | Balance event study to this many pre-treatment periods |
2115
+
2116
+ ### ImputationDiDResults
2117
+
2118
+ **Attributes:**
2119
+
2120
+ | Attribute | Description |
2121
+ |-----------|-------------|
2122
+ | `overall_att` | Overall average treatment effect on the treated |
2123
+ | `overall_se` | Standard error (conservative, Theorem 3) |
2124
+ | `overall_t_stat` | T-statistic |
2125
+ | `overall_p_value` | P-value for H0: ATT = 0 |
2126
+ | `overall_conf_int` | Confidence interval |
2127
+ | `event_study_effects` | Dict of relative time -> effect dict (if `aggregate='event_study'` or `'all'`) |
2128
+ | `group_effects` | Dict of cohort -> effect dict (if `aggregate='group'` or `'all'`) |
2129
+ | `treatment_effects` | DataFrame of unit-level imputed treatment effects |
2130
+ | `n_treated_obs` | Number of treated observations |
2131
+ | `n_untreated_obs` | Number of untreated observations |
2132
+
2133
+ **Methods:**
2134
+
2135
+ | Method | Description |
2136
+ |--------|-------------|
2137
+ | `summary(alpha)` | Get formatted summary string |
2138
+ | `print_summary(alpha)` | Print summary to stdout |
2139
+ | `to_dataframe(level)` | Convert to DataFrame ('observation', 'event_study', 'group') |
2140
+ | `pretrend_test(n_leads)` | Run pre-trend F-test (Equation 9) |
2141
+
2028
2142
  ### TripleDifference
2029
2143
 
2030
2144
  ```python
@@ -2489,6 +2603,14 @@ The `HonestDiD` module implements sensitivity analysis methods for relaxing the
2489
2603
 
2490
2604
  ### Multi-Period and Staggered Adoption
2491
2605
 
2606
+ - **Borusyak, K., Jaravel, X., & Spiess, J. (2024).** "Revisiting Event-Study Designs: Robust and Efficient Estimation." *Review of Economic Studies*, 91(6), 3253-3285. [https://doi.org/10.1093/restud/rdae007](https://doi.org/10.1093/restud/rdae007)
2607
+
2608
+ This paper introduces the imputation estimator implemented in our `ImputationDiD` class:
2609
+ - **Efficient imputation**: OLS on untreated observations → impute counterfactuals → aggregate
2610
+ - **Conservative variance**: Theorem 3 clustered variance estimator with auxiliary model
2611
+ - **Pre-trend test**: Independent of treatment effect estimation (Equation 9)
2612
+ - **Efficiency gains**: ~50% shorter CIs than Callaway-Sant'Anna under homogeneous effects
2613
+
2492
2614
  - **Callaway, B., & Sant'Anna, P. H. C. (2021).** "Difference-in-Differences with Multiple Time Periods." *Journal of Econometrics*, 225(2), 200-230. [https://doi.org/10.1016/j.jeconom.2020.12.001](https://doi.org/10.1016/j.jeconom.2020.12.001)
2493
2615
 
2494
2616
  - **Sant'Anna, P. H. C., & Zhao, J. (2020).** "Doubly Robust Difference-in-Differences Estimators." *Journal of Econometrics*, 219(1), 101-122. [https://doi.org/10.1016/j.jeconom.2020.06.003](https://doi.org/10.1016/j.jeconom.2020.06.003)
@@ -70,7 +70,7 @@ Signif. codes: '***' 0.001, '**' 0.01, '*' 0.05, '.' 0.1
70
70
  - **Wild cluster bootstrap**: Valid inference with few clusters (<50) using Rademacher, Webb, or Mammen weights
71
71
  - **Panel data support**: Two-way fixed effects estimator for panel designs
72
72
  - **Multi-period analysis**: Event-study style DiD with period-specific treatment effects
73
- - **Staggered adoption**: Callaway-Sant'Anna (2021) and Sun-Abraham (2021) estimators for heterogeneous treatment timing
73
+ - **Staggered adoption**: Callaway-Sant'Anna (2021), Sun-Abraham (2021), and Borusyak-Jaravel-Spiess (2024) imputation estimators for heterogeneous treatment timing
74
74
  - **Triple Difference (DDD)**: Ortiz-Villavicencio & Sant'Anna (2025) estimators with proper covariate handling
75
75
  - **Synthetic DiD**: Combined DiD with synthetic control for improved robustness
76
76
  - **Triply Robust Panel (TROP)**: Factor-adjusted DiD with synthetic weights (Athey et al. 2025)
@@ -561,12 +561,13 @@ results = twfe.fit(
561
561
 
562
562
  ### Multi-Period DiD (Event Study)
563
563
 
564
- For settings with multiple pre- and post-treatment periods:
564
+ For settings with multiple pre- and post-treatment periods. Estimates treatment × period
565
+ interactions for ALL periods (pre and post), enabling parallel trends assessment:
565
566
 
566
567
  ```python
567
568
  from diff_diff import MultiPeriodDiD
568
569
 
569
- # Fit with multiple time periods
570
+ # Fit full event study with pre and post period effects
570
571
  did = MultiPeriodDiD()
571
572
  results = did.fit(
572
573
  panel_data,
@@ -574,18 +575,23 @@ results = did.fit(
574
575
  treatment='treated',
575
576
  time='period',
576
577
  post_periods=[3, 4, 5], # Periods 3-5 are post-treatment
577
- reference_period=0 # Reference period for comparison
578
+ reference_period=2, # Last pre-period (e=-1 convention)
579
+ unit='unit_id', # Optional: warns if staggered adoption detected
578
580
  )
579
581
 
580
- # View period-specific treatment effects
581
- for period, effect in results.period_effects.items():
582
- print(f"Period {period}: {effect.effect:.3f} (SE: {effect.se:.3f})")
582
+ # Pre-period effects test parallel trends (should be ≈ 0)
583
+ for period, effect in results.pre_period_effects.items():
584
+ print(f"Pre {period}: {effect.effect:.3f} (SE: {effect.se:.3f})")
585
+
586
+ # Post-period effects estimate dynamic treatment effects
587
+ for period, effect in results.post_period_effects.items():
588
+ print(f"Post {period}: {effect.effect:.3f} (SE: {effect.se:.3f})")
583
589
 
584
590
  # View average treatment effect across post-periods
585
591
  print(f"Average ATT: {results.avg_att:.3f}")
586
592
  print(f"Average SE: {results.avg_se:.3f}")
587
593
 
588
- # Full summary with all period effects
594
+ # Full summary with pre and post period effects
589
595
  results.print_summary()
590
596
  ```
591
597
 
@@ -873,6 +879,54 @@ print(f"Sun-Abraham ATT: {sa_results.overall_att:.3f}")
873
879
  # If results differ substantially, investigate heterogeneity
874
880
  ```
875
881
 
882
+ ### Borusyak-Jaravel-Spiess Imputation Estimator
883
+
884
+ The Borusyak et al. (2024) imputation estimator is the **efficient** estimator for staggered DiD under parallel trends, producing ~50% shorter confidence intervals than Callaway-Sant'Anna and 2-3.5x shorter than Sun-Abraham under homogeneous treatment effects.
885
+
886
+ ```python
887
+ from diff_diff import ImputationDiD, imputation_did
888
+
889
+ # Basic usage
890
+ est = ImputationDiD()
891
+ results = est.fit(data, outcome='outcome', unit='unit',
892
+ time='period', first_treat='first_treat')
893
+ results.print_summary()
894
+
895
+ # Event study
896
+ results = est.fit(data, outcome='outcome', unit='unit',
897
+ time='period', first_treat='first_treat',
898
+ aggregate='event_study')
899
+
900
+ # Pre-trend test (Equation 9)
901
+ pt = results.pretrend_test(n_leads=3)
902
+ print(f"F-stat: {pt['f_stat']:.3f}, p-value: {pt['p_value']:.4f}")
903
+
904
+ # Convenience function
905
+ results = imputation_did(data, 'outcome', 'unit', 'period', 'first_treat',
906
+ aggregate='all')
907
+ ```
908
+
909
+ ```python
910
+ ImputationDiD(
911
+ anticipation=0, # Number of anticipation periods
912
+ alpha=0.05, # Significance level
913
+ cluster=None, # Cluster variable (defaults to unit)
914
+ n_bootstrap=0, # Bootstrap iterations (0=analytical inference)
915
+ seed=None, # Random seed
916
+ horizon_max=None, # Max event-study horizon
917
+ aux_partition="cohort_horizon", # Variance partition: "cohort_horizon", "cohort", "horizon"
918
+ )
919
+ ```
920
+
921
+ **When to use Imputation DiD vs Callaway-Sant'Anna:**
922
+
923
+ | Aspect | Imputation DiD | Callaway-Sant'Anna |
924
+ |--------|---------------|-------------------|
925
+ | Efficiency | Most efficient under homogeneous effects | Less efficient but more robust to heterogeneity |
926
+ | Control group | Always uses all untreated obs | Choice of never-treated or not-yet-treated |
927
+ | Inference | Conservative variance (Theorem 3) | Multiplier bootstrap |
928
+ | Pre-trends | Built-in F-test (Equation 9) | Separate testing |
929
+
876
930
  ### Triple Difference (DDD)
877
931
 
878
932
  Triple Difference (DDD) is used when treatment requires satisfying two criteria: belonging to a treated **group** AND being in an eligible **partition**. The `TripleDifference` class implements the methodology from Ortiz-Villavicencio & Sant'Anna (2025), which correctly handles covariate adjustment (unlike naive implementations).
@@ -951,10 +1005,10 @@ Create publication-ready event study plots:
951
1005
  ```python
952
1006
  from diff_diff import plot_event_study, MultiPeriodDiD, CallawaySantAnna, SunAbraham
953
1007
 
954
- # From MultiPeriodDiD
1008
+ # From MultiPeriodDiD (full event study with pre and post period effects)
955
1009
  did = MultiPeriodDiD()
956
1010
  results = did.fit(data, outcome='y', treatment='treated',
957
- time='period', post_periods=[3, 4, 5])
1011
+ time='period', post_periods=[3, 4, 5], reference_period=2)
958
1012
  plot_event_study(results, title="Treatment Effects Over Time")
959
1013
 
960
1014
  # From CallawaySantAnna (with event study aggregation)
@@ -1274,7 +1328,6 @@ TROP(
1274
1328
  max_iter=100, # Max iterations for factor estimation
1275
1329
  tol=1e-6, # Convergence tolerance
1276
1330
  alpha=0.05, # Significance level
1277
- variance_method='bootstrap', # 'bootstrap' or 'jackknife'
1278
1331
  n_bootstrap=200, # Bootstrap replications
1279
1332
  seed=None # Random seed
1280
1333
  )
@@ -1414,14 +1467,15 @@ Pre-trends tests have low power and can exacerbate bias. **Honest DiD** (Rambach
1414
1467
  ```python
1415
1468
  from diff_diff import HonestDiD, MultiPeriodDiD
1416
1469
 
1417
- # First, fit a standard event study
1470
+ # First, fit a full event study (pre + post period effects)
1418
1471
  did = MultiPeriodDiD()
1419
1472
  event_results = did.fit(
1420
1473
  data,
1421
1474
  outcome='outcome',
1422
1475
  treatment='treated',
1423
1476
  time='period',
1424
- post_periods=[5, 6, 7, 8, 9]
1477
+ post_periods=[5, 6, 7, 8, 9],
1478
+ reference_period=4, # Last pre-period (e=-1 convention)
1425
1479
  )
1426
1480
 
1427
1481
  # Compute honest bounds with relative magnitudes restriction
@@ -1489,14 +1543,15 @@ A passing pre-trends test doesn't mean parallel trends holds—it may just mean
1489
1543
  ```python
1490
1544
  from diff_diff import PreTrendsPower, MultiPeriodDiD
1491
1545
 
1492
- # First, fit an event study
1546
+ # First, fit a full event study
1493
1547
  did = MultiPeriodDiD()
1494
1548
  event_results = did.fit(
1495
1549
  data,
1496
1550
  outcome='outcome',
1497
1551
  treatment='treated',
1498
1552
  time='period',
1499
- post_periods=[5, 6, 7, 8, 9]
1553
+ post_periods=[5, 6, 7, 8, 9],
1554
+ reference_period=4,
1500
1555
  )
1501
1556
 
1502
1557
  # Analyze pre-trends test power
@@ -1765,7 +1820,8 @@ MultiPeriodDiD(
1765
1820
  | `covariates` | list | Linear control variables |
1766
1821
  | `fixed_effects` | list | Categorical FE columns (creates dummies) |
1767
1822
  | `absorb` | list | High-dimensional FE (within-transformation) |
1768
- | `reference_period` | any | Omitted period for time dummies |
1823
+ | `reference_period` | any | Omitted period (default: last pre-period, e=-1 convention) |
1824
+ | `unit` | str | Unit identifier column (for staggered adoption warning) |
1769
1825
 
1770
1826
  ### MultiPeriodDiDResults
1771
1827
 
@@ -1773,8 +1829,8 @@ MultiPeriodDiD(
1773
1829
 
1774
1830
  | Attribute | Description |
1775
1831
  |-----------|-------------|
1776
- | `period_effects` | Dict mapping periods to PeriodEffect objects |
1777
- | `avg_att` | Average ATT across post-treatment periods |
1832
+ | `period_effects` | Dict mapping periods to PeriodEffect objects (pre and post, excluding reference) |
1833
+ | `avg_att` | Average ATT across post-treatment periods only |
1778
1834
  | `avg_se` | Standard error of average ATT |
1779
1835
  | `avg_t_stat` | T-statistic for average ATT |
1780
1836
  | `avg_p_value` | P-value for average ATT |
@@ -1782,6 +1838,10 @@ MultiPeriodDiD(
1782
1838
  | `n_obs` | Number of observations |
1783
1839
  | `pre_periods` | List of pre-treatment periods |
1784
1840
  | `post_periods` | List of post-treatment periods |
1841
+ | `reference_period` | The omitted reference period (coefficient = 0 by construction) |
1842
+ | `interaction_indices` | Dict mapping period → column index in VCV (for sub-VCV extraction) |
1843
+ | `pre_period_effects` | Property: pre-period effects only (for parallel trends assessment) |
1844
+ | `post_period_effects` | Property: post-period effects only |
1785
1845
 
1786
1846
  **Methods:**
1787
1847
 
@@ -1874,8 +1934,7 @@ TROP(
1874
1934
  max_iter=100, # Max iterations for factor estimation
1875
1935
  tol=1e-6, # Convergence tolerance
1876
1936
  alpha=0.05, # Significance level for CIs
1877
- variance_method='bootstrap', # 'bootstrap' or 'jackknife'
1878
- n_bootstrap=200, # Bootstrap/jackknife iterations
1937
+ n_bootstrap=200, # Bootstrap replications
1879
1938
  seed=None # Random seed
1880
1939
  )
1881
1940
  ```
@@ -1899,7 +1958,7 @@ Note: TROP infers treatment periods from the treatment indicator column. The tre
1899
1958
  | Attribute | Description |
1900
1959
  |-----------|-------------|
1901
1960
  | `att` | Average treatment effect on the treated |
1902
- | `se` | Standard error (bootstrap or jackknife) |
1961
+ | `se` | Standard error (bootstrap) |
1903
1962
  | `t_stat` | T-statistic |
1904
1963
  | `p_value` | P-value |
1905
1964
  | `conf_int` | Confidence interval |
@@ -1918,7 +1977,6 @@ Note: TROP infers treatment periods from the treatment indicator column. The tre
1918
1977
  | `loocv_score` | LOOCV score for selected parameters |
1919
1978
  | `n_pre_periods` | Number of pre-treatment periods |
1920
1979
  | `n_post_periods` | Number of post-treatment periods |
1921
- | `variance_method` | Variance estimation method |
1922
1980
  | `bootstrap_distribution` | Bootstrap distribution (if bootstrap) |
1923
1981
 
1924
1982
  **Methods:**
@@ -1990,6 +2048,60 @@ SunAbraham(
1990
2048
  | `print_summary(alpha)` | Print summary to stdout |
1991
2049
  | `to_dataframe(level)` | Convert to DataFrame ('event_study' or 'cohort') |
1992
2050
 
2051
+ ### ImputationDiD
2052
+
2053
+ ```python
2054
+ ImputationDiD(
2055
+ anticipation=0, # Periods of anticipation effects
2056
+ alpha=0.05, # Significance level for CIs
2057
+ cluster=None, # Column for cluster-robust SEs
2058
+ n_bootstrap=0, # Bootstrap iterations (0 = analytical)
2059
+ seed=None, # Random seed
2060
+ rank_deficient_action='warn', # 'warn', 'error', or 'silent'
2061
+ horizon_max=None, # Max event-study horizon
2062
+ aux_partition='cohort_horizon', # Variance partition
2063
+ )
2064
+ ```
2065
+
2066
+ **fit() Parameters:**
2067
+
2068
+ | Parameter | Type | Description |
2069
+ |-----------|------|-------------|
2070
+ | `data` | DataFrame | Panel data |
2071
+ | `outcome` | str | Outcome variable column name |
2072
+ | `unit` | str | Unit identifier column |
2073
+ | `time` | str | Time period column |
2074
+ | `first_treat` | str | First treatment period column (0 for never-treated) |
2075
+ | `covariates` | list | Covariate column names |
2076
+ | `aggregate` | str | Aggregation: None, "event_study", "group", "all" |
2077
+ | `balance_e` | int | Balance event study to this many pre-treatment periods |
2078
+
2079
+ ### ImputationDiDResults
2080
+
2081
+ **Attributes:**
2082
+
2083
+ | Attribute | Description |
2084
+ |-----------|-------------|
2085
+ | `overall_att` | Overall average treatment effect on the treated |
2086
+ | `overall_se` | Standard error (conservative, Theorem 3) |
2087
+ | `overall_t_stat` | T-statistic |
2088
+ | `overall_p_value` | P-value for H0: ATT = 0 |
2089
+ | `overall_conf_int` | Confidence interval |
2090
+ | `event_study_effects` | Dict of relative time -> effect dict (if `aggregate='event_study'` or `'all'`) |
2091
+ | `group_effects` | Dict of cohort -> effect dict (if `aggregate='group'` or `'all'`) |
2092
+ | `treatment_effects` | DataFrame of unit-level imputed treatment effects |
2093
+ | `n_treated_obs` | Number of treated observations |
2094
+ | `n_untreated_obs` | Number of untreated observations |
2095
+
2096
+ **Methods:**
2097
+
2098
+ | Method | Description |
2099
+ |--------|-------------|
2100
+ | `summary(alpha)` | Get formatted summary string |
2101
+ | `print_summary(alpha)` | Print summary to stdout |
2102
+ | `to_dataframe(level)` | Convert to DataFrame ('observation', 'event_study', 'group') |
2103
+ | `pretrend_test(n_leads)` | Run pre-trend F-test (Equation 9) |
2104
+
1993
2105
  ### TripleDifference
1994
2106
 
1995
2107
  ```python
@@ -2454,6 +2566,14 @@ The `HonestDiD` module implements sensitivity analysis methods for relaxing the
2454
2566
 
2455
2567
  ### Multi-Period and Staggered Adoption
2456
2568
 
2569
+ - **Borusyak, K., Jaravel, X., & Spiess, J. (2024).** "Revisiting Event-Study Designs: Robust and Efficient Estimation." *Review of Economic Studies*, 91(6), 3253-3285. [https://doi.org/10.1093/restud/rdae007](https://doi.org/10.1093/restud/rdae007)
2570
+
2571
+ This paper introduces the imputation estimator implemented in our `ImputationDiD` class:
2572
+ - **Efficient imputation**: fit OLS on untreated observations, impute the counterfactual outcome for each treated observation, then aggregate the implied unit-level effects
2573
+ - **Conservative variance**: Theorem 3 clustered variance estimator with auxiliary model
2574
+ - **Pre-trend test**: Independent of treatment effect estimation (Proposition 9)
2575
+ - **Efficiency gains**: confidence intervals roughly 50% shorter than Callaway-Sant'Anna under homogeneous treatment effects
2576
+
2457
2577
  - **Callaway, B., & Sant'Anna, P. H. C. (2021).** "Difference-in-Differences with Multiple Time Periods." *Journal of Econometrics*, 225(2), 200-230. [https://doi.org/10.1016/j.jeconom.2020.12.001](https://doi.org/10.1016/j.jeconom.2020.12.001)
2458
2578
 
2459
2579
  - **Sant'Anna, P. H. C., & Zhao, J. (2020).** "Doubly Robust Difference-in-Differences Estimators." *Journal of Econometrics*, 219(1), 101-122. [https://doi.org/10.1016/j.jeconom.2020.06.003](https://doi.org/10.1016/j.jeconom.2020.06.003)
@@ -95,6 +95,12 @@ from diff_diff.staggered import (
95
95
  CSBootstrapResults,
96
96
  GroupTimeEffect,
97
97
  )
98
+ from diff_diff.imputation import (
99
+ ImputationBootstrapResults,
100
+ ImputationDiD,
101
+ ImputationDiDResults,
102
+ imputation_did,
103
+ )
98
104
  from diff_diff.sun_abraham import (
99
105
  SABootstrapResults,
100
106
  SunAbraham,
@@ -136,7 +142,7 @@ from diff_diff.datasets import (
136
142
  load_mpdta,
137
143
  )
138
144
 
139
- __version__ = "2.2.0"
145
+ __version__ = "2.3.0"
140
146
  __all__ = [
141
147
  # Estimators
142
148
  "DifferenceInDifferences",
@@ -145,6 +151,7 @@ __all__ = [
145
151
  "SyntheticDiD",
146
152
  "CallawaySantAnna",
147
153
  "SunAbraham",
154
+ "ImputationDiD",
148
155
  "TripleDifference",
149
156
  "TROP",
150
157
  # Bacon Decomposition
@@ -163,6 +170,9 @@ __all__ = [
163
170
  "GroupTimeEffect",
164
171
  "SunAbrahamResults",
165
172
  "SABootstrapResults",
173
+ "ImputationDiDResults",
174
+ "ImputationBootstrapResults",
175
+ "imputation_did",
166
176
  "TripleDifferenceResults",
167
177
  "triple_difference",
168
178
  "TROPResults",
@@ -662,7 +662,7 @@ def permutation_test(
662
662
  ci_upper = np.percentile(valid_effects, (1 - alpha / 2) * 100)
663
663
 
664
664
  # T-stat from original estimate
665
- t_stat = original_att / se if se > 0 else 0.0
665
+ t_stat = original_att / se if np.isfinite(se) and se > 0 else np.nan
666
666
 
667
667
  return PlaceboTestResults(
668
668
  test_type="permutation",
@@ -783,14 +783,14 @@ def leave_one_out_test(
783
783
  # Statistics of LOO distribution
784
784
  mean_effect = np.mean(valid_effects)
785
785
  se = np.std(valid_effects, ddof=1) if len(valid_effects) > 1 else 0.0
786
- t_stat = mean_effect / se if se > 0 else 0.0
786
+ t_stat = mean_effect / se if np.isfinite(se) and se > 0 else np.nan
787
787
 
788
788
  # Use t-distribution for p-value
789
789
  df = len(valid_effects) - 1 if len(valid_effects) > 1 else 1
790
790
  p_value = compute_p_value(t_stat, df=df)
791
791
 
792
792
  # CI
793
- conf_int = compute_confidence_interval(mean_effect, se, alpha, df=df)
793
+ conf_int = compute_confidence_interval(mean_effect, se, alpha, df=df) if np.isfinite(se) and se > 0 else (np.nan, np.nan)
794
794
 
795
795
  return PlaceboTestResults(
796
796
  test_type="leave_one_out",