PyPI - panelbox - Versions diffs - 0.2.0__py3-none-any.whl → 0.4.0__py3-none-any.whl - Mend

panelbox 0.2.0 (py3-none-any.whl) → 0.4.0 (py3-none-any.whl)

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (38) hide show

panelbox/__init__.py +41 -0
panelbox/__version__.py +13 -1
panelbox/core/formula_parser.py +9 -2
panelbox/core/panel_data.py +1 -1
panelbox/datasets/__init__.py +39 -0
panelbox/datasets/load.py +334 -0
panelbox/gmm/difference_gmm.py +63 -15
panelbox/gmm/estimator.py +46 -5
panelbox/gmm/system_gmm.py +136 -21
panelbox/models/static/__init__.py +4 -0
panelbox/models/static/between.py +434 -0
panelbox/models/static/first_difference.py +494 -0
panelbox/models/static/fixed_effects.py +80 -11
panelbox/models/static/pooled_ols.py +80 -11
panelbox/models/static/random_effects.py +52 -10
panelbox/standard_errors/__init__.py +119 -0
panelbox/standard_errors/clustered.py +386 -0
panelbox/standard_errors/comparison.py +528 -0
panelbox/standard_errors/driscoll_kraay.py +386 -0
panelbox/standard_errors/newey_west.py +324 -0
panelbox/standard_errors/pcse.py +358 -0
panelbox/standard_errors/robust.py +324 -0
panelbox/standard_errors/utils.py +390 -0
panelbox/validation/__init__.py +6 -0
panelbox/validation/robustness/__init__.py +51 -0
panelbox/validation/robustness/bootstrap.py +933 -0
panelbox/validation/robustness/checks.py +143 -0
panelbox/validation/robustness/cross_validation.py +538 -0
panelbox/validation/robustness/influence.py +364 -0
panelbox/validation/robustness/jackknife.py +457 -0
panelbox/validation/robustness/outliers.py +529 -0
panelbox/validation/robustness/sensitivity.py +809 -0
{panelbox-0.2.0.dist-info → panelbox-0.4.0.dist-info}/METADATA +32 -3
{panelbox-0.2.0.dist-info → panelbox-0.4.0.dist-info}/RECORD +38 -21
{panelbox-0.2.0.dist-info → panelbox-0.4.0.dist-info}/WHEEL +1 -1
{panelbox-0.2.0.dist-info → panelbox-0.4.0.dist-info}/entry_points.txt +0 -0
{panelbox-0.2.0.dist-info → panelbox-0.4.0.dist-info}/licenses/LICENSE +0 -0
{panelbox-0.2.0.dist-info → panelbox-0.4.0.dist-info}/top_level.txt +0 -0

panelbox/models/static/pooled_ols.py CHANGED Viewed

@@ -16,6 +16,14 @@ from panelbox.utils.matrix_ops import (
     compute_vcov_nonrobust,
     compute_rsquared
 )
+from panelbox.standard_errors import (
+    robust_covariance,
+    cluster_by_entity,
+    twoway_cluster,
+    driscoll_kraay,
+    newey_west,
+    pcse
+)
 class PooledOLS(PanelModel):
@@ -84,10 +92,17 @@ class PooledOLS(PanelModel):
         cov_type : str, default='nonrobust'
             Type of covariance estimator:
             - 'nonrobust': Classical OLS standard errors
-            - 'robust': Heteroskedasticity-robust (HC1)
+            - 'robust' or 'hc1': Heteroskedasticity-robust (HC1)
+            - 'hc0', 'hc2', 'hc3': Other HC variants
             - 'clustered': Cluster-robust (clustered by entity by default)
+            - 'twoway': Two-way clustering (entity and time)
+            - 'driscoll_kraay': Driscoll-Kraay for spatial/temporal dependence
+            - 'newey_west': Newey-West HAC
+            - 'pcse': Panel-corrected standard errors
         **cov_kwds
-            Additional arguments for covariance estimation
+            Additional arguments for covariance estimation:
+            - max_lags : int, for driscoll_kraay and newey_west
+            - kernel : str, for driscoll_kraay and newey_west
         Returns
         -------
@@ -96,8 +111,23 @@ class PooledOLS(PanelModel):
         Examples
         --------
+        >>> # Classical standard errors
+        >>> results = model.fit(cov_type='nonrobust')
+        >>>
+        >>> # Heteroskedasticity-robust
         >>> results = model.fit(cov_type='robust')
-        >>> results_cluster = model.fit(cov_type='clustered')
+        >>> results = model.fit(cov_type='hc3')
+        >>>
+        >>> # Cluster-robust
+        >>> results = model.fit(cov_type='clustered')
+        >>> results = model.fit(cov_type='twoway')
+        >>>
+        >>> # HAC
+        >>> results = model.fit(cov_type='driscoll_kraay', max_lags=3)
+        >>> results = model.fit(cov_type='newey_west', max_lags=4, kernel='bartlett')
+        >>>
+        >>> # PCSE
+        >>> results = model.fit(cov_type='pcse')
         """
         # Build design matrices
         y, X = self.formula_parser.build_design_matrices(
@@ -117,17 +147,56 @@ class PooledOLS(PanelModel):
         df_model = k - (1 if self.formula_parser.has_intercept else 0)
         df_resid = n - k
-        # Compute covariance matrix
-        if cov_type == 'nonrobust':
+        # Get entity and time indices
+        entities = self.data.data[self.data.entity_col].values
+        times = self.data.data[self.data.time_col].values
+        # Compute covariance matrix based on type
+        cov_type_lower = cov_type.lower()
+        if cov_type_lower == 'nonrobust':
             vcov = compute_vcov_nonrobust(X, resid, df_resid)
-        elif cov_type == 'robust':
-            vcov = self._compute_vcov_robust(X, resid)
-        elif cov_type == 'clustered':
-            vcov = self._compute_vcov_clustered(X, resid)
+        elif cov_type_lower in ['robust', 'hc0', 'hc1', 'hc2', 'hc3']:
+            # HC robust standard errors
+            method = 'HC1' if cov_type_lower == 'robust' else cov_type_lower.upper()
+            result = robust_covariance(X, resid, method=method)
+            vcov = result.cov_matrix
+        elif cov_type_lower == 'clustered':
+            # Cluster-robust by entity
+            result = cluster_by_entity(X, resid, entities, df_correction=True)
+            vcov = result.cov_matrix
+        elif cov_type_lower == 'twoway':
+            # Two-way clustering (entity and time)
+            result = twoway_cluster(X, resid, entities, times, df_correction=True)
+            vcov = result.cov_matrix
+        elif cov_type_lower == 'driscoll_kraay':
+            # Driscoll-Kraay for spatial/temporal dependence
+            max_lags = cov_kwds.get('max_lags', None)
+            kernel = cov_kwds.get('kernel', 'bartlett')
+            result = driscoll_kraay(X, resid, times, max_lags=max_lags, kernel=kernel)
+            vcov = result.cov_matrix
+        elif cov_type_lower == 'newey_west':
+            # Newey-West HAC
+            max_lags = cov_kwds.get('max_lags', None)
+            kernel = cov_kwds.get('kernel', 'bartlett')
+            result = newey_west(X, resid, max_lags=max_lags, kernel=kernel)
+            vcov = result.cov_matrix
+        elif cov_type_lower == 'pcse':
+            # Panel-corrected standard errors
+            result = pcse(X, resid, entities, times)
+            vcov = result.cov_matrix
         else:
             raise ValueError(
-                f"cov_type must be 'nonrobust', 'robust', or 'clustered', "
-                f"got '{cov_type}'"
+                f"cov_type must be one of: 'nonrobust', 'robust', 'hc0', 'hc1', "
+                f"'hc2', 'hc3', 'clustered', 'twoway', 'driscoll_kraay', "
+                f"'newey_west', 'pcse'. Got '{cov_type}'"
             )
         # Standard errors

panelbox/models/static/random_effects.py CHANGED Viewed

@@ -15,6 +15,13 @@ from panelbox.utils.matrix_ops import (
     compute_ols,
     compute_panel_rsquared
 )
+from panelbox.standard_errors import (
+    robust_covariance,
+    cluster_by_entity,
+    twoway_cluster,
+    driscoll_kraay,
+    newey_west
+)
 class RandomEffects(PanelModel):
@@ -121,10 +128,16 @@ class RandomEffects(PanelModel):
         cov_type : str, default='nonrobust'
             Type of covariance estimator:
             - 'nonrobust': Classical GLS standard errors
-            - 'robust': Heteroskedasticity-robust
-            - 'clustered': Cluster-robust (clustered by entity)
+            - 'robust' or 'hc1': Heteroskedasticity-robust (HC1)
+            - 'hc0', 'hc2', 'hc3': Other HC variants
+            - 'clustered': Cluster-robust (by entity by default)
+            - 'twoway': Two-way clustered (entity and time)
+            - 'driscoll_kraay': Driscoll-Kraay (spatial/temporal dependence)
+            - 'newey_west': Newey-West HAC
         **cov_kwds
-            Additional arguments for covariance estimation
+            Additional arguments for covariance estimation:
+            - max_lags: For Driscoll-Kraay and Newey-West
+            - kernel: For HAC estimators
         Returns
         -------
@@ -169,16 +182,45 @@ class RandomEffects(PanelModel):
         df_resid = n - k
         # Compute covariance matrix
-        if cov_type == 'nonrobust':
+        cov_type_lower = cov_type.lower()
+        if cov_type_lower == 'nonrobust':
             vcov = self._compute_vcov_gls(X, resid_gls, entities, df_resid)
-        elif cov_type == 'robust':
-            vcov = self._compute_vcov_robust(X_gls, resid_gls, df_resid)
-        elif cov_type == 'clustered':
-            vcov = self._compute_vcov_clustered(X_gls, resid_gls, entities, df_resid)
+        elif cov_type_lower in ['robust', 'hc0', 'hc1', 'hc2', 'hc3']:
+            # Map 'robust' to 'hc1' (default robust method)
+            method = 'HC1' if cov_type_lower == 'robust' else cov_type_lower.upper()
+            result = robust_covariance(X_gls, resid_gls, method=method)
+            vcov = result.cov_matrix
+        elif cov_type_lower == 'clustered':
+            # Default: cluster by entity
+            result = cluster_by_entity(X_gls, resid_gls, entities, df_correction=True)
+            vcov = result.cov_matrix
+        elif cov_type_lower == 'twoway':
+            # Two-way clustering: entity and time
+            result = twoway_cluster(X_gls, resid_gls, entities, times, df_correction=True)
+            vcov = result.cov_matrix
+        elif cov_type_lower == 'driscoll_kraay':
+            # Driscoll-Kraay for spatial/temporal dependence
+            max_lags = cov_kwds.get('max_lags', None)
+            kernel = cov_kwds.get('kernel', 'bartlett')
+            result = driscoll_kraay(X_gls, resid_gls, times, max_lags=max_lags, kernel=kernel)
+            vcov = result.cov_matrix
+        elif cov_type_lower == 'newey_west':
+            # Newey-West HAC
+            max_lags = cov_kwds.get('max_lags', None)
+            kernel = cov_kwds.get('kernel', 'bartlett')
+            result = newey_west(X_gls, resid_gls, max_lags=max_lags, kernel=kernel)
+            vcov = result.cov_matrix
         else:
             raise ValueError(
-                f"cov_type must be 'nonrobust', 'robust', or 'clustered', "
-                f"got '{cov_type}'"
+                f"cov_type must be one of: 'nonrobust', 'robust', 'hc0', 'hc1', 'hc2', 'hc3', "
+                f"'clustered', 'twoway', 'driscoll_kraay', 'newey_west', got '{cov_type}'"
             )
         # Standard errors

panelbox/standard_errors/__init__.py CHANGED Viewed

@@ -0,0 +1,119 @@
+"""
+Standard errors and covariance matrix estimation for panel data.
+This module provides various robust standard error estimators commonly
+used in panel data econometrics:
+- Heteroskedasticity-robust (HC0, HC1, HC2, HC3)
+- Cluster-robust (one-way and two-way)
+- Driscoll-Kraay (spatial and temporal dependence)
+- Newey-West HAC (heteroskedasticity and autocorrelation consistent)
+- Panel-corrected standard errors (PCSE)
+Examples
+--------
+>>> from panelbox.standard_errors import robust_covariance, cluster_by_entity
+>>>
+>>> # HC1 robust standard errors
+>>> result = robust_covariance(X, resid, method='HC1')
+>>> print(result.std_errors)
+>>>
+>>> # Cluster by entity
+>>> result = cluster_by_entity(X, resid, entity_ids)
+>>> print(result.std_errors)
+"""
+# Robust (HC) standard errors
+from .robust import (
+    RobustStandardErrors,
+    RobustCovarianceResult,
+    robust_covariance
+)
+# Clustered standard errors
+from .clustered import (
+    ClusteredStandardErrors,
+    ClusteredCovarianceResult,
+    cluster_by_entity,
+    cluster_by_time,
+    twoway_cluster
+)
+# Driscoll-Kraay standard errors
+from .driscoll_kraay import (
+    DriscollKraayStandardErrors,
+    DriscollKraayResult,
+    driscoll_kraay
+)
+# Newey-West HAC standard errors
+from .newey_west import (
+    NeweyWestStandardErrors,
+    NeweyWestResult,
+    newey_west
+)
+# Panel-Corrected Standard Errors (PCSE)
+from .pcse import (
+    PanelCorrectedStandardErrors,
+    PCSEResult,
+    pcse
+)
+# Standard Error Comparison
+from .comparison import (
+    StandardErrorComparison,
+    ComparisonResult
+)
+# Utilities
+from .utils import (
+    compute_leverage,
+    compute_bread,
+    compute_meat_hc,
+    sandwich_covariance,
+    hc_covariance,
+    clustered_covariance,
+    twoway_clustered_covariance
+)
+__all__ = [
+    # Robust (HC) SE
+    'RobustStandardErrors',
+    'RobustCovarianceResult',
+    'robust_covariance',
+    # Clustered SE
+    'ClusteredStandardErrors',
+    'ClusteredCovarianceResult',
+    'cluster_by_entity',
+    'cluster_by_time',
+    'twoway_cluster',
+    # Driscoll-Kraay SE
+    'DriscollKraayStandardErrors',
+    'DriscollKraayResult',
+    'driscoll_kraay',
+    # Newey-West HAC SE
+    'NeweyWestStandardErrors',
+    'NeweyWestResult',
+    'newey_west',
+    # Panel-Corrected SE (PCSE)
+    'PanelCorrectedStandardErrors',
+    'PCSEResult',
+    'pcse',
+    # Comparison
+    'StandardErrorComparison',
+    'ComparisonResult',
+    # Utilities
+    'compute_leverage',
+    'compute_bread',
+    'compute_meat_hc',
+    'sandwich_covariance',
+    'hc_covariance',
+    'clustered_covariance',
+    'twoway_clustered_covariance',
+]

panelbox 0.2.0__py3-none-any.whl → 0.4.0__py3-none-any.whl

panelbox 0.2.0 (py3-none-any.whl) → 0.4.0 (py3-none-any.whl)