PyPI - panelbox - Versions diffs - 0.2.0__py3-none-any.whl - Mend

panelbox 0.2.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (90) hide show

panelbox/__init__.py +67 -0
panelbox/__version__.py +14 -0
panelbox/cli/__init__.py +0 -0
panelbox/cli/{commands}/__init__.py +0 -0
panelbox/core/__init__.py +0 -0
panelbox/core/base_model.py +164 -0
panelbox/core/formula_parser.py +318 -0
panelbox/core/panel_data.py +387 -0
panelbox/core/results.py +366 -0
panelbox/datasets/__init__.py +0 -0
panelbox/datasets/{data}/__init__.py +0 -0
panelbox/gmm/__init__.py +65 -0
panelbox/gmm/difference_gmm.py +645 -0
panelbox/gmm/estimator.py +562 -0
panelbox/gmm/instruments.py +580 -0
panelbox/gmm/results.py +550 -0
panelbox/gmm/system_gmm.py +621 -0
panelbox/gmm/tests.py +535 -0
panelbox/models/__init__.py +11 -0
panelbox/models/dynamic/__init__.py +0 -0
panelbox/models/iv/__init__.py +0 -0
panelbox/models/static/__init__.py +13 -0
panelbox/models/static/fixed_effects.py +516 -0
panelbox/models/static/pooled_ols.py +298 -0
panelbox/models/static/random_effects.py +512 -0
panelbox/report/__init__.py +61 -0
panelbox/report/asset_manager.py +410 -0
panelbox/report/css_manager.py +472 -0
panelbox/report/exporters/__init__.py +15 -0
panelbox/report/exporters/html_exporter.py +440 -0
panelbox/report/exporters/latex_exporter.py +510 -0
panelbox/report/exporters/markdown_exporter.py +446 -0
panelbox/report/renderers/__init__.py +11 -0
panelbox/report/renderers/static/__init__.py +0 -0
panelbox/report/renderers/static_validation_renderer.py +341 -0
panelbox/report/report_manager.py +502 -0
panelbox/report/template_manager.py +337 -0
panelbox/report/transformers/__init__.py +0 -0
panelbox/report/transformers/static/__init__.py +0 -0
panelbox/report/validation_transformer.py +449 -0
panelbox/standard_errors/__init__.py +0 -0
panelbox/templates/__init__.py +0 -0
panelbox/templates/assets/css/base_styles.css +382 -0
panelbox/templates/assets/css/report_components.css +747 -0
panelbox/templates/assets/js/tab-navigation.js +161 -0
panelbox/templates/assets/js/utils.js +276 -0
panelbox/templates/common/footer.html +24 -0
panelbox/templates/common/header.html +44 -0
panelbox/templates/common/meta.html +5 -0
panelbox/templates/validation/interactive/index.html +272 -0
panelbox/templates/validation/interactive/partials/charts.html +58 -0
panelbox/templates/validation/interactive/partials/methodology.html +201 -0
panelbox/templates/validation/interactive/partials/overview.html +146 -0
panelbox/templates/validation/interactive/partials/recommendations.html +101 -0
panelbox/templates/validation/interactive/partials/test_results.html +231 -0
panelbox/utils/__init__.py +0 -0
panelbox/utils/formatting.py +172 -0
panelbox/utils/matrix_ops.py +233 -0
panelbox/utils/statistical.py +173 -0
panelbox/validation/__init__.py +58 -0
panelbox/validation/base.py +175 -0
panelbox/validation/cointegration/__init__.py +0 -0
panelbox/validation/cross_sectional_dependence/__init__.py +13 -0
panelbox/validation/cross_sectional_dependence/breusch_pagan_lm.py +222 -0
panelbox/validation/cross_sectional_dependence/frees.py +297 -0
panelbox/validation/cross_sectional_dependence/pesaran_cd.py +188 -0
panelbox/validation/heteroskedasticity/__init__.py +13 -0
panelbox/validation/heteroskedasticity/breusch_pagan.py +222 -0
panelbox/validation/heteroskedasticity/modified_wald.py +172 -0
panelbox/validation/heteroskedasticity/white.py +208 -0
panelbox/validation/instruments/__init__.py +0 -0
panelbox/validation/robustness/__init__.py +0 -0
panelbox/validation/serial_correlation/__init__.py +13 -0
panelbox/validation/serial_correlation/baltagi_wu.py +220 -0
panelbox/validation/serial_correlation/breusch_godfrey.py +260 -0
panelbox/validation/serial_correlation/wooldridge_ar.py +200 -0
panelbox/validation/specification/__init__.py +16 -0
panelbox/validation/specification/chow.py +273 -0
panelbox/validation/specification/hausman.py +264 -0
panelbox/validation/specification/mundlak.py +331 -0
panelbox/validation/specification/reset.py +273 -0
panelbox/validation/unit_root/__init__.py +0 -0
panelbox/validation/validation_report.py +257 -0
panelbox/validation/validation_suite.py +401 -0
panelbox-0.2.0.dist-info/METADATA +337 -0
panelbox-0.2.0.dist-info/RECORD +90 -0
panelbox-0.2.0.dist-info/WHEEL +5 -0
panelbox-0.2.0.dist-info/entry_points.txt +2 -0
panelbox-0.2.0.dist-info/licenses/LICENSE +21 -0
panelbox-0.2.0.dist-info/top_level.txt +1 -0

panelbox/core/results.py ADDED Viewed

@@ -0,0 +1,366 @@
+"""
+Results container for panel econometric models.
+This module provides the PanelResults class which stores estimation results
+and provides methods for inference, prediction, and reporting.
+"""
+from typing import Optional, Dict, Any, List
+import numpy as np
+import pandas as pd
+from scipy import stats
class PanelResults:
    """
    Container for panel model estimation results.

    Stores the quantities produced by an estimator (coefficients, standard
    errors, covariance matrix, residuals, fitted values) together with model
    and sample metadata, and derives t-statistics, two-sided p-values and
    confidence intervals from them.

    Parameters
    ----------
    params : pd.Series
        Estimated coefficients, indexed by parameter name.
    std_errors : pd.Series
        Standard errors, indexed like ``params``.
    cov_params : pd.DataFrame
        Covariance matrix of the parameters.
    resid : np.ndarray
        Residuals.
    fittedvalues : np.ndarray
        Fitted values.
    model_info : dict
        Model metadata. Optional keys read here: ``'model_type'``
        (default ``'Unknown'``), ``'formula'`` (default ``''``),
        ``'cov_type'`` (default ``'nonrobust'``) and ``'cov_kwds'``
        (default ``{}``).
    data_info : dict
        Sample metadata. Required keys: ``'nobs'``, ``'n_entities'``,
        ``'df_model'``, ``'df_resid'``. Optional keys: ``'n_periods'``,
        ``'entity_index'``, ``'time_index'`` (each defaults to ``None``).
    rsquared_dict : dict, optional
        Any of ``'rsquared'``, ``'rsquared_adj'``, ``'rsquared_within'``,
        ``'rsquared_between'``, ``'rsquared_overall'``. Missing entries
        (or a missing dict) are stored as ``np.nan``.
    model : object, optional
        Reference to the model that produced the results; stored as
        ``_model``.

    Attributes
    ----------
    params : pd.Series
        Estimated coefficients with parameter names
    std_errors : pd.Series
        Standard errors
    tvalues : pd.Series
        t-statistics (``params / std_errors``)
    pvalues : pd.Series
        p-values for two-sided t-tests with ``df_resid`` degrees of freedom
    cov_params : pd.DataFrame
        Covariance matrix of parameters
    resid : np.ndarray
        Residuals
    fittedvalues : np.ndarray
        Fitted values
    nobs : int
        Number of observations
    n_entities : int
        Number of entities
    n_periods : int or None
        Number of time periods
    df_model : int
        Degrees of freedom for model
    df_resid : int
        Degrees of freedom for residuals
    rsquared : float
        R-squared
    rsquared_adj : float
        Adjusted R-squared
    rsquared_within : float
        Within R-squared (for panel models)
    rsquared_between : float
        Between R-squared (for panel models)
    rsquared_overall : float
        Overall R-squared (for panel models)

    Raises
    ------
    KeyError
        If ``data_info`` lacks one of its required keys.
    """

    def __init__(
        self,
        params: pd.Series,
        std_errors: pd.Series,
        cov_params: pd.DataFrame,
        resid: np.ndarray,
        fittedvalues: np.ndarray,
        model_info: Dict[str, Any],
        data_info: Dict[str, Any],
        rsquared_dict: Optional[Dict[str, float]] = None,
        model: Optional[Any] = None
    ):
        # Parameter estimates
        self.params = params
        self.std_errors = std_errors
        self.cov_params = cov_params

        # Residuals and fitted values
        self.resid = resid
        self.fittedvalues = fittedvalues

        # Model information
        self.model_type = model_info.get('model_type', 'Unknown')
        self.formula = model_info.get('formula', '')
        self.cov_type = model_info.get('cov_type', 'nonrobust')
        self.cov_kwds = model_info.get('cov_kwds', {})

        # Data information
        self.nobs = data_info['nobs']
        self.n_entities = data_info['n_entities']
        self.n_periods = data_info.get('n_periods', None)
        self.df_model = data_info['df_model']
        self.df_resid = data_info['df_resid']

        # Entity and time indices (for validation tests)
        self.entity_index = data_info.get('entity_index', None)
        self.time_index = data_info.get('time_index', None)

        # Store reference to model for validation tests
        self._model = model

        # t-statistics and two-sided p-values (need df_resid, set above).
        self.tvalues = self.params / self.std_errors
        # Use the survival function rather than 1 - cdf: for large |t| the
        # cdf rounds to exactly 1.0 and the p-value would collapse to 0.0.
        pvalues_array = 2 * stats.t.sf(np.abs(self.tvalues.values), self.df_resid)
        # Keep pvalues a Series sharing the index of params.
        self.pvalues = pd.Series(pvalues_array, index=self.params.index)

        # R-squared statistics; anything not supplied is NaN.
        rsq = rsquared_dict if rsquared_dict is not None else {}
        self.rsquared = rsq.get('rsquared', np.nan)
        self.rsquared_adj = rsq.get('rsquared_adj', np.nan)
        self.rsquared_within = rsq.get('rsquared_within', np.nan)
        self.rsquared_between = rsq.get('rsquared_between', np.nan)
        self.rsquared_overall = rsq.get('rsquared_overall', np.nan)

    @staticmethod
    def _significance_stars(p: float) -> str:
        """Return the significance marker used in the summary table for *p*."""
        if p < 0.001:
            return '***'
        if p < 0.01:
            return '**'
        if p < 0.05:
            return '*'
        if p < 0.10:
            return '.'
        # Also reached for NaN p-values, since every comparison is False.
        return ''

    def conf_int(self, alpha: float = 0.05) -> pd.DataFrame:
        """
        Compute confidence intervals for parameters.

        Intervals are ``params +/- t_crit * std_errors`` where ``t_crit`` is
        the ``1 - alpha/2`` quantile of the t distribution with ``df_resid``
        degrees of freedom.

        Parameters
        ----------
        alpha : float, default=0.05
            Significance level (e.g., 0.05 for 95% CI)

        Returns
        -------
        pd.DataFrame
            Confidence intervals with columns 'lower' and 'upper', indexed
            like ``params``.

        Raises
        ------
        ValueError
            If ``alpha`` is not strictly between 0 and 1.

        Examples
        --------
        >>> ci = results.conf_int(alpha=0.05)
        >>> print(ci)
        """
        # Outside (0, 1) the quantile is undefined and every bound would
        # silently come back as NaN/inf, so fail loudly instead.
        if not 0 < alpha < 1:
            raise ValueError(
                f"alpha must be strictly between 0 and 1, got {alpha}"
            )
        t_critical = stats.t.ppf(1 - alpha / 2, self.df_resid)
        margin = t_critical * self.std_errors
        return pd.DataFrame(
            {
                'lower': self.params - margin,
                'upper': self.params + margin,
            },
            index=self.params.index,
        )

    def predict(self, newdata: Optional[pd.DataFrame] = None) -> np.ndarray:
        """
        Generate predictions.

        Parameters
        ----------
        newdata : pd.DataFrame, optional
            New data for prediction. If None, returns fitted values.

        Returns
        -------
        np.ndarray
            The stored ``fittedvalues`` object itself (not a copy).

        Raises
        ------
        NotImplementedError
            If ``newdata`` is given; out-of-sample prediction is not
            implemented.

        Examples
        --------
        >>> predictions = results.predict()
        """
        if newdata is not None:
            raise NotImplementedError("Prediction on new data not yet implemented")
        return self.fittedvalues

    def summary(self, title: Optional[str] = None) -> str:
        """
        Generate formatted summary of results.

        The table contains the formula and model type, sample sizes, any
        non-NaN R-squared statistics, the covariance type, and one row per
        parameter with coefficient, standard error, t-statistic, p-value,
        95% confidence bounds and a significance marker.

        Parameters
        ----------
        title : str, optional
            Custom title for summary table. Defaults to
            ``"<model_type> Estimation Results"``.

        Returns
        -------
        str
            Formatted summary table

        Examples
        --------
        >>> print(results.summary())
        """
        rule = "=" * 78
        thin_rule = "-" * 78
        lines = []

        # Header
        lines.append(rule)
        if title is None:
            title = f"{self.model_type} Estimation Results"
        lines.append(title.center(78))
        lines.append(rule)

        # Model information
        lines.append(f"Formula: {self.formula}")
        lines.append(f"Model:   {self.model_type}")
        lines.append(thin_rule)

        # Sample information
        lines.append(f"No. Observations:          {self.nobs:>10,}")
        lines.append(f"No. Entities:              {self.n_entities:>10,}")
        if self.n_periods is not None:
            lines.append(f"No. Time Periods:          {self.n_periods:>10,}")
        lines.append(f"Degrees of Freedom:        {self.df_resid:>10,}")

        # R-squared statistics: only those that were actually supplied.
        rsquared_rows = (
            ("R-squared:                 ", self.rsquared),
            ("Adj. R-squared:            ", self.rsquared_adj),
            ("R-squared (within):        ", self.rsquared_within),
            ("R-squared (between):       ", self.rsquared_between),
            ("R-squared (overall):       ", self.rsquared_overall),
        )
        for label, value in rsquared_rows:
            if not np.isnan(value):
                lines.append(f"{label}{value:>10.4f}")

        # Standard errors type
        lines.append(f"Standard Errors:           {self.cov_type:>10}")
        lines.append(rule)

        # Coefficient table. Header widths/alignment mirror the data rows
        # below so each label sits over its right-aligned numeric column.
        lines.append(
            f"{'Variable':<15} {'Coef.':>11} {'Std.Err.':>11} {'t':>7} "
            f"{'P>|t|':>7} {'[0.025':>9} {'0.975]':>9}"
        )
        lines.append(thin_rule)

        ci = self.conf_int(alpha=0.05)
        for var in self.params.index:
            coef = self.params[var]
            se = self.std_errors[var]
            t = self.tvalues[var]
            p = self.pvalues[var]
            ci_lower = ci.loc[var, 'lower']
            ci_upper = ci.loc[var, 'upper']
            stars = self._significance_stars(p)
            lines.append(
                f"{var:<15} {coef:>11.4f} {se:>11.4f} {t:>7.3f} "
                f"{p:>7.4f} {ci_lower:>9.4f} {ci_upper:>9.4f} {stars}"
            )

        lines.append(rule)
        lines.append("Signif. codes:  0 '***' 0.001 '**' 0.01 '*' 0.05 '.' 0.1 ' ' 1")
        lines.append("")
        return "\n".join(lines)

    def to_dict(self) -> Dict[str, Any]:
        """
        Export results as dictionary.

        Returns
        -------
        dict
            Nested dictionary with keys ``'params'``, ``'std_errors'``,
            ``'tvalues'``, ``'pvalues'`` (each a name -> value mapping),
            ``'model_info'``, ``'sample_info'`` and ``'rsquared'``. The
            covariance matrix, residuals and fitted values are not included.
        """
        return {
            'params': self.params.to_dict(),
            'std_errors': self.std_errors.to_dict(),
            'tvalues': self.tvalues.to_dict(),
            'pvalues': self.pvalues.to_dict(),
            'model_info': {
                'model_type': self.model_type,
                'formula': self.formula,
                'cov_type': self.cov_type,
            },
            'sample_info': {
                'nobs': self.nobs,
                'n_entities': self.n_entities,
                'n_periods': self.n_periods,
                'df_model': self.df_model,
                'df_resid': self.df_resid,
            },
            'rsquared': {
                'rsquared': self.rsquared,
                'rsquared_adj': self.rsquared_adj,
                'rsquared_within': self.rsquared_within,
                'rsquared_between': self.rsquared_between,
                'rsquared_overall': self.rsquared_overall,
            },
        }

    def validate(
        self,
        tests: str = 'default',
        alpha: float = 0.05,
        verbose: bool = False
    ) -> 'ValidationReport':
        """
        Run validation tests on model results.

        Builds a ``ValidationSuite`` around this results object and returns
        whatever its ``run`` method returns; ``tests``, ``alpha`` and
        ``verbose`` are forwarded unchanged.

        Parameters
        ----------
        tests : str or list of str, default='default'
            Which tests to run:
            - 'all': Run all available tests
            - 'default': Run recommended tests for this model type
            - 'serial': Serial correlation tests only
            - 'het': Heteroskedasticity tests only
            - 'cd': Cross-sectional dependence tests only
        alpha : float, default=0.05
            Significance level for tests
        verbose : bool, default=False
            If True, print progress during testing

        Returns
        -------
        ValidationReport
            Report containing all test results

        Examples
        --------
        >>> results = fe.fit()
        >>> validation = results.validate(tests='all', verbose=True)
        >>> print(validation)
        """
        # Imported at call time rather than module import time
        # (presumably to avoid a circular import - TODO confirm).
        from panelbox.validation.validation_suite import ValidationSuite

        suite = ValidationSuite(self)
        return suite.run(tests=tests, alpha=alpha, verbose=verbose)

    def __repr__(self) -> str:
        """Return a short one-line description: model type, nobs, parameter count."""
        return (f"PanelResults("
                f"model='{self.model_type}', "
                f"nobs={self.nobs}, "
                f"k_params={len(self.params)})")

    def __str__(self) -> str:
        """Return the full text table produced by :meth:`summary`."""
        return self.summary()

panelbox/datasets/__init__.py ADDED Viewed

File without changes

panelbox/datasets/{data}/__init__.py ADDED Viewed

File without changes

panelbox/gmm/__init__.py ADDED Viewed

@@ -0,0 +1,65 @@
+"""
+PanelBox GMM Module
+===================
+Dynamic panel data models using Generalized Method of Moments (GMM).
+This module implements:
+- Difference GMM (Arellano-Bond, 1991)
+- System GMM (Blundell-Bond, 1998)
+- One-step, two-step, and iterative estimation
+- Windmeijer (2005) finite-sample correction
+- Specification tests: Hansen J, Sargan, AR(1), AR(2)
+Classes
+-------
+DifferenceGMM : Arellano-Bond (1991) Difference GMM estimator
+SystemGMM : Blundell-Bond (1998) System GMM estimator
+GMMResults : Results from GMM estimation
+InstrumentBuilder : Generates instrument matrices
+GMMEstimator : Low-level GMM estimation routines
+GMMTests : Specification tests
+Examples
+--------
+>>> from panelbox.gmm import DifferenceGMM
+>>> model = DifferenceGMM(
+...     data=abdata,
+...     dep_var='n',
+...     lags=[1],
+...     exog_vars=['w', 'k'],
+...     time_dummies=True
+... )
+>>> results = model.fit()
+>>> print(results.summary())
+References
+----------
+.. [1] Arellano, M., & Bond, S. (1991). "Some Tests of Specification for Panel
+       Data: Monte Carlo Evidence and an Application to Employment Equations."
+       Review of Economic Studies, 58(2), 277-297.
+.. [2] Blundell, R., & Bond, S. (1998). "Initial Conditions and Moment
+       Restrictions in Dynamic Panel Data Models." Journal of Econometrics,
+       87(1), 115-143.
+.. [3] Roodman, D. (2009). "How to do xtabond2: An Introduction to Difference
+       and System GMM in Stata." Stata Journal, 9(1), 86-136.
+.. [4] Windmeijer, F. (2005). "A Finite Sample Correction for the Variance of
+       Linear Efficient Two-Step GMM Estimators." Journal of Econometrics,
+       126(1), 25-51.
+"""
+from panelbox.gmm.results import GMMResults, TestResult
+from panelbox.gmm.difference_gmm import DifferenceGMM
+from panelbox.gmm.system_gmm import SystemGMM
+__all__ = [  # names exported by `from panelbox.gmm import *`
+    'DifferenceGMM',
+    'SystemGMM',
+    'GMMResults',
+    'TestResult',
+]  # NOTE(review): the module docstring also lists InstrumentBuilder, GMMEstimator and GMMTests, which are not exported here - confirm whether that is intended
+__version__ = '0.1.0'  # NOTE(review): this file ships inside the panelbox 0.2.0 wheel - confirm the sub-package version is meant to differ