PyPI - statgpu - Versions diffs - 0.1.0__py3-none-any.whl - Mend

statgpu 0.1.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (168)

statgpu/__init__.py +174 -0
statgpu/_base.py +544 -0
statgpu/_config.py +127 -0
statgpu/anova/__init__.py +5 -0
statgpu/anova/_oneway.py +194 -0
statgpu/backends/__init__.py +83 -0
statgpu/backends/_array_ops.py +529 -0
statgpu/backends/_base.py +184 -0
statgpu/backends/_cupy.py +453 -0
statgpu/backends/_factory.py +65 -0
statgpu/backends/_gpu_inference_cupy.py +214 -0
statgpu/backends/_gpu_inference_torch.py +422 -0
statgpu/backends/_numpy.py +324 -0
statgpu/backends/_torch.py +685 -0
statgpu/backends/_torch_safe.py +47 -0
statgpu/backends/_utils.py +423 -0
statgpu/core/__init__.py +10 -0
statgpu/core/formula/__init__.py +33 -0
statgpu/core/formula/_design.py +99 -0
statgpu/core/formula/_parser.py +191 -0
statgpu/core/formula/_terms.py +70 -0
statgpu/core/formula/tests/__init__.py +0 -0
statgpu/core/formula/tests/test_parser.py +194 -0
statgpu/covariance/__init__.py +6 -0
statgpu/covariance/_empirical.py +310 -0
statgpu/covariance/_shrinkage.py +248 -0
statgpu/cross_validation/__init__.py +31 -0
statgpu/cross_validation/_base.py +410 -0
statgpu/cross_validation/_engine.py +167 -0
statgpu/diagnostics/__init__.py +7 -0
statgpu/diagnostics/_regression_diagnostics.py +188 -0
statgpu/feature_selection/__init__.py +24 -0
statgpu/feature_selection/_knockoff.py +870 -0
statgpu/feature_selection/_knockoff_utils.py +1003 -0
statgpu/feature_selection/_stepwise.py +300 -0
statgpu/glm_core/__init__.py +81 -0
statgpu/glm_core/_base.py +202 -0
statgpu/glm_core/_family.py +362 -0
statgpu/glm_core/_fused.py +149 -0
statgpu/glm_core/_gamma.py +111 -0
statgpu/glm_core/_inverse_gaussian.py +62 -0
statgpu/glm_core/_irls.py +561 -0
statgpu/glm_core/_logistic.py +82 -0
statgpu/glm_core/_negative_binomial.py +68 -0
statgpu/glm_core/_poisson.py +60 -0
statgpu/glm_core/_solver_legacy.py +100 -0
statgpu/glm_core/_squared.py +53 -0
statgpu/glm_core/_tweedie.py +74 -0
statgpu/inference/__init__.py +239 -0
statgpu/inference/_distributions_backend.py +2610 -0
statgpu/inference/_multiple_testing.py +391 -0
statgpu/inference/_resampling.py +1400 -0
statgpu/inference/_results.py +265 -0
statgpu/linear_model/__init__.py +75 -0
statgpu/linear_model/_gaussian_inference.py +306 -0
statgpu/linear_model/_glm_base.py +1261 -0
statgpu/linear_model/_ordered_logit.py +52 -0
statgpu/linear_model/_ordered_probit.py +50 -0
statgpu/linear_model/_stats.py +170 -0
statgpu/linear_model/cv/__init__.py +13 -0
statgpu/linear_model/cv/_elasticnet_cv.py +892 -0
statgpu/linear_model/cv/_lasso_cv.py +253 -0
statgpu/linear_model/cv/_logistic_cv.py +895 -0
statgpu/linear_model/cv/_ridge_cv.py +1160 -0
statgpu/linear_model/legacy/__init__.py +1 -0
statgpu/linear_model/legacy/_distributions_legacy_gpu.py +340 -0
statgpu/linear_model/legacy/_elasticnet_legacy.py +936 -0
statgpu/linear_model/legacy/_lasso_legacy.py +4876 -0
statgpu/linear_model/legacy/_penalized_legacy.py +1174 -0
statgpu/linear_model/legacy/_ridge_legacy.py +863 -0
statgpu/linear_model/legacy/_solver_legacy.py +104 -0
statgpu/linear_model/penalized/__init__.py +25 -0
statgpu/linear_model/penalized/_base.py +437 -0
statgpu/linear_model/penalized/_fit_mixin.py +1877 -0
statgpu/linear_model/penalized/_inference_mixin.py +1179 -0
statgpu/linear_model/penalized/_penalized_cv.py +2699 -0
statgpu/linear_model/penalized/_penalized_gamma.py +86 -0
statgpu/linear_model/penalized/_penalized_inverse_gaussian.py +62 -0
statgpu/linear_model/penalized/_penalized_linear.py +236 -0
statgpu/linear_model/penalized/_penalized_logistic.py +100 -0
statgpu/linear_model/penalized/_penalized_negative_binomial.py +65 -0
statgpu/linear_model/penalized/_penalized_poisson.py +62 -0
statgpu/linear_model/penalized/_penalized_tweedie.py +65 -0
statgpu/linear_model/penalized/_predict_mixin.py +182 -0
statgpu/linear_model/wrappers/__init__.py +31 -0
statgpu/linear_model/wrappers/_adaptive_lasso.py +63 -0
statgpu/linear_model/wrappers/_elasticnet.py +75 -0
statgpu/linear_model/wrappers/_gamma.py +67 -0
statgpu/linear_model/wrappers/_inverse_gaussian.py +47 -0
statgpu/linear_model/wrappers/_lasso.py +2124 -0
statgpu/linear_model/wrappers/_linear.py +1127 -0
statgpu/linear_model/wrappers/_logistic.py +1435 -0
statgpu/linear_model/wrappers/_mcp.py +58 -0
statgpu/linear_model/wrappers/_negative_binomial.py +58 -0
statgpu/linear_model/wrappers/_poisson.py +48 -0
statgpu/linear_model/wrappers/_ridge.py +166 -0
statgpu/linear_model/wrappers/_scad.py +58 -0
statgpu/linear_model/wrappers/_tweedie.py +57 -0
statgpu/metrics/__init__.py +21 -0
statgpu/metrics/_classification.py +591 -0
statgpu/nonparametric/__init__.py +50 -0
statgpu/nonparametric/kernel_methods/__init__.py +25 -0
statgpu/nonparametric/kernel_methods/_kernels.py +246 -0
statgpu/nonparametric/kernel_methods/_krr.py +234 -0
statgpu/nonparametric/kernel_methods/_krr_cv.py +380 -0
statgpu/nonparametric/kernel_smoothing/__init__.py +39 -0
statgpu/nonparametric/kernel_smoothing/_bandwidth_selection.py +1083 -0
statgpu/nonparametric/kernel_smoothing/_kde.py +761 -0
statgpu/nonparametric/kernel_smoothing/_kernel_common.py +348 -0
statgpu/nonparametric/kernel_smoothing/_kernel_regression.py +748 -0
statgpu/nonparametric/splines/__init__.py +5 -0
statgpu/nonparametric/splines/_bspline_basis.py +336 -0
statgpu/nonparametric/splines/_penalized.py +349 -0
statgpu/panel/__init__.py +19 -0
statgpu/panel/_covariance.py +140 -0
statgpu/panel/_fixed_effects.py +420 -0
statgpu/panel/_random_effects.py +385 -0
statgpu/panel/_utils.py +482 -0
statgpu/penalties/__init__.py +139 -0
statgpu/penalties/_adaptive_l1.py +313 -0
statgpu/penalties/_base.py +261 -0
statgpu/penalties/_categories.py +39 -0
statgpu/penalties/_elasticnet.py +98 -0
statgpu/penalties/_group_lasso.py +678 -0
statgpu/penalties/_group_mcp.py +553 -0
statgpu/penalties/_group_scad.py +605 -0
statgpu/penalties/_l1.py +107 -0
statgpu/penalties/_l2.py +77 -0
statgpu/penalties/_mcp.py +237 -0
statgpu/penalties/_scad.py +260 -0
statgpu/semiparametric/__init__.py +5 -0
statgpu/semiparametric/_gam.py +401 -0
statgpu/solvers/__init__.py +24 -0
statgpu/solvers/_admm.py +241 -0
statgpu/solvers/_constants.py +15 -0
statgpu/solvers/_convergence.py +6 -0
statgpu/solvers/_fista.py +436 -0
statgpu/solvers/_fista_bb.py +513 -0
statgpu/solvers/_fista_lla.py +541 -0
statgpu/solvers/_lbfgs.py +206 -0
statgpu/solvers/_newton.py +149 -0
statgpu/solvers/_utils.py +277 -0
statgpu/survival/__init__.py +14 -0
statgpu/survival/_cox.py +3974 -0
statgpu/survival/_cox_breslow_triton_kernel.py +106 -0
statgpu/survival/_cox_cv.py +1159 -0
statgpu/survival/_cox_efron_cuda.py +1280 -0
statgpu/survival/_cox_efron_triton.py +359 -0
statgpu/unsupervised/__init__.py +29 -0
statgpu/unsupervised/_agglomerative.py +307 -0
statgpu/unsupervised/_dbscan.py +263 -0
statgpu/unsupervised/_dbscan_cpu.pyx +125 -0
statgpu/unsupervised/_gmm.py +332 -0
statgpu/unsupervised/_incremental_pca.py +176 -0
statgpu/unsupervised/_kmeans.py +261 -0
statgpu/unsupervised/_minibatch_kmeans.py +299 -0
statgpu/unsupervised/_minibatch_nmf.py +252 -0
statgpu/unsupervised/_nmf.py +190 -0
statgpu/unsupervised/_pca.py +189 -0
statgpu/unsupervised/_truncated_svd.py +132 -0
statgpu/unsupervised/_tsne.py +192 -0
statgpu/unsupervised/_umap.py +224 -0
statgpu/unsupervised/_utils.py +134 -0
statgpu-0.1.0.dist-info/METADATA +245 -0
statgpu-0.1.0.dist-info/RECORD +168 -0
statgpu-0.1.0.dist-info/WHEEL +5 -0
statgpu-0.1.0.dist-info/licenses/LICENSE +199 -0
statgpu-0.1.0.dist-info/top_level.txt +1 -0

statgpu/linear_model/_ordered_logit.py ADDED Viewed

@@ -0,0 +1,52 @@
+"""Ordered logistic regression (proportional odds model)."""
+import numpy as np
+from statgpu._config import Device
+from statgpu.glm_core._family import Binomial, LogitLink
+from statgpu.linear_model._glm_base import OrderedGeneralizedLinearModel
+class OrderedLogitRegression(OrderedGeneralizedLinearModel):
+    """Ordered logistic regression, i.e. the proportional odds model.
+    The constructor only forwards its arguments to
+    ``OrderedGeneralizedLinearModel``, fixing ``family="binomial"`` and
+    ``solver="auto"``; the logit link is supplied through ``_get_family``.
+    Parameters
+    ----------
+    n_categories : int, default=3
+        Number of ordinal categories.
+    fit_intercept : bool, default=True
+    max_iter : int, default=100
+    tol : float, default=1e-4
+    C : float, default=1.0
+        Inverse regularization strength.
+    device : str or Device, default=Device.AUTO
+    n_jobs : int, default=None
+        Handed to the base class unchanged.
+    gpu_memory_cleanup : bool, default=False
+        Handed to the base class unchanged.
+    """
+    def __init__(
+        self,
+        n_categories: int = 3,
+        fit_intercept: bool = True,
+        max_iter: int = 100,
+        tol: float = 1e-4,
+        C: float = 1.0,
+        device: Device = Device.AUTO,
+        n_jobs: int = None,
+        gpu_memory_cleanup: bool = False,
+    ):
+        # Gather the pass-through options first so the two values this
+        # subclass pins down (family and solver) stand out in the call below.
+        forwarded = dict(
+            n_categories=n_categories,
+            fit_intercept=fit_intercept,
+            max_iter=max_iter,
+            tol=tol,
+            C=C,
+            device=device,
+            n_jobs=n_jobs,
+            gpu_memory_cleanup=gpu_memory_cleanup,
+        )
+        super().__init__(family="binomial", solver="auto", **forwarded)
+    def _get_family(self):
+        """Return a ``Binomial`` family built with a ``LogitLink``."""
+        logit = LogitLink()
+        return Binomial(link=logit)

statgpu/linear_model/_ordered_probit.py ADDED Viewed

@@ -0,0 +1,50 @@
+"""Ordered probit regression."""
+import numpy as np
+from statgpu._config import Device
+from statgpu.glm_core._family import Binomial, ProbitLink
+from statgpu.linear_model._glm_base import OrderedGeneralizedLinearModel
+class OrderedProbitRegression(OrderedGeneralizedLinearModel):
+    """Ordered regression model using a probit link.
+    The constructor only forwards its arguments to
+    ``OrderedGeneralizedLinearModel``, fixing ``family="binomial"`` and
+    ``solver="auto"``; the probit link is supplied through ``_get_family``.
+    Parameters
+    ----------
+    n_categories : int, default=3
+        Number of ordinal categories.
+    fit_intercept : bool, default=True
+    max_iter : int, default=100
+    tol : float, default=1e-4
+    C : float, default=1.0
+        Inverse regularization strength.
+    device : str or Device, default=Device.AUTO
+    n_jobs : int, default=None
+        Handed to the base class unchanged.
+    gpu_memory_cleanup : bool, default=False
+        Handed to the base class unchanged.
+    """
+    def __init__(
+        self,
+        n_categories: int = 3,
+        fit_intercept: bool = True,
+        max_iter: int = 100,
+        tol: float = 1e-4,
+        C: float = 1.0,
+        device: Device = Device.AUTO,
+        n_jobs: int = None,
+        gpu_memory_cleanup: bool = False,
+    ):
+        # Gather the pass-through options first so the two values this
+        # subclass pins down (family and solver) stand out in the call below.
+        forwarded = dict(
+            n_categories=n_categories,
+            fit_intercept=fit_intercept,
+            max_iter=max_iter,
+            tol=tol,
+            C=C,
+            device=device,
+            n_jobs=n_jobs,
+            gpu_memory_cleanup=gpu_memory_cleanup,
+        )
+        super().__init__(family="binomial", solver="auto", **forwarded)
+    def _get_family(self):
+        """Return a ``Binomial`` family built with a ``ProbitLink``."""
+        probit = ProbitLink()
+        return Binomial(link=probit)

statgpu/linear_model/_stats.py ADDED Viewed

@@ -0,0 +1,170 @@
+"""
+Statistical inference for linear models.
+Computes standard errors, t-statistics, p-values, etc.
+"""
+import numpy as np
+from statgpu.inference import t as t_dist, f as f_dist
+class _CallableConfInt(np.ndarray):
+    """Interval array that can also be called like ``conf_int(alpha)``.
+    ``RegressionResults`` stores its 95% intervals under the attribute name
+    ``conf_int``, which hides the method of the same name on every instance.
+    Wrapping the stored array in this subclass keeps ``results.conf_int[i, j]``
+    working and makes ``results.conf_int(alpha)`` work as well.
+    """
+    def __new__(cls, bounds, recompute):
+        wrapped = np.asarray(bounds).view(cls)
+        wrapped._recompute = recompute
+        return wrapped
+    def __array_finalize__(self, source):
+        # Views and slices inherit the callback from the array they derive from.
+        self._recompute = getattr(source, "_recompute", None)
+    def __call__(self, alpha=0.05):
+        """Return freshly computed intervals at level ``1 - alpha``."""
+        if self._recompute is None:
+            raise TypeError(
+                "confidence-interval array is not attached to a results object"
+            )
+        return self._recompute(alpha)
+class RegressionResults:
+    """
+    Results class for linear regression with statistical inference.
+    Similar to statsmodels RegressionResultsWrapper.
+    Attributes set by the constructor
+    ---------------------------------
+    bse : ndarray
+        Standard errors, ``sqrt(scale * diag((X'X)^-1))``.
+    tvalues : ndarray
+        ``params / bse``.
+    pvalues : ndarray
+        Two-sided p-values from the t distribution with ``df_resid`` degrees
+        of freedom.
+    conf_int : ndarray, callable
+        95% intervals, one ``[lower, upper]`` row per parameter. The array can
+        also be called as ``conf_int(alpha)`` to get intervals at another level.
+    """
+    def __init__(self, model, params, resid, scale, nobs, df_resid):
+        """
+        Initialize results object.
+        Parameters
+        ----------
+        model : fitted model instance
+            Must expose ``_X_design`` and ``_y``; ``_feature_names`` is
+            optional and only used by ``summary``.
+        params : ndarray
+            Estimated parameters (including intercept if fitted)
+        resid : ndarray
+            Residuals
+        scale : float
+            Estimate of error variance (sigma^2)
+        nobs : int
+            Number of observations
+        df_resid : int
+            Degrees of freedom of residuals
+        """
+        self.model = model
+        self.params = params
+        self.resid = resid
+        self.scale = scale
+        self.nobs = nobs
+        self.df_resid = df_resid
+        # Compute standard errors and statistics
+        self._compute_inference()
+    def _compute_inference(self):
+        """Compute standard errors, t-stats, p-values, confidence intervals."""
+        X = self.model._X_design
+        gram = X.T @ X
+        try:
+            gram_inv = np.linalg.inv(gram)
+        except np.linalg.LinAlgError:
+            # Singular X'X: fall back to the pseudo-inverse.
+            gram_inv = np.linalg.pinv(gram)
+        # Standard errors: sqrt(scale * diag((X'X)^-1))
+        self.bse = np.sqrt(self.scale * np.diag(gram_inv))
+        # t-statistics: coef / std_err
+        self.tvalues = self.params / self.bse
+        # p-values: two-tailed t-test
+        self.pvalues = 2 * (1 - t_dist.cdf(np.abs(self.tvalues), df=self.df_resid))
+        # This instance attribute hides the ``conf_int`` method, so it is
+        # stored as a callable array: indexing and calling both work.
+        self.conf_int = _CallableConfInt(self._interval(0.05), self._interval)
+    def _interval(self, alpha):
+        """Return ``params -/+ t_crit * bse`` as a two-column array."""
+        t_crit = float(t_dist.ppf(1 - alpha / 2, df=self.df_resid))
+        margin = t_crit * self.bse
+        return np.column_stack([self.params - margin, self.params + margin])
+    def _sums_of_squares(self):
+        """Return ``(ss_tot, ss_res)`` from ``model._y`` and the residuals."""
+        y = self.model._y
+        ss_tot = np.sum((y - np.mean(y)) ** 2)
+        ss_res = np.sum(self.resid ** 2)
+        return ss_tot, ss_res
+    @property
+    def rsquared(self):
+        """R-squared; 0.0 when the response has no variation."""
+        ss_tot, ss_res = self._sums_of_squares()
+        return 1 - ss_res / ss_tot if ss_tot > 0 else 0.0
+    @property
+    def rsquared_adj(self):
+        """Adjusted R-squared; NaN when ``nobs - k - 1`` is not positive."""
+        n = self.nobs
+        k = len(self.params) - 1  # exclude intercept from count
+        denom = n - k - 1
+        if denom <= 0:
+            # No residual degrees of freedom left: the adjustment is undefined.
+            return np.nan
+        return 1 - (1 - self.rsquared) * (n - 1) / denom
+    @property
+    def fvalue(self):
+        """F-statistic for overall model significance.
+        Returns ``inf`` when there is only one parameter or when the residual
+        sum of squares is not positive.
+        """
+        ss_tot, ss_res = self._sums_of_squares()
+        k = len(self.params) - 1
+        if k == 0 or ss_res <= 0:
+            return np.inf
+        return ((ss_tot - ss_res) / k) / (ss_res / self.df_resid)
+    @property
+    def f_pvalue(self):
+        """p-value for F-test; 1.0 when there is only one parameter."""
+        k = len(self.params) - 1
+        if k == 0:
+            return 1.0
+        return 1 - float(f_dist.cdf(self.fvalue, dfn=k, dfd=self.df_resid))
+    @property
+    def aic(self):
+        """Akaike Information Criterion, computed as ``n*log(scale) + 2*k``."""
+        n = self.nobs
+        k = len(self.params)
+        return n * np.log(self.scale) + 2 * k
+    @property
+    def bic(self):
+        """Bayesian Information Criterion, ``n*log(scale) + k*log(n)``."""
+        n = self.nobs
+        k = len(self.params)
+        return n * np.log(self.scale) + k * np.log(n)
+    def summary(self):
+        """Print summary table similar to R's summary(lm())."""
+        # Use the model's feature names when it provides them; otherwise
+        # fall back to '(Intercept)', 'x0', 'x1', ...
+        feature_names = getattr(self.model, '_feature_names', None)
+        if feature_names is None:
+            feature_names = ['(Intercept)'] + [f'x{i}' for i in range(len(self.params) - 1)]
+        bounds = self.conf_int
+        print("=" * 80)
+        print("Linear Regression Results")
+        print("=" * 80)
+        print(f"No. Observations:           {self.nobs:>15}")
+        print(f"Degrees of Freedom:         {self.df_resid:>15}")
+        print(f"R-squared:                  {self.rsquared:>15.4f}")
+        print(f"Adj. R-squared:             {self.rsquared_adj:>15.4f}")
+        print(f"F-statistic:                {self.fvalue:>15.4f}")
+        print(f"Prob (F-statistic):         {self.f_pvalue:>15.4e}")
+        print(f"Log-Likelihood:             {self.llf:>15.4f}")
+        print(f"AIC:                        {self.aic:>15.4f}")
+        print(f"BIC:                        {self.bic:>15.4f}")
+        print("-" * 80)
+        print(f"{'':<20} {'coef':>12} {'std err':>12} {'t':>10} {'P>|t|':>10} {'[0.025':>12} {'0.975]':>12}")
+        print("-" * 80)
+        for i, name in enumerate(feature_names):
+            print(f"{name:<20} {self.params[i]:>12.4f} {self.bse[i]:>12.4f} "
+                  f"{self.tvalues[i]:>10.3f} {self.pvalues[i]:>10.4f} "
+                  f"{bounds[i, 0]:>12.4f} {bounds[i, 1]:>12.4f}")
+        print("=" * 80)
+    @property
+    def llf(self):
+        """Log-likelihood, computed as ``-n/2 * (log(2*pi*scale) + 1)``."""
+        n = self.nobs
+        return -n/2 * (np.log(2 * np.pi * self.scale) + 1)
+    def conf_int(self, alpha=0.05):
+        """Confidence intervals for parameters.
+        Parameters
+        ----------
+        alpha : float, default=0.05
+            The intervals have level ``1 - alpha``.
+        Returns
+        -------
+        ndarray
+            One ``[lower, upper]`` row per parameter.
+        Notes
+        -----
+        Instances built through ``__init__`` carry an attribute of the same
+        name that hides this method; that attribute is a callable array
+        which produces the same result when called.
+        """
+        return self._interval(alpha)

statgpu/linear_model/cv/__init__.py ADDED Viewed

@@ -0,0 +1,13 @@
+"""Cross-validated model wrappers (LassoCV, RidgeCV, ElasticNetCV, LogisticRegressionCV)."""
+from ._lasso_cv import LassoCV
+from ._ridge_cv import RidgeCV
+from ._elasticnet_cv import ElasticNetCV
+from ._logistic_cv import LogisticRegressionCV
+# Public names of this package; this list is what a star-import exposes.
+__all__ = ["LassoCV", "RidgeCV", "ElasticNetCV", "LogisticRegressionCV"]