PyPI - statgpu - Versions diffs - 0.1.0__py3-none-any.whl - Mend

statgpu 0.1.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (168)

statgpu/__init__.py +174 -0
statgpu/_base.py +544 -0
statgpu/_config.py +127 -0
statgpu/anova/__init__.py +5 -0
statgpu/anova/_oneway.py +194 -0
statgpu/backends/__init__.py +83 -0
statgpu/backends/_array_ops.py +529 -0
statgpu/backends/_base.py +184 -0
statgpu/backends/_cupy.py +453 -0
statgpu/backends/_factory.py +65 -0
statgpu/backends/_gpu_inference_cupy.py +214 -0
statgpu/backends/_gpu_inference_torch.py +422 -0
statgpu/backends/_numpy.py +324 -0
statgpu/backends/_torch.py +685 -0
statgpu/backends/_torch_safe.py +47 -0
statgpu/backends/_utils.py +423 -0
statgpu/core/__init__.py +10 -0
statgpu/core/formula/__init__.py +33 -0
statgpu/core/formula/_design.py +99 -0
statgpu/core/formula/_parser.py +191 -0
statgpu/core/formula/_terms.py +70 -0
statgpu/core/formula/tests/__init__.py +0 -0
statgpu/core/formula/tests/test_parser.py +194 -0
statgpu/covariance/__init__.py +6 -0
statgpu/covariance/_empirical.py +310 -0
statgpu/covariance/_shrinkage.py +248 -0
statgpu/cross_validation/__init__.py +31 -0
statgpu/cross_validation/_base.py +410 -0
statgpu/cross_validation/_engine.py +167 -0
statgpu/diagnostics/__init__.py +7 -0
statgpu/diagnostics/_regression_diagnostics.py +188 -0
statgpu/feature_selection/__init__.py +24 -0
statgpu/feature_selection/_knockoff.py +870 -0
statgpu/feature_selection/_knockoff_utils.py +1003 -0
statgpu/feature_selection/_stepwise.py +300 -0
statgpu/glm_core/__init__.py +81 -0
statgpu/glm_core/_base.py +202 -0
statgpu/glm_core/_family.py +362 -0
statgpu/glm_core/_fused.py +149 -0
statgpu/glm_core/_gamma.py +111 -0
statgpu/glm_core/_inverse_gaussian.py +62 -0
statgpu/glm_core/_irls.py +561 -0
statgpu/glm_core/_logistic.py +82 -0
statgpu/glm_core/_negative_binomial.py +68 -0
statgpu/glm_core/_poisson.py +60 -0
statgpu/glm_core/_solver_legacy.py +100 -0
statgpu/glm_core/_squared.py +53 -0
statgpu/glm_core/_tweedie.py +74 -0
statgpu/inference/__init__.py +239 -0
statgpu/inference/_distributions_backend.py +2610 -0
statgpu/inference/_multiple_testing.py +391 -0
statgpu/inference/_resampling.py +1400 -0
statgpu/inference/_results.py +265 -0
statgpu/linear_model/__init__.py +75 -0
statgpu/linear_model/_gaussian_inference.py +306 -0
statgpu/linear_model/_glm_base.py +1261 -0
statgpu/linear_model/_ordered_logit.py +52 -0
statgpu/linear_model/_ordered_probit.py +50 -0
statgpu/linear_model/_stats.py +170 -0
statgpu/linear_model/cv/__init__.py +13 -0
statgpu/linear_model/cv/_elasticnet_cv.py +892 -0
statgpu/linear_model/cv/_lasso_cv.py +253 -0
statgpu/linear_model/cv/_logistic_cv.py +895 -0
statgpu/linear_model/cv/_ridge_cv.py +1160 -0
statgpu/linear_model/legacy/__init__.py +1 -0
statgpu/linear_model/legacy/_distributions_legacy_gpu.py +340 -0
statgpu/linear_model/legacy/_elasticnet_legacy.py +936 -0
statgpu/linear_model/legacy/_lasso_legacy.py +4876 -0
statgpu/linear_model/legacy/_penalized_legacy.py +1174 -0
statgpu/linear_model/legacy/_ridge_legacy.py +863 -0
statgpu/linear_model/legacy/_solver_legacy.py +104 -0
statgpu/linear_model/penalized/__init__.py +25 -0
statgpu/linear_model/penalized/_base.py +437 -0
statgpu/linear_model/penalized/_fit_mixin.py +1877 -0
statgpu/linear_model/penalized/_inference_mixin.py +1179 -0
statgpu/linear_model/penalized/_penalized_cv.py +2699 -0
statgpu/linear_model/penalized/_penalized_gamma.py +86 -0
statgpu/linear_model/penalized/_penalized_inverse_gaussian.py +62 -0
statgpu/linear_model/penalized/_penalized_linear.py +236 -0
statgpu/linear_model/penalized/_penalized_logistic.py +100 -0
statgpu/linear_model/penalized/_penalized_negative_binomial.py +65 -0
statgpu/linear_model/penalized/_penalized_poisson.py +62 -0
statgpu/linear_model/penalized/_penalized_tweedie.py +65 -0
statgpu/linear_model/penalized/_predict_mixin.py +182 -0
statgpu/linear_model/wrappers/__init__.py +31 -0
statgpu/linear_model/wrappers/_adaptive_lasso.py +63 -0
statgpu/linear_model/wrappers/_elasticnet.py +75 -0
statgpu/linear_model/wrappers/_gamma.py +67 -0
statgpu/linear_model/wrappers/_inverse_gaussian.py +47 -0
statgpu/linear_model/wrappers/_lasso.py +2124 -0
statgpu/linear_model/wrappers/_linear.py +1127 -0
statgpu/linear_model/wrappers/_logistic.py +1435 -0
statgpu/linear_model/wrappers/_mcp.py +58 -0
statgpu/linear_model/wrappers/_negative_binomial.py +58 -0
statgpu/linear_model/wrappers/_poisson.py +48 -0
statgpu/linear_model/wrappers/_ridge.py +166 -0
statgpu/linear_model/wrappers/_scad.py +58 -0
statgpu/linear_model/wrappers/_tweedie.py +57 -0
statgpu/metrics/__init__.py +21 -0
statgpu/metrics/_classification.py +591 -0
statgpu/nonparametric/__init__.py +50 -0
statgpu/nonparametric/kernel_methods/__init__.py +25 -0
statgpu/nonparametric/kernel_methods/_kernels.py +246 -0
statgpu/nonparametric/kernel_methods/_krr.py +234 -0
statgpu/nonparametric/kernel_methods/_krr_cv.py +380 -0
statgpu/nonparametric/kernel_smoothing/__init__.py +39 -0
statgpu/nonparametric/kernel_smoothing/_bandwidth_selection.py +1083 -0
statgpu/nonparametric/kernel_smoothing/_kde.py +761 -0
statgpu/nonparametric/kernel_smoothing/_kernel_common.py +348 -0
statgpu/nonparametric/kernel_smoothing/_kernel_regression.py +748 -0
statgpu/nonparametric/splines/__init__.py +5 -0
statgpu/nonparametric/splines/_bspline_basis.py +336 -0
statgpu/nonparametric/splines/_penalized.py +349 -0
statgpu/panel/__init__.py +19 -0
statgpu/panel/_covariance.py +140 -0
statgpu/panel/_fixed_effects.py +420 -0
statgpu/panel/_random_effects.py +385 -0
statgpu/panel/_utils.py +482 -0
statgpu/penalties/__init__.py +139 -0
statgpu/penalties/_adaptive_l1.py +313 -0
statgpu/penalties/_base.py +261 -0
statgpu/penalties/_categories.py +39 -0
statgpu/penalties/_elasticnet.py +98 -0
statgpu/penalties/_group_lasso.py +678 -0
statgpu/penalties/_group_mcp.py +553 -0
statgpu/penalties/_group_scad.py +605 -0
statgpu/penalties/_l1.py +107 -0
statgpu/penalties/_l2.py +77 -0
statgpu/penalties/_mcp.py +237 -0
statgpu/penalties/_scad.py +260 -0
statgpu/semiparametric/__init__.py +5 -0
statgpu/semiparametric/_gam.py +401 -0
statgpu/solvers/__init__.py +24 -0
statgpu/solvers/_admm.py +241 -0
statgpu/solvers/_constants.py +15 -0
statgpu/solvers/_convergence.py +6 -0
statgpu/solvers/_fista.py +436 -0
statgpu/solvers/_fista_bb.py +513 -0
statgpu/solvers/_fista_lla.py +541 -0
statgpu/solvers/_lbfgs.py +206 -0
statgpu/solvers/_newton.py +149 -0
statgpu/solvers/_utils.py +277 -0
statgpu/survival/__init__.py +14 -0
statgpu/survival/_cox.py +3974 -0
statgpu/survival/_cox_breslow_triton_kernel.py +106 -0
statgpu/survival/_cox_cv.py +1159 -0
statgpu/survival/_cox_efron_cuda.py +1280 -0
statgpu/survival/_cox_efron_triton.py +359 -0
statgpu/unsupervised/__init__.py +29 -0
statgpu/unsupervised/_agglomerative.py +307 -0
statgpu/unsupervised/_dbscan.py +263 -0
statgpu/unsupervised/_dbscan_cpu.pyx +125 -0
statgpu/unsupervised/_gmm.py +332 -0
statgpu/unsupervised/_incremental_pca.py +176 -0
statgpu/unsupervised/_kmeans.py +261 -0
statgpu/unsupervised/_minibatch_kmeans.py +299 -0
statgpu/unsupervised/_minibatch_nmf.py +252 -0
statgpu/unsupervised/_nmf.py +190 -0
statgpu/unsupervised/_pca.py +189 -0
statgpu/unsupervised/_truncated_svd.py +132 -0
statgpu/unsupervised/_tsne.py +192 -0
statgpu/unsupervised/_umap.py +224 -0
statgpu/unsupervised/_utils.py +134 -0
statgpu-0.1.0.dist-info/METADATA +245 -0
statgpu-0.1.0.dist-info/RECORD +168 -0
statgpu-0.1.0.dist-info/WHEEL +5 -0
statgpu-0.1.0.dist-info/licenses/LICENSE +199 -0
statgpu-0.1.0.dist-info/top_level.txt +1 -0

statgpu/anova/_oneway.py ADDED Viewed

@@ -0,0 +1,194 @@
+"""GPU-accelerated one-way ANOVA.
+Provides :func:`f_oneway`, a backend-agnostic replacement for
+``scipy.stats.f_oneway`` that can run on NumPy, CuPy, or PyTorch arrays.
+"""
+from __future__ import annotations
+__all__ = ["f_oneway"]
+from dataclasses import dataclass
+from typing import Any, Tuple, Union
+import numpy as np
+from statgpu.backends import _get_xp, _resolve_backend, _to_float_scalar, _to_numpy
+# ---------------------------------------------------------------------------
+# Result container
+# ---------------------------------------------------------------------------
+@dataclass
+class AnovaResult:
+    """Result container returned by :func:`f_oneway`.
+    Attributes
+    ----------
+    statistic : float
+        The F-statistic (between-group mean square divided by the
+        within-group mean square).  ``f_oneway`` reports ``nan`` when both
+        sums of squares are zero and ``inf`` when only the within-group sum
+        of squares is zero.
+    pvalue : float
+        P-value from the F-distribution survival function; ``nan`` and
+        ``0.0`` respectively in the two degenerate cases above.
+    df_between : int
+        Degrees of freedom between groups (k - 1).
+    df_within : int
+        Degrees of freedom within groups (N - k).
+    eta_squared : float
+        Effect size: SSB / (SSB + SSW); ``nan`` and ``1.0`` respectively in
+        the two degenerate cases above.
+    """
+    statistic: float
+    pvalue: float
+    df_between: int
+    df_within: int
+    eta_squared: float
+# ---------------------------------------------------------------------------
+# Core implementation
+# ---------------------------------------------------------------------------
+def f_oneway(
+    *groups: Any,
+    backend: str = "auto",
+    dtype: Any = None,
+) -> AnovaResult:
+    """Perform a one-way ANOVA.
+    Parameters
+    ----------
+    *groups : array-like
+        Two or more sample arrays, one per group.  Each must be 1-D (or
+        flattenable to 1-D).
+    backend : {'auto', 'numpy', 'cupy', 'torch'}, default='auto'
+        Compute backend.  ``'auto'`` inspects the input arrays and picks the
+        best match.
+    dtype : dtype or None, default=None
+        Float dtype for computation.  ``None`` uses ``float64``.
+        Pass ``float32`` for faster GPU computation on consumer GPUs.
+    Returns
+    -------
+    AnovaResult
+        Dataclass with ``statistic``, ``pvalue``, ``df_between``,
+        ``df_within``, and ``eta_squared``.
+    Raises
+    ------
+    ValueError
+        If fewer than 2 groups are supplied or any group has fewer than 1
+        observation.
+    Examples
+    --------
+    >>> import numpy as np
+    >>> from statgpu.anova import f_oneway
+    >>> g1 = np.array([5.1, 4.9, 5.0])
+    >>> g2 = np.array([6.2, 6.0, 6.3])
+    >>> g3 = np.array([7.1, 7.3, 7.0])
+    >>> result = f_oneway(g1, g2, g3)
+    >>> result.statistic  # doctest: +SKIP
+    114.54545454545453
+    """
+    if len(groups) < 2:
+        raise ValueError("f_oneway requires at least 2 groups")
+    # Resolve backend from input arrays
+    resolved = _resolve_backend(backend, *groups)
+    xp = _get_xp(resolved)
+    # Resolve dtype
+    float_dtype = dtype if dtype is not None else xp.float64
+    # Convert groups to flat arrays in the target backend
+    flat_groups = []
+    for g in groups:
+        arr = xp.asarray(g, dtype=float_dtype).ravel()
+        n_i = int(arr.shape[0])
+        if n_i < 1:
+            raise ValueError("each group must contain at least 1 observation")
+        flat_groups.append(arr)
+    k = len(flat_groups)
+    # Use first group as device reference for torch
+    ref = flat_groups[0]
+    group_sizes = xp.asarray([int(g.shape[0]) for g in flat_groups], dtype=float_dtype)
+    # Ensure group_sizes is on same device as groups (torch CUDA)
+    if hasattr(group_sizes, 'to') and hasattr(ref, 'device'):
+        group_sizes = group_sizes.to(device=ref.device)
+    N = _to_float_scalar(xp.sum(group_sizes))
+    if N <= k:
+        raise ValueError(
+            f"total observations ({int(N)}) must exceed number of groups ({k})"
+        )
+    # Group means — computed on device, single sync at the end
+    group_means = xp.empty(k, dtype=float_dtype)
+    if hasattr(group_means, 'to') and hasattr(ref, 'device'):
+        group_means = group_means.to(device=ref.device)
+    for i, g in enumerate(flat_groups):
+        group_means[i] = xp.sum(g) / g.shape[0]
+    # Grand mean (weighted by group sizes)
+    grand_mean = xp.sum(group_means * group_sizes) / N
+    # SSB (between-group sum of squares)
+    ssb = xp.sum(group_sizes * (group_means - grand_mean) ** 2)
+    # SSW (within-group sum of squares)
+    ssw = xp.zeros(1, dtype=float_dtype)
+    if hasattr(ssw, 'to') and hasattr(ref, 'device'):
+        ssw = ssw.to(device=ref.device)
+    for i, g in enumerate(flat_groups):
+        diff = g - group_means[i]
+        ssw = ssw + xp.sum(diff * diff)
+    # Single sync to CPU
+    ssb = _to_float_scalar(ssb)
+    ssw = _to_float_scalar(ssw)
+    df_between = k - 1
+    df_within = int(N) - k
+    # Edge case: no within-group variance
+    if ssw == 0.0:
+        if ssb == 0.0:
+            # All observations identical
+            return AnovaResult(
+                statistic=float("nan"),
+                pvalue=float("nan"),
+                df_between=df_between,
+                df_within=df_within,
+                eta_squared=float("nan"),
+            )
+        # Perfect separation
+        return AnovaResult(
+            statistic=float("inf"),
+            pvalue=0.0,
+            df_between=df_between,
+            df_within=df_within,
+            eta_squared=1.0,
+        )
+    ms_between = ssb / df_between
+    ms_within = ssw / df_within
+    f_stat = ms_between / ms_within
+    eta_squared = ssb / (ssb + ssw)
+    # P-value from F survival function via statgpu.inference
+    from statgpu.inference._distributions_backend import get_distribution
+    f_dist = get_distribution("f", backend=resolved)
+    pvalue_arr = f_dist.sf(f_stat, df_between, df_within)
+    pvalue = _to_float_scalar(pvalue_arr)
+    return AnovaResult(
+        statistic=f_stat,
+        pvalue=pvalue,
+        df_between=df_between,
+        df_within=df_within,
+        eta_squared=eta_squared,
+    )

statgpu/backends/__init__.py ADDED Viewed

@@ -0,0 +1,83 @@
+"""
+statgpu.backends – pluggable compute backends for array operations.
+Supported backends
+------------------
+* **NumpyBackend** – CPU, always available.
+* **CuPyBackend**  – CUDA GPU via CuPy (install ``statgpu[gpu11]`` or
+  ``statgpu[gpu12]``).
+* **TorchBackend** – CUDA GPU (or CPU) via PyTorch (install
+  ``statgpu[torch]``).
+Quick start
+-----------
+>>> from statgpu.backends import get_backend
+>>> backend = get_backend()        # auto-detects best available backend
+>>> xp = backend.xp                # array module (numpy / cupy / torch)
+>>> arr = backend.asarray([1, 2, 3])
+>>> backend.to_numpy(arr)
+array([1, 2, 3])
+Use ``get_backend(backend='cupy')`` or ``get_backend(backend='torch')`` to
+force a specific library.
+"""
+from ._base import BackendBase, _is_cupy_array, _is_torch_array, _resolve_backend
+from ._numpy import NumpyBackend
+from ._cupy import CuPyBackend
+from ._torch import TorchBackend
+from ._factory import get_backend
+from ._utils import (
+    _get_xp,
+    _to_numpy,
+    _to_float_scalar,
+    _get_torch_device_str,
+    _cupy_to_torch_dlpack,
+    _torch_to_cupy_dlpack,
+    _numpy_to_torch_tensor,
+    _move_torch_tensor,
+    _torch_dev,
+    _LINALG_ERRORS,
+    xp_zeros,
+    xp_eye,
+    xp_full,
+    xp_astype,
+    xp_asarray,
+    xp_empty,
+    xp_arange,
+    xp_ones,
+    xp_maximum,
+    xp_copy,
+    xp_cholesky_solve,
+)
+__all__ = [
+    "BackendBase",
+    "NumpyBackend",
+    "CuPyBackend",
+    "TorchBackend",
+    "get_backend",
+    "_is_cupy_array",
+    "_is_torch_array",
+    "_resolve_backend",
+    "_get_xp",
+    "_to_numpy",
+    "_to_float_scalar",
+    "_get_torch_device_str",
+    "_cupy_to_torch_dlpack",
+    "_torch_to_cupy_dlpack",
+    "_numpy_to_torch_tensor",
+    "_move_torch_tensor",
+    "_torch_dev",
+    "xp_zeros",
+    "xp_eye",
+    "xp_full",
+    "xp_astype",
+    "xp_asarray",
+    "xp_empty",
+    "xp_arange",
+    "xp_ones",
+    "xp_maximum",
+    "xp_copy",
+    "xp_cholesky_solve",
+]