warpgbm 0.1.15__tar.gz → 0.1.16__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
@@ -1,6 +1,6 @@
 Metadata-Version: 2.4
 Name: warpgbm
-Version: 0.1.15
+Version: 0.1.16
 Summary: A fast GPU-accelerated Gradient Boosted Decision Tree library with PyTorch + CUDA
 License: GNU GENERAL PUBLIC LICENSE
         Version 3, 29 June 2007
@@ -735,6 +735,17 @@ This installs from PyPI and also compiles CUDA code locally during installation.
 > pip install warpgbm --no-build-isolation
 > ```

+### Windows
+
+Thank you, ShatteredX, for providing working instructions for a Windows installation.
+
+```
+git clone https://github.com/jefferythewind/warpgbm.git
+cd warpgbm
+python setup.py bdist_wheel
+pip install .\dist\warpgbm-0.1.15-cp310-cp310-win_amd64.whl
+```
+
 Before either method, make sure you’ve installed PyTorch with GPU support:\
 [https://pytorch.org/get-started/locally/](https://pytorch.org/get-started/locally/)

@@ -47,6 +47,17 @@ This installs from PyPI and also compiles CUDA code locally during installation.
 > pip install warpgbm --no-build-isolation
 > ```

+### Windows
+
+Thank you, ShatteredX, for providing working instructions for a Windows installation.
+
+```
+git clone https://github.com/jefferythewind/warpgbm.git
+cd warpgbm
+python setup.py bdist_wheel
+pip install .\dist\warpgbm-0.1.15-cp310-cp310-win_amd64.whl
+```
+
 Before either method, make sure you’ve installed PyTorch with GPU support:\
 [https://pytorch.org/get-started/locally/](https://pytorch.org/get-started/locally/)

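Not part of the diff: once the wheel is installed, a quick smoke test can confirm the build works. This is a minimal sketch, assuming the scikit-learn-style `fit`/`predict` interface implied by `RegressorMixin` in the core module changes below, plus a CUDA-capable GPU:

```python
# Hypothetical post-install smoke test (assumed API, not shown in the diff).
import numpy as np
from warpgbm import WarpGBM

X = np.random.randn(1_000, 10).astype(np.float32)
y = (2.0 * X[:, 0] - X[:, 1]).astype(np.float32)

model = WarpGBM(n_estimators=10)  # remaining constructor args left at their defaults
model.fit(X, y)                   # era_id is optional, per the fit() signature below
preds = model.predict(X)
print(np.corrcoef(preds, y)[0, 1])  # should be strongly positive on this easy target
```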
@@ -4,7 +4,7 @@ build-backend = "setuptools.build_meta"

 [project]
 name = "warpgbm"
-version = "0.1.15"
+version = "0.1.16"
 description = "A fast GPU-accelerated Gradient Boosted Decision Tree library with PyTorch + CUDA"
 readme = "README.md"
 requires-python = ">=3.8"
@@ -1,14 +1,12 @@
 import numpy as np
 from warpgbm import WarpGBM
+from sklearn.datasets import make_regression

 def test_fit_predict_correlation():
     np.random.seed(42)
-    N = 500
-    F = 5
-    X = np.random.randn(N, F).astype(np.float32)
-    true_weights = np.array([0.5, -1.0, 2.0, 0.0, 1.0])
-    noise = 0.1 * np.random.randn(N)
-    y = (X @ true_weights + noise).astype(np.float32)
+    N = 1_000_000
+    F = 100
+    X, y = make_regression(n_samples=N, n_features=F, noise=0.1, random_state=42)
     era = np.zeros(N, dtype=np.int32)
     corrs = []

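The rewritten test replaces the hand-rolled 500×5 linear dataset with sklearn's `make_regression` at 1,000,000 samples × 100 features, turning a unit test into more of a GPU stress test. One detail worth flagging (illustrative, not from the diff): `make_regression` returns float64 arrays, while the old code cast explicitly to float32:

```python
# Sketch of the new data generation; the dtype check is the point here.
import numpy as np
from sklearn.datasets import make_regression

X, y = make_regression(n_samples=1_000_000, n_features=100, noise=0.1, random_state=42)
print(X.dtype, y.dtype)  # float64 float64; an .astype(np.float32) may still be
                         # needed if fit() expects float32 inputs
```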
@@ -0,0 +1 @@
+0.1.16
@@ -3,6 +3,8 @@ import numpy as np
 from sklearn.base import BaseEstimator, RegressorMixin
 from warpgbm.cuda import node_kernel
 from tqdm import tqdm
+from typing import Tuple
+from torch import Tensor

 histogram_kernels = {
     'hist1': node_kernel.compute_histogram,
@@ -10,6 +12,40 @@ histogram_kernels = {
     'hist3': node_kernel.compute_histogram3
 }

+@torch.jit.script
+def jit_find_best_split(
+    G: Tensor, H: Tensor,
+    lambda_l2: float,
+    lambda_l1: float,  # unused placeholder for now
+    min_split_gain: float,
+    min_child_weight: float
+) -> Tuple[int, int]:
+    F, B = G.size()
+    Bm1 = B - 1
+    eps = 0
+
+    GH = torch.stack([G, H], dim=0).cumsum(dim=2)  # [2, F, B]
+    GL, HL_raw = GH[0, :, :-1], GH[1, :, :-1]      # [F, B-1]
+    GP, HP = GH[0, :, -1:], GH[1, :, -1:]          # [F, 1]
+    H_R_raw = HP - HL_raw
+
+    # Validity mask using raw child hessians
+    valid = (HL_raw >= min_child_weight) & (H_R_raw >= min_child_weight)
+
+    # Closed-form gain
+    HL, HP = HL_raw + lambda_l2, HP + lambda_l2
+    num = (HP * GL - HL * GP).pow(2)
+    denom = HP * HL * (HP - HL) + eps
+    gain = torch.where(valid & (num / denom >= min_split_gain), num / denom, torch.full_like(num, -float("inf")))
+
+    gain_flat = gain.view(-1)
+    best_idx = torch.argmax(gain_flat)
+
+    if gain_flat[best_idx].item() == float('-inf'):
+        return -1, -1
+
+    return best_idx // Bm1, best_idx % Bm1
+
 class WarpGBM(BaseEstimator, RegressorMixin):
     def __init__(
         self,
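The new TorchScript split finder is the standard histogram-based exact greedy search: a cumulative sum over bins yields every candidate left-child total at once, and the fused `num / denom` expression is algebraically the textbook two-child gain. A standalone sketch of that identity (illustrative, not package code):

```python
# Verifies: (HP*GL - HL*GP)^2 / (HP*HL*(HP-HL)) == GL^2/HL + GR^2/HR - GP^2/HP
# where GR = GP - GL and HR = HP - HL, at every candidate split point.
import torch

torch.manual_seed(0)
F, B = 4, 8
G = torch.randn(F, B).cumsum(dim=1)  # stand-in cumulative gradient histogram [F, B]
H = torch.rand(F, B).cumsum(dim=1)   # stand-in cumulative hessian histogram [F, B]
lam = 1e-6

GL, HL = G[:, :-1], H[:, :-1] + lam  # left child at each candidate boundary
GP, HP = G[:, -1:], H[:, -1:] + lam  # parent totals (last cumulative bin)
GR, HR = GP - GL, HP - HL            # right child by subtraction

fused = (HP * GL - HL * GP).pow(2) / (HP * HL * (HP - HL))
classic = GL.pow(2) / HL + GR.pow(2) / HR - GP.pow(2) / HP
print(torch.allclose(fused, classic, atol=1e-4))  # True
```

One subtlety visible in the code above: `lambda_l2` is added to the left-child and parent hessians only, so the right child's effective hessian `HP - HL` is its raw total. That is worth knowing when comparing gains against other GBM implementations.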
@@ -24,6 +60,7 @@ class WarpGBM(BaseEstimator, RegressorMixin):
         threads_per_block=64,
         rows_per_thread=4,
         L2_reg = 1e-6,
+        L1_reg = 0.0,
         device = 'cuda'
     ):
         self.num_bins = num_bins
@@ -54,7 +91,7 @@ class WarpGBM(BaseEstimator, RegressorMixin):
         self.threads_per_block = threads_per_block
         self.rows_per_thread = rows_per_thread
         self.L2_reg = L2_reg
-
+        self.L1_reg = L1_reg

     def fit(self, X, y, era_id=None):
         if era_id is None:
@@ -121,20 +158,14 @@ class WarpGBM(BaseEstimator, RegressorMixin):
         return grad_hist, hess_hist

     def find_best_split(self, gradient_histogram, hessian_histogram):
-        node_kernel.compute_split(
-            gradient_histogram.contiguous(),
-            hessian_histogram.contiguous(),
-            self.num_features,
-            self.num_bins,
+        f,b = jit_find_best_split(
+            gradient_histogram,
+            hessian_histogram,
+            self.L2_reg,
+            self.L1_reg,
             self.min_split_gain,
             self.min_child_weight,
-            self.L2_reg,
-            self.out_feature,
-            self.out_bin
         )
-
-        f = int(self.out_feature[0])
-        b = int(self.out_bin[0])
         return (f, b)

     def grow_tree(self, gradient_histogram, hessian_histogram, node_indices, depth):
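Interface note: the removed CUDA path wrote its result into preallocated `self.out_feature` / `self.out_bin` buffers that were read back on the host, whereas the TorchScript function returns the pair directly, with `(-1, -1)` meaning no bin satisfied `min_child_weight` and `min_split_gain`. A hedged calling sketch (the import path and argument values are assumptions, not shown in the diff):

```python
import torch
from warpgbm.core import jit_find_best_split  # import path assumed

grad_hist = torch.randn(5, 16)       # [features, bins] per-bin gradient sums
hess_hist = torch.rand(5, 16) + 0.1  # [features, bins] per-bin hessian sums

f, b = jit_find_best_split(
    grad_hist, hess_hist,
    1e-6,  # lambda_l2
    0.0,   # lambda_l1 (currently an unused placeholder)
    0.0,   # min_split_gain
    1.0,   # min_child_weight
)
if f == -1:
    print("no valid split: the node becomes a leaf")
else:
    print(f"split feature {f} at bin boundary {b}")
```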
@@ -182,7 +213,7 @@ class WarpGBM(BaseEstimator, RegressorMixin):
         forest = [{} for _ in range(self.n_estimators)]
         self.training_loss = []

-        for i in range(self.n_estimators):
+        for i in tqdm( range(self.n_estimators) ):
             self.residual = self.Y_gpu - self.gradients

             self.root_gradient_histogram, self.root_hessian_histogram = \
@@ -195,8 +226,8 @@ class WarpGBM(BaseEstimator, RegressorMixin):
                 depth=0
             )
             forest[i] = tree
-            loss = ((self.Y_gpu - self.gradients) ** 2).mean().item()
-            self.training_loss.append(loss)
+            # loss = ((self.Y_gpu - self.gradients) ** 2).mean().item()
+            # self.training_loss.append(loss)
             # print(f"🌲 Tree {i+1}/{self.n_estimators} - MSE: {loss:.6f}")

         print("Finished training forest.")
@@ -1,6 +1,6 @@
 Metadata-Version: 2.4
 Name: warpgbm
-Version: 0.1.15
+Version: 0.1.16
 Summary: A fast GPU-accelerated Gradient Boosted Decision Tree library with PyTorch + CUDA
 License: GNU GENERAL PUBLIC LICENSE
         Version 3, 29 June 2007
@@ -735,6 +735,17 @@ This installs from PyPI and also compiles CUDA code locally during installation.
 > pip install warpgbm --no-build-isolation
 > ```

+### Windows
+
+Thank you, ShatteredX, for providing working instructions for a Windows installation.
+
+```
+git clone https://github.com/jefferythewind/warpgbm.git
+cd warpgbm
+python setup.py bdist_wheel
+pip install .\dist\warpgbm-0.1.15-cp310-cp310-win_amd64.whl
+```
+
 Before either method, make sure you’ve installed PyTorch with GPU support:\
 [https://pytorch.org/get-started/locally/](https://pytorch.org/get-started/locally/)

@@ -1 +0,0 @@
-0.1.15
6 files without changes