unifiedbooster 0.1.2.tar.gz → 0.2.0.tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
--- unifiedbooster-0.1.2/PKG-INFO
+++ unifiedbooster-0.2.0/PKG-INFO
@@ -1,7 +1,7 @@
  Metadata-Version: 2.1
  Name: unifiedbooster
- Version: 0.1.2
- Summary: Call R functions from Python
+ Version: 0.2.0
+ Summary: Unified interface for Gradient Boosted Decision Trees
  Home-page: https://github.com/thierrymoudiki/unifiedbooster
  Author: T. Moudiki
  Author-email: thierry.moudiki@gmail.com
@@ -17,9 +17,11 @@ Classifier: Programming Language :: Python :: 3.7
  Classifier: Programming Language :: Python :: 3.8
  Requires-Python: >=3.6
  Requires-Dist: Cython
+ Requires-Dist: numpy
  Requires-Dist: scikit-learn
  Requires-Dist: xgboost
  Requires-Dist: lightgbm
  Requires-Dist: catboost
+ Requires-Dist: GPopt

  Unified interface for Gradient Boosted Decision Trees
--- unifiedbooster-0.1.2/setup.py
+++ unifiedbooster-0.2.0/setup.py
@@ -10,7 +10,7 @@ from os import path

  subprocess.check_call(['pip', 'install', 'Cython'])

- __version__ = "0.1.2"
+ __version__ = "0.2.0"

  here = path.abspath(path.dirname(__file__))

@@ -44,7 +44,7 @@ setup(
      'Programming Language :: Python :: 3.7',
      'Programming Language :: Python :: 3.8',
  ],
- description="Call R functions from Python",
+ description="Unified interface for Gradient Boosted Decision Trees",
  entry_points={
      'console_scripts': [
          'unifiedbooster=unifiedbooster.cli:main',
--- /dev/null
+++ unifiedbooster-0.2.0/unifiedbooster/gbdt.py
@@ -0,0 +1,68 @@
+ import numpy as np
+ from sklearn.base import BaseEstimator
+
+
+ class GBDT(BaseEstimator):
+     def __init__(self,
+                  model_type='xgboost',
+                  n_estimators=100,
+                  learning_rate=0.1,
+                  max_depth=3,
+                  rowsample=1.0,
+                  colsample=1.0,
+                  verbose=0,
+                  seed=123,
+                  **kwargs):
+
+         self.model_type = model_type
+         self.n_estimators = n_estimators
+         self.learning_rate = learning_rate
+         self.max_depth = max_depth
+         self.rowsample = rowsample
+         self.colsample = colsample
+         self.verbose = verbose
+         self.seed = seed
+
+         if self.model_type == "xgboost":
+             self.params = {
+                 'n_estimators': self.n_estimators,
+                 'learning_rate': self.learning_rate,
+                 'subsample': self.rowsample,
+                 'colsample_bynode': self.colsample,
+                 'max_depth': self.max_depth,
+                 'verbosity': self.verbose,
+                 'seed': self.seed,
+                 **kwargs
+             }
+         elif self.model_type == "lightgbm":
+             verbose = self.verbose - 1 if self.verbose == 0 else self.verbose
+             self.params = {
+                 'n_estimators': self.n_estimators,
+                 'learning_rate': self.learning_rate,
+                 'subsample': self.rowsample,
+                 'feature_fraction_bynode': self.colsample,
+                 'max_depth': self.max_depth,
+                 'verbose': verbose,  # keep this way
+                 'seed': self.seed,
+                 **kwargs
+             }
+         elif self.model_type == "catboost":
+             self.params = {
+                 'iterations': self.n_estimators,
+                 'learning_rate': self.learning_rate,
+                 'subsample': self.rowsample,
+                 'rsm': self.colsample,
+                 'depth': self.max_depth,
+                 'verbose': self.verbose,
+                 'random_seed': self.seed,
+                 **kwargs
+             }
+
+     def fit(self, X, y, **kwargs):
+         if getattr(self, "type_fit") == "classification":
+             self.classes_ = np.unique(y)  # for compatibility with sklearn
+             self.n_classes_ = len(self.classes_)  # for compatibility with sklearn
+         return getattr(self, "model").fit(X, y, **kwargs)
+
+     def predict(self, X):
+         return getattr(self, "model").predict(X)
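
The heart of the 0.2.0 refactor is this new shared `GBDT` base class, which translates one set of unified constructor arguments into each backend's native parameter names. A minimal sketch of that translation, assuming unifiedbooster 0.2.0 is installed and `GBDT` is importable from `unifiedbooster.gbdt` as this file's path suggests:

```python
# Sketch: inspect the per-backend parameter dicts built in GBDT.__init__.
# Assumes unifiedbooster 0.2.0 is installed.
from unifiedbooster.gbdt import GBDT

shared = dict(n_estimators=200, learning_rate=0.05, max_depth=4,
              rowsample=0.8, colsample=0.5, seed=42)

for backend in ("xgboost", "lightgbm", "catboost"):
    print(backend, "->", GBDT(model_type=backend, **shared).params)
# xgboost  maps rowsample -> 'subsample', colsample -> 'colsample_bynode'
# lightgbm maps rowsample -> 'subsample', colsample -> 'feature_fraction_bynode'
# catboost maps rowsample -> 'subsample', colsample -> 'rsm',
#          n_estimators -> 'iterations', max_depth -> 'depth'
```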
--- /dev/null
+++ unifiedbooster-0.2.0/unifiedbooster/gbdt_classification.py
@@ -0,0 +1,106 @@
+ from .gbdt import GBDT
+ from sklearn.base import ClassifierMixin
+ from xgboost import XGBClassifier
+ from catboost import CatBoostClassifier
+ from lightgbm import LGBMClassifier
+
+
+ class GBDTClassifier(GBDT, ClassifierMixin):
+     """GBDT Classification model
+
+     Attributes:
+
+         model_type: str
+             the gradient boosting backend: 'xgboost', 'lightgbm' or 'catboost'
+
+         n_estimators: int
+             maximum number of trees that can be built
+
+         learning_rate: float
+             shrinkage rate; used for reducing the gradient step
+
+         max_depth: int
+             maximum tree depth
+
+         rowsample: float
+             subsample ratio of the training instances
+
+         colsample: float
+             percentage of features to use at each node split
+
+         verbose: int
+             controls verbosity (default=0)
+
+         seed: int
+             reproducibility seed
+
+     Examples:
+
+         ```python
+         import unifiedbooster as ub
+         from sklearn.datasets import load_iris
+         from sklearn.model_selection import train_test_split
+         from sklearn.metrics import accuracy_score
+
+         # Load dataset
+         iris = load_iris()
+         X, y = iris.data, iris.target
+
+         # Split dataset into training and testing sets
+         X_train, X_test, y_train, y_test = train_test_split(X, y, test_size=0.2, random_state=42)
+
+         # Initialize the unified classifiers (XGBoost and LightGBM shown; CatBoost commented out)
+         classifier1 = ub.GBDTClassifier(model_type='xgboost')
+         #classifier2 = ub.GBDTClassifier(model_type='catboost')
+         classifier3 = ub.GBDTClassifier(model_type='lightgbm')
+
+         # Fit the models
+         classifier1.fit(X_train, y_train)
+         #classifier2.fit(X_train, y_train)
+         classifier3.fit(X_train, y_train)
+
+         # Predict on the test set
+         y_pred1 = classifier1.predict(X_test)
+         #y_pred2 = classifier2.predict(X_test)
+         y_pred3 = classifier3.predict(X_test)
+
+         # Evaluate the models
+         accuracy1 = accuracy_score(y_test, y_pred1)
+         #accuracy2 = accuracy_score(y_test, y_pred2)
+         accuracy3 = accuracy_score(y_test, y_pred3)
+         print(f"Classification Accuracy xgboost: {accuracy1:.2f}")
+         #print(f"Classification Accuracy catboost: {accuracy2:.2f}")
+         print(f"Classification Accuracy lightgbm: {accuracy3:.2f}")
+         ```
+     """
+
+     def __init__(self,
+                  model_type='xgboost',
+                  n_estimators=100,
+                  learning_rate=0.1,
+                  max_depth=3,
+                  rowsample=1.0,
+                  colsample=1.0,
+                  verbose=0,
+                  seed=123,
+                  **kwargs):
+
+         self.type_fit = "classification"
+
+         super().__init__(
+             model_type=model_type,
+             n_estimators=n_estimators,
+             learning_rate=learning_rate,
+             max_depth=max_depth,
+             rowsample=rowsample,
+             colsample=colsample,
+             verbose=verbose,
+             seed=seed,
+             **kwargs
+         )
+
+         if model_type == 'xgboost':
+             self.model = XGBClassifier(**self.params)
+         elif model_type == 'catboost':
+             self.model = CatBoostClassifier(**self.params)
+         elif model_type == 'lightgbm':
+             self.model = LGBMClassifier(**self.params)
+         else:
+             raise ValueError(f"Unknown model_type: {model_type}")
+
+     def predict_proba(self, X):
+         return self.model.predict_proba(X)
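
Because `GBDTClassifier` derives from scikit-learn's `BaseEstimator` and stores every named constructor argument unchanged, it should survive scikit-learn's `clone`, and `fit` now exposes `classes_`/`n_classes_`. A minimal cross-validation sketch, assuming unifiedbooster 0.2.0 is installed (note two caveats visible in the diff: `**kwargs` are not reported by `get_params`, and `set_params` alone would not rebuild the wrapped backend model, so a fresh estimator is constructed per configuration):

```python
# Sketch: cross-validate GBDTClassifier with scikit-learn tooling.
# Cloning relies on the named constructor arguments only.
import unifiedbooster as ub
from sklearn.datasets import load_iris
from sklearn.model_selection import cross_val_score

X, y = load_iris(return_X_y=True)

for depth in (2, 3, 4):
    # Build a fresh estimator per depth: set_params would update the attribute
    # but not rebuild the underlying XGBClassifier created in __init__.
    clf = ub.GBDTClassifier(model_type='xgboost', max_depth=depth)
    scores = cross_val_score(clf, X, y, cv=3)
    print(f"max_depth={depth}: mean accuracy {scores.mean():.3f}")
```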
--- /dev/null
+++ unifiedbooster-0.2.0/unifiedbooster/gbdt_regression.py
@@ -0,0 +1,103 @@
+ from .gbdt import GBDT
+ from sklearn.base import RegressorMixin
+ from xgboost import XGBRegressor
+ from catboost import CatBoostRegressor
+ from lightgbm import LGBMRegressor
+
+
+ class GBDTRegressor(GBDT, RegressorMixin):
+     """GBDT Regression model
+
+     Attributes:
+
+         model_type: str
+             the gradient boosting backend: 'xgboost', 'lightgbm' or 'catboost'
+
+         n_estimators: int
+             maximum number of trees that can be built
+
+         learning_rate: float
+             shrinkage rate; used for reducing the gradient step
+
+         max_depth: int
+             maximum tree depth
+
+         rowsample: float
+             subsample ratio of the training instances
+
+         colsample: float
+             percentage of features to use at each node split
+
+         verbose: int
+             controls verbosity (default=0)
+
+         seed: int
+             reproducibility seed
+
+     Examples:
+
+         ```python
+         import unifiedbooster as ub
+         from sklearn.datasets import fetch_california_housing
+         from sklearn.model_selection import train_test_split
+         from sklearn.metrics import mean_squared_error
+
+         # Load dataset
+         housing = fetch_california_housing()
+         X, y = housing.data, housing.target
+
+         # Split dataset into training and testing sets
+         X_train, X_test, y_train, y_test = train_test_split(X, y, test_size=0.2, random_state=42)
+
+         # Initialize the unified regressors (XGBoost and LightGBM shown; CatBoost commented out)
+         regressor1 = ub.GBDTRegressor(model_type='xgboost')
+         #regressor2 = ub.GBDTRegressor(model_type='catboost')
+         regressor3 = ub.GBDTRegressor(model_type='lightgbm')
+
+         # Fit the models
+         regressor1.fit(X_train, y_train)
+         #regressor2.fit(X_train, y_train)
+         regressor3.fit(X_train, y_train)
+
+         # Predict on the test set
+         y_pred1 = regressor1.predict(X_test)
+         #y_pred2 = regressor2.predict(X_test)
+         y_pred3 = regressor3.predict(X_test)
+
+         # Evaluate the models
+         mse1 = mean_squared_error(y_test, y_pred1)
+         #mse2 = mean_squared_error(y_test, y_pred2)
+         mse3 = mean_squared_error(y_test, y_pred3)
+         print(f"Regression Mean Squared Error xgboost: {mse1:.2f}")
+         #print(f"Regression Mean Squared Error catboost: {mse2:.2f}")
+         print(f"Regression Mean Squared Error lightgbm: {mse3:.2f}")
+         ```
+     """
+
+     def __init__(self,
+                  model_type='xgboost',
+                  n_estimators=100,
+                  learning_rate=0.1,
+                  max_depth=3,
+                  rowsample=1.0,
+                  colsample=1.0,
+                  verbose=0,
+                  seed=123,
+                  **kwargs):
+
+         self.type_fit = "regression"
+
+         super().__init__(
+             model_type=model_type,
+             n_estimators=n_estimators,
+             learning_rate=learning_rate,
+             max_depth=max_depth,
+             rowsample=rowsample,
+             colsample=colsample,
+             verbose=verbose,
+             seed=seed,
+             **kwargs
+         )
+
+         if model_type == 'xgboost':
+             self.model = XGBRegressor(**self.params)
+         elif model_type == 'catboost':
+             self.model = CatBoostRegressor(**self.params)
+         elif model_type == 'lightgbm':
+             self.model = LGBMRegressor(**self.params)
+         else:
+             raise ValueError(f"Unknown model_type: {model_type}")
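
Both wrappers forward their trailing `**kwargs` into the backend parameter dict built by `GBDT.__init__`, so backend-specific options remain reachable through the unified interface. A small sketch, using XGBoost's real `tree_method` option as the pass-through example (assumes unifiedbooster 0.2.0):

```python
# Sketch: backend-specific options pass through **kwargs into self.params
# and from there into the wrapped estimator's constructor.
import unifiedbooster as ub

reg = ub.GBDTRegressor(model_type='xgboost', tree_method='hist')
print(reg.params['tree_method'])  # 'hist', forwarded verbatim to XGBRegressor
# Caveat: such kwargs are not returned by get_params(), so they do not
# survive scikit-learn's clone().
```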
--- unifiedbooster-0.1.2/unifiedbooster.egg-info/PKG-INFO
+++ unifiedbooster-0.2.0/unifiedbooster.egg-info/PKG-INFO
@@ -1,7 +1,7 @@
  Metadata-Version: 2.1
  Name: unifiedbooster
- Version: 0.1.2
- Summary: Call R functions from Python
+ Version: 0.2.0
+ Summary: Unified interface for Gradient Boosted Decision Trees
  Home-page: https://github.com/thierrymoudiki/unifiedbooster
  Author: T. Moudiki
  Author-email: thierry.moudiki@gmail.com
@@ -17,9 +17,11 @@ Classifier: Programming Language :: Python :: 3.7
  Classifier: Programming Language :: Python :: 3.8
  Requires-Python: >=3.6
  Requires-Dist: Cython
+ Requires-Dist: numpy
  Requires-Dist: scikit-learn
  Requires-Dist: xgboost
  Requires-Dist: lightgbm
  Requires-Dist: catboost
+ Requires-Dist: GPopt

  Unified interface for Gradient Boosted Decision Trees
--- unifiedbooster-0.1.2/unifiedbooster.egg-info/SOURCES.txt
+++ unifiedbooster-0.2.0/unifiedbooster.egg-info/SOURCES.txt
@@ -1,6 +1,7 @@
  README.md
  setup.py
  unifiedbooster/__init__.py
+ unifiedbooster/gbdt.py
  unifiedbooster/gbdt_classification.py
  unifiedbooster/gbdt_regression.py
  unifiedbooster.egg-info/PKG-INFO
--- unifiedbooster-0.1.2/unifiedbooster.egg-info/requires.txt
+++ unifiedbooster-0.2.0/unifiedbooster.egg-info/requires.txt
@@ -1,5 +1,7 @@
  Cython
+ numpy
  scikit-learn
  xgboost
  lightgbm
  catboost
+ GPopt
--- unifiedbooster-0.1.2/unifiedbooster/gbdt_classification.py
+++ /dev/null
@@ -1,81 +0,0 @@
- from sklearn.base import BaseEstimator, ClassifierMixin
- from xgboost import XGBClassifier
- from catboost import CatBoostClassifier
- from lightgbm import LGBMClassifier
-
-
- class GBDTClassifier(BaseEstimator, ClassifierMixin):
-     def __init__(self, model_type='xgboost',
-                  n_estimators=100,
-                  learning_rate=0.1,
-                  max_depth=3,
-                  subsample=1.0,
-                  verbosity=0,
-                  **kwargs):
-         self.model_type = model_type
-         self.n_estimators = n_estimators
-         self.learning_rate = learning_rate
-         self.max_depth = max_depth
-         self.subsample = subsample
-         self.verbosity = verbosity
-         # xgboost -----
-         # n_estimators
-         # learning_rate
-         # subsample
-         # max_depth
-         # lightgbm -----
-         # n_estimators
-         # learning_rate
-         # bagging_fraction
-         # max_depth
-         # catboost -----
-         # iterations
-         # learning_rate
-         # rsm
-         # depth
-         if self.model_type == "xgboost":
-             self.params = {
-                 'n_estimators': self.n_estimators,
-                 'learning_rate': self.learning_rate,
-                 'subsample': self.subsample,
-                 'max_depth': self.max_depth,
-                 'verbosity': self.verbosity,
-                 **kwargs
-             }
-         elif self.model_type == "lightgbm":
-             verbose = self.verbosity - 1 if self.verbosity == 0 else self.verbosity
-             self.params = {
-                 'n_estimators': self.n_estimators,
-                 'learning_rate': self.learning_rate,
-                 'bagging_fraction': self.subsample,
-                 'max_depth': self.max_depth,
-                 'verbose': verbose,
-                 **kwargs
-             }
-         elif self.model_type == "catboost":
-             self.params = {
-                 'iterations': self.n_estimators,
-                 'learning_rate': self.learning_rate,
-                 'rsm': self.subsample,
-                 'depth': self.max_depth,
-                 'verbose': self.verbosity,
-                 **kwargs
-             }
-
-         if model_type == 'xgboost':
-             self.model = XGBClassifier(**self.params)
-         elif model_type == 'catboost':
-             self.model = CatBoostClassifier(**self.params)
-         elif model_type == 'lightgbm':
-             self.model = LGBMClassifier(**self.params)
-         else:
-             raise ValueError(f"Unknown model_type: {model_type}")
-
-     def fit(self, X, y, **kwargs):
-         return self.model.fit(X, y, **kwargs)
-
-     def predict(self, X):
-         return self.model.predict(X)
-
-     def predict_proba(self, X):
-         return self.model.predict_proba(X)
--- unifiedbooster-0.1.2/unifiedbooster/gbdt_regression.py
+++ /dev/null
@@ -1,78 +0,0 @@
- from sklearn.base import BaseEstimator, RegressorMixin
- from xgboost import XGBRegressor
- from catboost import CatBoostRegressor
- from lightgbm import LGBMRegressor
-
-
- class GBDTRegressor(BaseEstimator, RegressorMixin):
-     def __init__(self, model_type='xgboost',
-                  n_estimators=100,
-                  learning_rate=0.1,
-                  max_depth=3,
-                  subsample=1.0,
-                  verbosity=0,
-                  **kwargs):
-         self.model_type = model_type
-         self.n_estimators = n_estimators
-         self.learning_rate = learning_rate
-         self.max_depth = max_depth
-         self.subsample = subsample
-         self.verbosity = verbosity
-         # xgboost -----
-         # n_estimators
-         # learning_rate
-         # subsample
-         # max_depth
-         # lightgbm -----
-         # n_estimators
-         # learning_rate
-         # bagging_fraction
-         # max_depth
-         # catboost -----
-         # iterations
-         # learning_rate
-         # rsm
-         # depth
-         if self.model_type == "xgboost":
-             self.params = {
-                 'n_estimators': self.n_estimators,
-                 'learning_rate': self.learning_rate,
-                 'subsample': self.subsample,
-                 'max_depth': self.max_depth,
-                 'verbosity': self.verbosity,
-                 **kwargs
-             }
-         elif self.model_type == "lightgbm":
-             verbose = self.verbosity - 1 if self.verbosity == 0 else self.verbosity
-             self.params = {
-                 'n_estimators': self.n_estimators,
-                 'learning_rate': self.learning_rate,
-                 'bagging_fraction': self.subsample,
-                 'max_depth': self.max_depth,
-                 'verbose': verbose,
-                 **kwargs
-             }
-         elif self.model_type == "catboost":
-             self.params = {
-                 'iterations': self.n_estimators,
-                 'learning_rate': self.learning_rate,
-                 'rsm': self.subsample,
-                 'depth': self.max_depth,
-                 'verbose': self.verbosity,
-                 **kwargs
-             }
-
-         if model_type == 'xgboost':
-             self.model = XGBRegressor(**self.params)
-         elif model_type == 'catboost':
-             self.model = CatBoostRegressor(**self.params)
-         elif model_type == 'lightgbm':
-             self.model = LGBMRegressor(**self.params)
-         else:
-             raise ValueError(f"Unknown model_type: {model_type}")
-
-     def fit(self, X, y, **kwargs):
-         return self.model.fit(X, y, **kwargs)
-
-     def predict(self, X):
-         return self.model.predict(X)
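
The removed 0.1.2 wrappers took `subsample` and `verbosity`; 0.2.0 renames them to `rowsample` and `verbose` and adds a separate `colsample` for per-split feature sampling. Note also that 0.1.2 mapped `subsample` to CatBoost's `rsm` (a feature-sampling ratio), whereas 0.2.0 maps `rowsample` to CatBoost's `subsample` and `colsample` to `rsm`. A hypothetical migration sketch:

```python
# Hypothetical migration from 0.1.2 to 0.2.0 (argument renames only).
import unifiedbooster as ub

# 0.1.2:
# clf = ub.GBDTClassifier(model_type='catboost', subsample=0.8, verbosity=1)

# 0.2.0: rowsample replaces subsample (rows); colsample is new (features per split)
clf = ub.GBDTClassifier(model_type='catboost', rowsample=0.8, colsample=0.8, verbose=1)
```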
2 files without changes