PyPI - cv-score-predict - Versions diffs - 0.1.1__tar.gz - Mend

cv-score-predict 0.1.1__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (15) hide show

cv_score_predict-0.1.1/LICENSE +9 -0
cv_score_predict-0.1.1/MANIFEST.in +2 -0
cv_score_predict-0.1.1/PKG-INFO +170 -0
cv_score_predict-0.1.1/README.md +145 -0
cv_score_predict-0.1.1/cv_score_predict/__init__.py +4 -0
cv_score_predict-0.1.1/cv_score_predict/core.py +404 -0
cv_score_predict-0.1.1/cv_score_predict.egg-info/PKG-INFO +170 -0
cv_score_predict-0.1.1/cv_score_predict.egg-info/SOURCES.txt +13 -0
cv_score_predict-0.1.1/cv_score_predict.egg-info/dependency_links.txt +1 -0
cv_score_predict-0.1.1/cv_score_predict.egg-info/requires.txt +6 -0
cv_score_predict-0.1.1/cv_score_predict.egg-info/top_level.txt +2 -0
cv_score_predict-0.1.1/pyproject.toml +61 -0
cv_score_predict-0.1.1/setup.cfg +4 -0
cv_score_predict-0.1.1/tests/test_cv_score_predict.py +44 -0
cv_score_predict-0.1.1/tests/test_regression_no_processor_binary_output.py +27 -0

cv_score_predict-0.1.1/LICENSE ADDED Viewed

@@ -0,0 +1,9 @@
+MIT License
+Copyright (c) 2026 Danu ANDRIES
+Permission is hereby granted, free of charge, to any person obtaining a copy of this software and associated documentation files (the "Software"), to deal in the Software without restriction, including without limitation the rights to use, copy, modify, merge, publish, distribute, sublicense, and/or sell copies of the Software, and to permit persons to whom the Software is furnished to do so, subject to the following conditions:
+The above copyright notice and this permission notice shall be included in all copies or substantial portions of the Software.
+THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.

cv_score_predict-0.1.1/MANIFEST.in ADDED Viewed

	@@ -0,0 +1,2 @@
1	+ exclude .ipynb .txt
2	+ recursive-exclude . catboost

cv_score_predict-0.1.1/PKG-INFO ADDED Viewed

@@ -0,0 +1,170 @@
+Metadata-Version: 2.4
+Name: cv-score-predict
+Version: 0.1.1
+Summary: Cross-validated ensemble prediction with LGBM, XGBoost, and CatBoost — with safe categorical handling, multi-seed averaging, and artifact return.
+Author-email: Danu ANDRIES <danu@andries.lu>
+License: MIT
+Project-URL: Homepage, https://github.com/Karabush/cv-score-predict
+Project-URL: Repository, https://github.com/Karabush/cv-score-predict
+Project-URL: Documentation, https://github.com/Karabush/cv-score-predict#readme
+Keywords: cross-validation,ensemble learning,model averaging,LightGBM,XGBoost,CatBoost,categorical encoding,OrdinalEncoder,out-of-fold prediction,OOF,multi-seed CV,repeated cross-validation,early stopping,scikit-learn compatible,pandas,machine learning,classification,regression,model validation,kaggle,safe preprocessing,data leakage prevention,boosting ensemble
+Classifier: Programming Language :: Python :: 3
+Classifier: Intended Audience :: Developers
+Classifier: Intended Audience :: Science/Research
+Classifier: Topic :: Scientific/Engineering :: Artificial Intelligence
+Requires-Python: >=3.9
+Description-Content-Type: text/markdown
+License-File: LICENSE
+Requires-Dist: numpy>=1.21
+Requires-Dist: pandas>=1.3
+Requires-Dist: scikit-learn>=1.4
+Requires-Dist: lightgbm>=3.3
+Requires-Dist: xgboost>=1.7
+Requires-Dist: catboost>=1.2
+Dynamic: license-file
+# cv-score-predict
+A robust utility for **cross-validated ensemble prediction** with LightGBM, XGBoost and CatBoost. Handles categorical features safely, supports custom preprocessing pipelines, repeated CV over multiple seeds, early stopping, and returns out-of-fold (OOF) predictions, test predictions, trained models, and fitted encoder — all in one call.
+Designed for **kagglers, ML engineers, and data scientists** who need reliable, leakage-free CV with minimal boilerplate.
+---
+## ✨ Key Features
+- **Multi-model ensembling**: Train and average predictions from LGBM, XGBoost and CatBoost in a single CV run.
+- **Native categorical support**: Automatically encodes string/categorical columns with `OrdinalEncoder` and configures models (e.g., `cat_features` for CatBoost, `enable_categorical` for XGBoost).
+- **Safe preprocessing**: Integrates any scikit-learn-compatible `processor` pipeline (e.g., `ColumnTransformer`, `Pipeline`) — fitted **per fold** to prevent data leakage.
+- **Repeated CV**: Average results over multiple random seeds for stable metrics.
+- **Early stopping**: Enabled by default for all models using fold-wise validation.
+- **Full artifact return**: Get OOF predictions, test predictions, trained models, and fitted `OrdinalEncoder` for later use.
+---
+## 📥 Parameters
+| Parameter | Type | Default | Description |
+|----------|------|--------|-------------|
+| `X` | `pd.DataFrame` | — | Training features. |
+| `y` | `Union[pd.Series, np.ndarray]` | — | Target values. |
+| `X_test` | `Optional[pd.DataFrame]` | `None` | Test set for final prediction. If `None`, no test predictions are returned. |
+| `pred_type` | `str` | — | Either `'classification'` or `'regression'` (**required**). |
+| `processor` | `Optional[object]` | `None` | Preprocessing pipeline with `fit_transform` and `transform` methods. Must return a `pd.DataFrame` (use `set_output(transform='pandas')`). If `None`, features are passed through unchanged. |
+| `process_categorical` | `bool` | `True` | If `True`, object/category columns are encoded with `OrdinalEncoder` (using `-1` for missing/unseen) and converted to pandas `category` dtype for model compatibility. |
+| `models` | `Union[List[str], str]` | `('lgb', 'xgb', 'cb')` | Models to ensemble. Supported: `'lgb'` (LightGBM), `'xgb'` (XGBoost), `'cb'` (CatBoost). |
+| `params_dict` | `Optional[Dict[str, dict]]` | `None` | Model-specific hyperparameters. Keys: model names; values: param dicts. |
+| `scoring_dict` | `Optional[Dict[str, Callable]]` | `None` | Metrics for evaluation. Keys: metric names; values: scoring functions (e.g., `roc_auc_score`). Defaults: `{'roc_auc': roc_auc_score}` (classification), `{'rmse': rmse_fn}` (regression). |
+| `decision_threshold` | `float` | `0.5` | Threshold to convert probabilities to class labels (classification only). |
+| `n_splits` | `int` | `5` | Number of cross-validation folds. |
+| `random_state` | `Union[int, List[int]]` | `42` | Seed(s) for reproducibility. If a list, CV is repeated for each seed and results are averaged. |
+| `early_stopping_rounds` | `int` | `50` | Early stopping rounds for boosting models (if not overridden in `params_dict`). |
+| `verbose` | `int` | `2` | Logging level: `2` = full per-fold details, `1` = final summary, `0` = silent. |
+| `return_trained` | `bool` | `False` | If `True`, returns list of trained model instances (one per model × fold × seed). |
+| `return_oe` | `bool` | `False` | If `True` and `process_categorical=True`, returns the fitted `OrdinalEncoder`. |
+| `predict_proba` | `bool` | `True` | For classification: if `True`, return probabilities; if `False`, return binary labels (using `decision_threshold`). Ignored for regression. |
+---
+## 🚀 Installation
+```bash
+pip install cv-score-predict
+```
+Requirements:
+* Python ≥ 3.9
+* Dependencies (automatically installed):
+numpy, pandas, scikit-learn ≥1.4, lightgbm, xgboost, catboost
+---
+## 📌 Basic Usage
+```python
+import pandas as pd
+import numpy as np
+from sklearn.preprocessing import StandardScaler
+from sklearn.compose import make_column_transformer
+from cv_score_predict import cv_score_predict
+# Simulate data
+X = pd.DataFrame({
+    "num": [1, 2, 3, 4, 5, 6, 7, 8],
+    "cat": ["A", "B", "A", "C", "B", "A", "C", "D"]
+})
+y = [0, 1, 0, 1, 1, 0, 1, 0]
+X_test = pd.DataFrame({"num": [9, 10], "cat": ["B", "E"]})
+# Optional processor (applied per fold!)
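+processor = make_column_transformer(
+    (StandardScaler(), ["num"]),
+    remainder="passthrough",
+    verbose_feature_names_out=False,  # keep the original column names ("num", "cat")
+).set_output(transform="pandas")  # cv_score_predict requires DataFrame output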
+# Run CV with 3 seeds → results averaged over seeds & folds
+oof_pred, test_pred, _, _ = cv_score_predict(
+    X=X,
+    y=y,
+    X_test=X_test,
+    pred_type="classification",
+    processor=processor,
+    models=["lgb", "xgb"],
+    process_categorical=True,
+    random_state=[42, 123, 999],
+    n_splits=3,
+    verbose=2,
+)
+```
+Output will show scores per seed, then final averaged metrics.
+---
+## 🔧 Advanced Usage: Reuse Artifacts for New Data
+```python
+# Step 1: Run CV and return artifacts
+oof, _, trained_models, oe = cv_score_predict(
+    X,
+    y,
+    X_test=None,  # we'll predict manually
+    pred_type="classification",
+    processor=processor,
+    models=["lgb", "cb"],
+    process_categorical=True,
+    random_state=[42, 123],
+    n_splits=5,
+    return_trained=True,
+    return_oe=True,
+)
+# Step 2: For deployment: refit processor on FULL TRAINING data
+# First: encode categoricals using returned oe
+cat_cols = ["cat"]
+X_full = X.copy()
+X_full[cat_cols] = oe.transform(X_full[cat_cols]).astype('category')
+X_new = pd.DataFrame({"num": [7, 8], "cat": [None, "A"]})
+# Fit processor on full encoded data
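+processor = make_column_transformer(
+    (StandardScaler(), ["num"]),
+    remainder="passthrough",
+    verbose_feature_names_out=False,  # keep the original column names ("num", "cat")
+).set_output(transform="pandas")  # return a DataFrame so category dtypes survive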
+processor.fit(X_full)
+# Apply to new data
+X_new_proc = X_new.copy()
+X_new_proc[cat_cols] = oe.transform(X_new_proc[cat_cols]).astype('category')
+X_new_proc = processor.transform(X_new_proc)
+# Predict with all trained models and average
+preds = [model.predict_proba(X_new_proc)[:, 1] for model in trained_models]
+final_pred = np.mean(preds, axis=0)
+```
+## 📝 Notes
+Categorical columns are encoded with OrdinalEncoder(dtype=np.int32) and converted to category dtype for model compatibility.
+Always use set_output(transform="pandas") in sklearn pipelines to preserve dtypes.
+The processor used in CV is refit on each fold to prevent data leakage, so there is no single global version. For deployment, refit your preprocessing pipeline on the full training set (as shown in the advanced example).
+## 📄 License
+This project is licensed under the MIT License.
+See the LICENSE file for details.

cv_score_predict-0.1.1/README.md ADDED Viewed

@@ -0,0 +1,145 @@
+# cv-score-predict
+A robust utility for **cross-validated ensemble prediction** with LightGBM, XGBoost and CatBoost. Handles categorical features safely, supports custom preprocessing pipelines, repeated CV over multiple seeds, early stopping, and returns out-of-fold (OOF) predictions, test predictions, trained models, and fitted encoder — all in one call.
+Designed for **kagglers, ML engineers, and data scientists** who need reliable, leakage-free CV with minimal boilerplate.
+---
+## ✨ Key Features
+- **Multi-model ensembling**: Train and average predictions from LGBM, XGBoost and CatBoost in a single CV run.
+- **Native categorical support**: Automatically encodes string/categorical columns with `OrdinalEncoder` and configures models (e.g., `cat_features` for CatBoost, `enable_categorical` for XGBoost).
+- **Safe preprocessing**: Integrates any scikit-learn-compatible `processor` pipeline (e.g., `ColumnTransformer`, `Pipeline`) — fitted **per fold** to prevent data leakage.
+- **Repeated CV**: Average results over multiple random seeds for stable metrics.
+- **Early stopping**: Enabled by default for all models using fold-wise validation.
+- **Full artifact return**: Get OOF predictions, test predictions, trained models, and fitted `OrdinalEncoder` for later use.
+---
+## 📥 Parameters
+| Parameter | Type | Default | Description |
+|----------|------|--------|-------------|
+| `X` | `pd.DataFrame` | — | Training features. |
+| `y` | `Union[pd.Series, np.ndarray]` | — | Target values. |
+| `X_test` | `Optional[pd.DataFrame]` | `None` | Test set for final prediction. If `None`, no test predictions are returned. |
+| `pred_type` | `str` | — | Either `'classification'` or `'regression'` (**required**). |
+| `processor` | `Optional[object]` | `None` | Preprocessing pipeline with `fit_transform` and `transform` methods. Must return a `pd.DataFrame` (use `set_output(transform='pandas')`). If `None`, features are passed through unchanged. |
+| `process_categorical` | `bool` | `True` | If `True`, object/category columns are encoded with `OrdinalEncoder` (using `-1` for missing/unseen) and converted to pandas `category` dtype for model compatibility. |
+| `models` | `Union[List[str], str]` | `('lgb', 'xgb', 'cb')` | Models to ensemble. Supported: `'lgb'` (LightGBM), `'xgb'` (XGBoost), `'cb'` (CatBoost). |
+| `params_dict` | `Optional[Dict[str, dict]]` | `None` | Model-specific hyperparameters. Keys: model names; values: param dicts. |
+| `scoring_dict` | `Optional[Dict[str, Callable]]` | `None` | Metrics for evaluation. Keys: metric names; values: scoring functions (e.g., `roc_auc_score`). Defaults: `{'roc_auc': roc_auc_score}` (classification), `{'rmse': rmse_fn}` (regression). |
+| `decision_threshold` | `float` | `0.5` | Threshold to convert probabilities to class labels (classification only). |
+| `n_splits` | `int` | `5` | Number of cross-validation folds. |
+| `random_state` | `Union[int, List[int]]` | `42` | Seed(s) for reproducibility. If a list, CV is repeated for each seed and results are averaged. |
+| `early_stopping_rounds` | `int` | `50` | Early stopping rounds for boosting models (if not overridden in `params_dict`). |
+| `verbose` | `int` | `2` | Logging level: `2` = full per-fold details, `1` = final summary, `0` = silent. |
+| `return_trained` | `bool` | `False` | If `True`, returns list of trained model instances (one per model × fold × seed). |
+| `return_oe` | `bool` | `False` | If `True` and `process_categorical=True`, returns the fitted `OrdinalEncoder`. |
+| `predict_proba` | `bool` | `True` | For classification: if `True`, return probabilities; if `False`, return binary labels (using `decision_threshold`). Ignored for regression. |
+---
+## 🚀 Installation
+```bash
+pip install cv-score-predict
+```
+Requirements:
+* Python ≥ 3.9
+* Dependencies (automatically installed):
+numpy, pandas, scikit-learn ≥1.4, lightgbm, xgboost, catboost
+---
+## 📌 Basic Usage
+```python
+import pandas as pd
+import numpy as np
+from sklearn.preprocessing import StandardScaler
+from sklearn.compose import make_column_transformer
+from cv_score_predict import cv_score_predict
+# Simulate data
+X = pd.DataFrame({
+    "num": [1, 2, 3, 4, 5, 6, 7, 8],
+    "cat": ["A", "B", "A", "C", "B", "A", "C", "D"]
+})
+y = [0, 1, 0, 1, 1, 0, 1, 0]
+X_test = pd.DataFrame({"num": [9, 10], "cat": ["B", "E"]})
+# Optional processor (applied per fold!)
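+processor = make_column_transformer(
+    (StandardScaler(), ["num"]),
+    remainder="passthrough",
+    verbose_feature_names_out=False,  # keep the original column names ("num", "cat")
+).set_output(transform="pandas")  # cv_score_predict requires DataFrame output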
+# Run CV with 3 seeds → results averaged over seeds & folds
+oof_pred, test_pred, _, _ = cv_score_predict(
+    X=X,
+    y=y,
+    X_test=X_test,
+    pred_type="classification",
+    processor=processor,
+    models=["lgb", "xgb"],
+    process_categorical=True,
+    random_state=[42, 123, 999],
+    n_splits=3,
+    verbose=2,
+)
+```
+Output will show scores per seed, then final averaged metrics.
+---
+## 🔧 Advanced Usage: Reuse Artifacts for New Data
+```python
+# Step 1: Run CV and return artifacts
+oof, _, trained_models, oe = cv_score_predict(
+    X,
+    y,
+    X_test=None,  # we'll predict manually
+    pred_type="classification",
+    processor=processor,
+    models=["lgb", "cb"],
+    process_categorical=True,
+    random_state=[42, 123],
+    n_splits=5,
+    return_trained=True,
+    return_oe=True,
+)
+# Step 2: For deployment: refit processor on FULL TRAINING data
+# First: encode categoricals using returned oe
+cat_cols = ["cat"]
+X_full = X.copy()
+X_full[cat_cols] = oe.transform(X_full[cat_cols]).astype('category')
+X_new = pd.DataFrame({"num": [7, 8], "cat": [None, "A"]})
+# Fit processor on full encoded data
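+processor = make_column_transformer(
+    (StandardScaler(), ["num"]),
+    remainder="passthrough",
+    verbose_feature_names_out=False,  # keep the original column names ("num", "cat")
+).set_output(transform="pandas")  # return a DataFrame so category dtypes survive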
+processor.fit(X_full)
+# Apply to new data
+X_new_proc = X_new.copy()
+X_new_proc[cat_cols] = oe.transform(X_new_proc[cat_cols]).astype('category')
+X_new_proc = processor.transform(X_new_proc)
+# Predict with all trained models and average
+preds = [model.predict_proba(X_new_proc)[:, 1] for model in trained_models]
+final_pred = np.mean(preds, axis=0)
+```
+## 📝 Notes
+Categorical columns are encoded with OrdinalEncoder(dtype=np.int32) and converted to category dtype for model compatibility.
+Always use set_output(transform="pandas") in sklearn pipelines to preserve dtypes.
+The processor used in CV is refit on each fold to prevent data leakage, so there is no single global version. For deployment, refit your preprocessing pipeline on the full training set (as shown in the advanced example).
+## 📄 License
+This project is licensed under the MIT License.
+See the LICENSE file for details.

cv_score_predict-0.1.1/cv_score_predict/__init__.py ADDED Viewed

@@ -0,0 +1,4 @@
+from .core import cv_score_predict
+__version__ = "0.1.0"
+__all__ = ["cv_score_predict"]

cv_score_predict-0.1.1/cv_score_predict/core.py ADDED Viewed

@@ -0,0 +1,404 @@
+from typing import (
+    Union, List, Dict, Tuple, Optional, Callable, Any, Literal, TypeVar
+)
+import numpy as np
+import pandas as pd
+import lightgbm as lgb
+import xgboost as xgb
+import catboost as cb
+from sklearn.model_selection import StratifiedKFold, KFold
+from sklearn.metrics import roc_auc_score, mean_squared_error
+from sklearn.preprocessing import OrdinalEncoder
+from sklearn.base import BaseEstimator, TransformerMixin
+# Type aliases
+ModelKey = Literal['lgb', 'xgb', 'cb']  # short keys for LightGBM, XGBoost and CatBoost
+PredictionType = Literal['classification', 'regression']  # accepted values of `pred_type`
+def cv_score_predict(
+    X: pd.DataFrame,
+    y: Union[pd.Series, np.ndarray],
+    X_test: Optional[pd.DataFrame] = None,
+    pred_type: PredictionType = None,  # 'classification' or 'regression' (mandatory)
+    processor: Optional[Union[BaseEstimator, TransformerMixin]] = None,
+    process_categorical: bool = True,
+    models: Union[List[ModelKey], ModelKey] = ('lgb', 'xgb', 'cb'),
+    params_dict: Optional[Dict[str, dict]] = None,
+    scoring_dict: Optional[Dict[str, Callable]] = None,
+    decision_threshold: float = 0.5,
+    n_splits: int = 5,
+    random_state: Union[int, List[int]] = 42,
+    early_stopping_rounds: int = 50,
+    verbose: int = 2,
+    return_trained: bool = False,
+    return_oe: bool = False,
+    predict_proba: bool = True,
+) -> Tuple[np.ndarray, Optional[np.ndarray], Optional[List[Any]], Optional[OrdinalEncoder]]:
+    """
+    Cross-validate supported estimators (optionally repeated over multiple seeds),
+    collect out‑of‑fold (OOF) predictions for scoring, and produce averaged
+    test‑set predictions for final use. Accepts a scikit‑learn style processor
+    pipeline to apply on each fold.
+    Important behavior
+    ------------------
+    - Early stopping: estimators are trained with early stopping on each fold's
+      validation set. Final test predictions (when `X_test` is provided) are
+      produced by the early‑stopped estimators from each fold and averaged.
+    - Processor contract: if a `processor` is provided it **must** return a
+      pandas DataFrame from `.fit_transform` and `.transform`. To guarantee
+      this, call `pipeline.set_output(transform='pandas')`. This preserves
+      column names and dtypes (including `category`) required by some models.
+    Parameters
+    ----------
+    X : pd.DataFrame
+        Training features.
+    y : pd.Series or np.ndarray
+        Target values.
+    X_test : pd.DataFrame or None, optional
+        Final test set to predict. If None, no test predictions are produced.
+    pred_type : str
+        Either 'classification' or 'regression'.
+    processor : object or None, optional
+        Preprocessing pipeline with `fit_transform` and `transform` methods.
+        Must return a pandas DataFrame.
+    process_categorical : bool, default True
+        If True, object/category columns are encoded using an OrdinalEncoder
+        fitted on the training DataFrame only (no leakage), then converted to
+        pandas `category` dtype so libraries that auto‑detect categories work
+        correctly. If False, the user is responsible for categorical handling
+        (for example, inside `processor`).
+    models : list or str, default ('lgb', 'xgb', 'cb')
+        Model keys to train. Supported values: 'lgb', 'xgb', 'cb'.
+    params_dict : dict or None, optional
+        Mapping `model_name -> dict` of model parameters. If None, sensible
+        defaults are used. Per‑model entries override top‑level defaults.
+    scoring_dict : dict or None, optional
+        Mapping `metric_name -> callable(y_true, y_pred_or_proba)`. If None,
+        defaults are provided (classification: ROC AUC; regression: RMSE).
+    decision_threshold : float, default 0.5
+        Threshold to convert probabilities to class labels for threshold‑based metrics.
+    n_splits : int, default 5
+        Number of CV folds.
+    random_state : int or list of ints, default 42
+        Single seed or list of seeds to repeat CV. Results are averaged across seeds.
+    early_stopping_rounds : int, default 50
+        Default early stopping rounds used when model params do not override it.
+    verbose : int, default 2
+        2 prints detailed per‑fold/per‑model scores,
+        1 prints only final averaged scores,
+        0 prints nothing.
+    return_trained : bool, default False
+        If True, return the list of trained estimator instances (one per model
+        per fold per seed). If False (default), trained estimators are not
+        accumulated and `None` is returned in that position to save memory.
+    return_oe : bool, default False
+        If True, return the fitted `OrdinalEncoder` instance (or None if no
+        categorical processing was performed). Returning `oe` lets the user
+        reproduce categorical encoding on new raw data; the user must still
+        apply the same `processor` (if used) before applying `oe` and predicting.
+    predict_proba : bool, default True
+        For classification: if True return probabilities; if False return binary
+        labels using `decision_threshold`. Ignored for regression.
+    Returns
+    -------
+    oof_preds_total : np.ndarray
+        Averaged out‑of‑fold predictions (probabilities for classification when
+        `predict_proba=True`, otherwise binary labels for classification;
+        predictions for regression).
+    test_preds_total : np.ndarray or None
+        Averaged test‑set predictions across folds and seeds, or None if
+        `X_test` is None.
+    trained_models_or_none : list or None
+        If `return_trained=True`, the list of trained model instances (order preserved).
+        Otherwise None.
+    oe_or_none : OrdinalEncoder or None
+        The fitted `OrdinalEncoder` if `return_oe=True` and categorical processing
+        was performed; otherwise None.
+    """
+    # Input Validation
+    if pred_type not in ('classification', 'regression'):
+        raise ValueError("pred_type must be 'classification' or 'regression'")
+    if models is None:
+        raise ValueError("`models` cannot be None.")
+    if isinstance(models, str):
+        models = [models]
+    allowed = {'lgb', 'xgb', 'cb'}
+    for m in models:
+        if m not in allowed:
+            raise ValueError(f"Unsupported model '{m}'. Allowed: {allowed}")
+    if isinstance(random_state, int):
+        random_states = [random_state]
+    else:
+        random_states = list(random_state)
+    if X_test is not None and len(X_test) == 0:
+        raise ValueError("`X_test` must not be empty if provided.")
+    if len(X) != len(y):
+        raise ValueError("`X` and `y` must have the same number of samples.")
+    # Default scoring
+    if scoring_dict is None:
+        if pred_type == 'classification':
+            scoring_dict = {'roc_auc': roc_auc_score}
+        else:
+            scoring_dict = {'rmse': lambda y_true, y_pred: float(np.sqrt(mean_squared_error(y_true, y_pred)))}
+    # Default parameters
+    if params_dict is None:
+        params_dict = {m: {} for m in models}
+    else:
+        for m in models:
+            params_dict.setdefault(m, {})
+    # Processor fallback (identity)
+    class _IdentityProcessor:
+        def fit_transform(self, X, y=None): return X
+        def transform(self, X): return X
+    if processor is None:
+        processor = _IdentityProcessor()
+    elif not hasattr(processor, 'fit_transform') or not hasattr(processor, 'transform'):
+        raise TypeError("`processor` must have `fit_transform` and `transform` methods.")
+    # Defensive Copies
+    X = X.copy().reset_index(drop=True)
+    y = pd.Series(y).copy().reset_index(drop=True) if isinstance(y, (pd.Series, np.ndarray)) else np.asarray(y)
+    if X_test is not None:
+        X_test = X_test.copy().reset_index(drop=True)
+    # Categorical handling
+    cat_cols = X.select_dtypes(include=['object', 'category']).columns.tolist()
+    ordinal_encoder: Optional[OrdinalEncoder] = None
+    if cat_cols and process_categorical:
+        oe = OrdinalEncoder(
+        dtype=np.int32,
+        handle_unknown='use_encoded_value',
+        unknown_value=-1,
+        encoded_missing_value=-1,
+        ).set_output(transform='pandas')
+        X[cat_cols] = oe.fit_transform(X[cat_cols]).astype('category')
+        if X_test is not None:
+            X_test[cat_cols] = oe.transform(X_test[cat_cols]).astype('category')
+        ordinal_encoder = oe
+        # Set model-specific categorical flags
+        for m in models:
+            if m == 'xgb':
+                params_dict['xgb']['enable_categorical'] = True
+            elif m == 'cb':
+                params_dict['cb']['cat_features'] = cat_cols
+    # Prepare result containers
+    n_samples = len(X)
+    test_n = len(X_test) if X_test is not None else 0
+    oof_preds_total = np.zeros(n_samples, dtype=np.float64)
+    test_preds_total = np.zeros(test_n, dtype=np.float64) if X_test is not None else None
+    trained_models_list: List[Any] = [] if return_trained else None
+    # CV results storage
+    cv_results = {
+        'stacked': {name: [] for name in scoring_dict.keys()},
+        'per_model': {m: {name: [] for name in scoring_dict.keys()} for m in models},
+        'per_seed': [],
+    }
+    # Helper for controlled printing
+    def _print(msg, level=2):
+        if verbose >= level:
+            print(msg)
+    # Main loop across random states
+    for seed in random_states:
+        _print(f'\n=== Random State {seed} ===', level=2)
+        splitter = (
+            StratifiedKFold(n_splits=n_splits, shuffle=True, random_state=seed)
+            if pred_type == 'classification'
+            else KFold(n_splits=n_splits, shuffle=True, random_state=seed)
+        )
+        oof_preds = np.zeros(n_samples, dtype=float)
+        test_preds = np.zeros(test_n, dtype=float) if X_test is not None else None
+        # Per-seed storage for reporting
+        seed_model_scores = {m: {name: [] for name in scoring_dict.keys()} for m in models}
+        seed_stack_scores = {metric_name: [] for metric_name in scoring_dict.keys()}
+        for fold, (train_idx, val_idx) in enumerate(splitter.split(X, y)):
+            _print(f'\nFold {fold + 1}/{n_splits}', level=2)
+            y = y if isinstance(y, pd.Series) else pd.Series(y)
+            X_train, X_val = X.iloc[train_idx].copy(), X.iloc[val_idx].copy()
+            y_train, y_val = y.iloc[train_idx], y.iloc[val_idx]
+            # Apply processor if provided (fit on fold train only)
+            X_train = processor.fit_transform(X_train, y_train)
+            X_val = processor.transform(X_val)
+            X_test_proc = processor.transform(X_test) if X_test is not None else None
+            # Ensure processor returns DataFrame (so categorical dtypes are preserved)
+            if not isinstance(X_train, pd.DataFrame):
+                raise TypeError("processor.fit_transform must return a pandas DataFrame. "
+                                "Use pipeline.set_output(transform='pandas').")
+            fold_val_preds_list = []
+            fold_test_preds_list = []
+            for model_name in models:
+                p = params_dict.get(model_name, {}).copy()
+                # Train model
+                if model_name == 'lgb':
+                    ModelClass = lgb.LGBMClassifier if pred_type == 'classification' else lgb.LGBMRegressor
+                    p.setdefault('n_estimators', 10000)
+                    p.setdefault('verbosity', -1)
+                    model = ModelClass(**p)
+                    model.fit(
+                        X_train, y_train,
+                        eval_set=[(X_val, y_val)],
+                        callbacks=[lgb.early_stopping(early_stopping_rounds, verbose=False)]
+                    )
+                elif model_name in ['xgb', 'cb']:
+                    p.setdefault('early_stopping_rounds', early_stopping_rounds)
+                    if model_name == 'xgb':
+                        ModelClass = xgb.XGBClassifier if pred_type == 'classification' else xgb.XGBRegressor
+                        p.setdefault('n_estimators', 10000)
+                    else:
+                        ModelClass = cb.CatBoostClassifier if pred_type == 'classification' else cb.CatBoostRegressor
+                        p.setdefault('iterations', 10000)
+                    model = ModelClass(**p)
+                    model.fit(X_train, y_train, eval_set=[(X_val, y_val)], verbose=False)
+                # Append trained model instance only if requested
+                if return_trained:
+                    trained_models_list.append(model)
+                # Predictions
+                if pred_type == 'classification':
+                    # Prefer predict_proba; if user requested binary output at top-level,
+                    # we still compute probabilities here and convert later if needed
+                    val_preds = model.predict_proba(X_val)[:, 1]
+                    test_fold_preds = model.predict_proba(X_test_proc)[:, 1] if X_test_proc is not None else None
+                else:  # regression
+                    val_preds = model.predict(X_val)
+                    test_fold_preds = model.predict(X_test_proc) if X_test_proc is not None else None
+                fold_val_preds_list.append(val_preds)
+                if X_test is not None:
+                    fold_test_preds_list.append(test_fold_preds)
+                # Score individual model on this fold
+                if pred_type == 'classification':
+                    val_binary = (val_preds >= decision_threshold).astype(int)
+                    for metric_name, scoring_fn in scoring_dict.items():
+                        name_l = metric_name.lower()
+                        if any(k in name_l for k in ('roc', 'auc', 'logloss', 'log_loss')):
+                            score = scoring_fn(y_val, val_preds)
+                        else:
+                            score = scoring_fn(y_val, val_binary)
+                        cv_results['per_model'][model_name][metric_name].append(score)
+                        seed_model_scores[model_name][metric_name].append(score)
+                        _print(f'  {model_name.upper()} {metric_name}: {score:.5f}', level=2)
+                else:
+                    for metric_name, scoring_fn in scoring_dict.items():
+                        score = scoring_fn(y_val, val_preds)
+                        cv_results['per_model'][model_name][metric_name].append(score)
+                        seed_model_scores[model_name][metric_name].append(score)
+                        _print(f'  {model_name.upper()} {metric_name}: {score:.5f}', level=2)
+            # Aggregate fold predictions (average across models)
+            fold_val_preds = np.mean(np.vstack(fold_val_preds_list), axis=0)
+            fold_test_preds = np.mean(np.vstack(fold_test_preds_list), axis=0) if X_test is not None else None
+            # Fill OOF and accumulate test preds
+            oof_preds[val_idx] = fold_val_preds
+            if X_test is not None:
+                test_preds += fold_test_preds / n_splits
+            # Score stacked prediction
+            if pred_type == 'classification':
+                fold_val_binary = (fold_val_preds >= decision_threshold).astype(int)
+                for metric_name, scoring_fn in scoring_dict.items():
+                    name_l = metric_name.lower()
+                    if any(k in name_l for k in ('roc', 'auc', 'logloss', 'log_loss')):
+                        stacked_score = scoring_fn(y_val, fold_val_preds)
+                    else:
+                        stacked_score = scoring_fn(y_val, fold_val_binary)
+                    cv_results['stacked'][metric_name].append(stacked_score)
+                    seed_stack_scores[metric_name].append(stacked_score)
+                    _print(f'  Stacked {metric_name}: {stacked_score:.5f}', level=2)
+            else:
+                for metric_name, scoring_fn in scoring_dict.items():
+                    stacked_score = scoring_fn(y_val, fold_val_preds)
+                    cv_results['stacked'][metric_name].append(stacked_score)
+                    seed_stack_scores[metric_name].append(stacked_score)
+                    _print(f'  Stacked {metric_name}: {stacked_score:.5f}', level=2)
+        # --- End of folds for this seed ---
+        # Accumulate across seeds
+        oof_preds_total += oof_preds / len(random_states)
+        if X_test is not None:
+            test_preds_total += test_preds / len(random_states)
+        # Print per-model means (seed)
+        _print(f'\nSeed {seed} mean scores:', level=2)
+        for model_name in models:
+            for metric_name, vals in seed_model_scores[model_name].items():
+                mean_val = float(np.mean(vals)) if vals else float('nan')
+                _print(f'  {model_name.upper()} {metric_name}: {mean_val:.5f}', level=2)
+        # Print stacked mean scores (seed)
+        seed_mean_scores = {k: float(np.mean(v)) for k, v in seed_stack_scores.items()}
+        for metric_name, score in seed_mean_scores.items():
+            _print(f'  Stacked {metric_name}: {score:.5f}', level=2)
+    # Final summary print
+    if verbose >= 1:
+        print('\n' + '=' * 30)
+        print('=== CV Results Summary ===\n')
+        print('Mean CV Scores per Model:')
+        for model_name in models:
+            print(f'\n--- {model_name.upper()} ---')
+            for metric_name, scores in cv_results['per_model'][model_name].items():
+                print(f'  {metric_name}: {np.mean(scores):.5f}')
+        print('\nMean Stacked CV Scores:')
+        for metric_name, scores in cv_results['stacked'].items():
+            print(f'  {metric_name}: {np.mean(scores):.5f}')
+    # Post-process outputs for classification when predict_proba flag is False
+    if pred_type == 'classification' and not predict_proba:
+        # Convert averaged probabilities to binary labels using decision_threshold
+        oof_preds_total = (oof_preds_total >= decision_threshold).astype(int)
+        if test_preds_total is not None:
+            test_preds_total = (test_preds_total >= decision_threshold).astype(int)
+    # Prepare return values
+    test_preds_return = test_preds_total if X_test is not None else None
+    trained_return = trained_models_list if return_trained else None
+    oe_return = ordinal_encoder if return_oe else None
+    return oof_preds_total, test_preds_return, trained_return, oe_return

cv_score_predict-0.1.1/cv_score_predict.egg-info/PKG-INFO ADDED Viewed

@@ -0,0 +1,170 @@
+Metadata-Version: 2.4
+Name: cv-score-predict
+Version: 0.1.1
+Summary: Cross-validated ensemble prediction with LGBM, XGBoost, and CatBoost — with safe categorical handling, multi-seed averaging, and artifact return.
+Author-email: Danu ANDRIES <danu@andries.lu>
+License: MIT
+Project-URL: Homepage, https://github.com/Karabush/cv-score-predict
+Project-URL: Repository, https://github.com/Karabush/cv-score-predict
+Project-URL: Documentation, https://github.com/Karabush/cv-score-predict#readme
+Keywords: cross-validation,ensemble learning,model averaging,LightGBM,XGBoost,CatBoost,categorical encoding,OrdinalEncoder,out-of-fold prediction,OOF,multi-seed CV,repeated cross-validation,early stopping,scikit-learn compatible,pandas,machine learning,classification,regression,model validation,kaggle,safe preprocessing,data leakage prevention,boosting ensemble
+Classifier: Programming Language :: Python :: 3
+Classifier: Intended Audience :: Developers
+Classifier: Intended Audience :: Science/Research
+Classifier: Topic :: Scientific/Engineering :: Artificial Intelligence
+Requires-Python: >=3.9
+Description-Content-Type: text/markdown
+License-File: LICENSE
+Requires-Dist: numpy>=1.21
+Requires-Dist: pandas>=1.3
+Requires-Dist: scikit-learn>=1.4
+Requires-Dist: lightgbm>=3.3
+Requires-Dist: xgboost>=1.7
+Requires-Dist: catboost>=1.2
+Dynamic: license-file
+# cv-score-predict
+A robust utility for **cross-validated ensemble prediction** with LightGBM, XGBoost and CatBoost. Handles categorical features safely, supports custom preprocessing pipelines, repeated CV over multiple seeds, early stopping, and returns out-of-fold (OOF) predictions, test predictions, trained models, and fitted encoder — all in one call.
+Designed for **kagglers, ML engineers, and data scientists** who need reliable, leakage-free CV with minimal boilerplate.
+---
+## ✨ Key Features
+- **Multi-model ensembling**: Train and average predictions from LGBM, XGBoost and CatBoost in a single CV run.
+- **Native categorical support**: Automatically encodes string/categorical columns with `OrdinalEncoder` and configures models (e.g., `cat_features` for CatBoost, `enable_categorical` for XGBoost).
+- **Safe preprocessing**: Integrates any scikit-learn-compatible `processor` pipeline (e.g., `ColumnTransformer`, `Pipeline`) — fitted **per fold** to prevent data leakage.
+- **Repeated CV**: Average results over multiple random seeds for stable metrics.
+- **Early stopping**: Enabled by default for all models using fold-wise validation.
+- **Full artifact return**: Get OOF predictions, test predictions, trained models, and fitted `OrdinalEncoder` for later use.
+---
+## 📥 Parameters
+| Parameter | Type | Default | Description |
+|----------|------|--------|-------------|
+| `X` | `pd.DataFrame` | — | Training features. |
+| `y` | `Union[pd.Series, np.ndarray]` | — | Target values. |
+| `X_test` | `Optional[pd.DataFrame]` | `None` | Test set for final prediction. If `None`, no test predictions are returned. |
+| `pred_type` | `str` | — | Either `'classification'` or `'regression'` (**required**). |
+| `processor` | `Optional[object]` | `None` | Preprocessing pipeline with `fit_transform` and `transform` methods. Must return a `pd.DataFrame` (use `set_output(transform='pandas')`). If `None`, features are passed through unchanged. |
+| `process_categorical` | `bool` | `True` | If `True`, object/category columns are encoded with `OrdinalEncoder` (using `-1` for missing/unseen) and converted to pandas `category` dtype for model compatibility. |
+| `models` | `Union[List[str], str]` | `('lgb', 'xgb', 'cb')` | Models to ensemble. Supported: `'lgb'` (LightGBM), `'xgb'` (XGBoost), `'cb'` (CatBoost). |
+| `params_dict` | `Optional[Dict[str, dict]]` | `None` | Model-specific hyperparameters. Keys: model names; values: param dicts. |
+| `scoring_dict` | `Optional[Dict[str, Callable]]` | `None` | Metrics for evaluation. Keys: metric names; values: scoring functions (e.g., `roc_auc_score`). Defaults: `{'roc_auc': roc_auc_score}` (classification), `{'rmse': rmse_fn}` (regression). |
+| `decision_threshold` | `float` | `0.5` | Threshold to convert probabilities to class labels (classification only). |
+| `n_splits` | `int` | `5` | Number of cross-validation folds. |
+| `random_state` | `Union[int, List[int]]` | `42` | Seed(s) for reproducibility. If a list, CV is repeated for each seed and results are averaged. |
+| `early_stopping_rounds` | `int` | `50` | Early stopping rounds for boosting models (if not overridden in `params_dict`). |
+| `verbose` | `int` | `2` | Logging level: `2` = full per-fold details, `1` = final summary, `0` = silent. |
+| `return_trained` | `bool` | `False` | If `True`, returns list of trained model instances (one per model × fold × seed). |
+| `return_oe` | `bool` | `False` | If `True` and `process_categorical=True`, returns the fitted `OrdinalEncoder`. |
+| `predict_proba` | `bool` | `True` | For classification: if `True`, return probabilities; if `False`, return binary labels (using `decision_threshold`). Ignored for regression. |
+---
+## 🚀 Installation
+```bash
+pip install cv-score-predict
+```
+Requirements:
+* Python ≥ 3.9
+* Dependencies (automatically installed):
+numpy, pandas, scikit-learn ≥1.4, lightgbm, xgboost, catboost
+---
+## 📌 Basic Usage
+```python
+import pandas as pd
+import numpy as np
+from sklearn.preprocessing import StandardScaler
+from sklearn.compose import make_column_transformer
+from cv_score_predict import cv_score_predict
+# Simulate data
+X = pd.DataFrame({
+    "num": [1, 2, 3, 4, 5, 6, 7, 8],
+    "cat": ["A", "B", "A", "C", "B", "A", "C", "D"]
+})
+y = [0, 1, 0, 1, 1, 0, 1, 0]
+X_test = pd.DataFrame({"num": [9, 10], "cat": ["B", "E"]})
+# Optional processor (applied per fold!)
+processor = make_column_transformer(
+    (StandardScaler(), ["num"]),
+    remainder="passthrough"
+)
+# Run CV with 3 seeds → results averaged over seeds & folds
+oof_pred, test_pred, _, _ = cv_score_predict(
+    X=X,
+    y=y,
+    X_test=X_test,
+    pred_type="classification",
+    processor=processor,
+    models=["lgb", "xgb"],
+    process_categorical=True,
+    random_state=[42, 123, 999],
+    n_splits=3,
+    verbose=2,
+)
+```
+Output will show scores per seed, then final averaged metrics.
+---
+## 🔧 Advanced Usage: Reuse Artifacts for New Data
+```python
+# Step 1: Run CV and return artifacts
+oof, _, trained_models, oe = cv_score_predict(
+    X,
+    y,
+    X_test=None,  # we'll predict manually
+    pred_type="classification",
+    processor=processor,
+    models=["lgb", "cb"],
+    process_categorical=True,
+    random_state=[42, 123],
+    n_splits=5,
+    return_trained=True,
+    return_oe=True,
+)
+# Step 2: For deployment, refit the processor on the FULL TRAINING data
+# First: encode categoricals using returned oe
+cat_cols = ["cat"]
+X_full = X.copy()
+X_full[cat_cols] = oe.transform(X_full[cat_cols]).astype('category')
+X_new = pd.DataFrame({"num": [7, 8], "cat": [None, "A"]})
+# Fit processor on full encoded data
+processor = make_column_transformer(
+    (StandardScaler(), ["num"]),
+    remainder="passthrough"
+)
+processor.fit(X_full)
+# Apply to new data
+X_new_proc = X_new.copy()
+X_new_proc[cat_cols] = oe.transform(X_new_proc[cat_cols]).astype('category')
+X_new_proc = processor.transform(X_new_proc)
+# Predict with all trained models and average
+preds = [model.predict_proba(X_new_proc)[:, 1] for model in trained_models]
+final_pred = np.mean(preds, axis=0)
+```
+## 📝 Notes
+Categorical columns are encoded with OrdinalEncoder(dtype=np.int32) and converted to category dtype for model compatibility.
+Always use set_output(transform="pandas") in sklearn pipelines to preserve dtypes.
+The processor used in CV is refit on each fold to prevent data leakage, so there is no single global version. For deployment, refit your preprocessing pipeline on the full training set (as shown in the advanced example).
+## 📄 License
+This project is licensed under the MIT License.
+See the LICENSE file for details.

cv_score_predict-0.1.1/cv_score_predict.egg-info/SOURCES.txt ADDED Viewed

@@ -0,0 +1,13 @@
+LICENSE
+MANIFEST.in
+README.md
+pyproject.toml
+cv_score_predict/__init__.py
+cv_score_predict/core.py
+cv_score_predict.egg-info/PKG-INFO
+cv_score_predict.egg-info/SOURCES.txt
+cv_score_predict.egg-info/dependency_links.txt
+cv_score_predict.egg-info/requires.txt
+cv_score_predict.egg-info/top_level.txt
+tests/test_cv_score_predict.py
+tests/test_regression_no_processor_binary_output.py

cv_score_predict-0.1.1/cv_score_predict.egg-info/dependency_links.txt ADDED Viewed

	@@ -0,0 +1 @@
1	+

cv_score_predict-0.1.1/cv_score_predict.egg-info/requires.txt ADDED Viewed

@@ -0,0 +1,6 @@
+numpy>=1.21
+pandas>=1.3
+scikit-learn>=1.4
+lightgbm>=3.3
+xgboost>=1.7
+catboost>=1.2

cv_score_predict-0.1.1/cv_score_predict.egg-info/top_level.txt ADDED Viewed

	@@ -0,0 +1,2 @@
1	+ cv_score_predict
2	+ dist

cv_score_predict-0.1.1/pyproject.toml ADDED Viewed

@@ -0,0 +1,61 @@
+[build-system]
+requires = ["setuptools>=70.0", "wheel"]
+build-backend = "setuptools.build_meta"
+[project]
+name = "cv-score-predict"
+version = "0.1.1"
+description = "Cross-validated ensemble prediction with LGBM, XGBoost, and CatBoost — with safe categorical handling, multi-seed averaging, and artifact return."
+readme = "README.md"
+requires-python = ">=3.9"
+license = { text = "MIT" }
+authors = [
+    { name = "Danu ANDRIES", email = "danu@andries.lu" },
+]
+classifiers = [
+    "Programming Language :: Python :: 3",
+    "Intended Audience :: Developers",
+    "Intended Audience :: Science/Research",
+    "Topic :: Scientific/Engineering :: Artificial Intelligence",
+]
+dependencies = [
+    "numpy>=1.21",
+    "pandas>=1.3",
+    "scikit-learn>=1.4",
+    "lightgbm>=3.3",
+    "xgboost>=1.7",
+    "catboost>=1.2"
+]
+keywords = [
+    "cross-validation",
+    "ensemble learning",
+    "model averaging",
+    "LightGBM",
+    "XGBoost",
+    "CatBoost",
+    "categorical encoding",
+    "OrdinalEncoder",
+    "out-of-fold prediction",
+    "OOF",
+    "multi-seed CV",
+    "repeated cross-validation",
+    "early stopping",
+    "scikit-learn compatible",
+    "pandas",
+    "machine learning",
+    "classification",
+    "regression",
+    "model validation",
+    "kaggle",
+    "safe preprocessing",
+    "data leakage prevention",
+    "boosting ensemble"
+]
+[tool.setuptools.packages.find]
+exclude = ["tests*", "notebooks*", "temp*", "scripts*", "*catboost*"]
+[project.urls]
+Homepage = "https://github.com/Karabush/cv-score-predict"
+Repository = "https://github.com/Karabush/cv-score-predict"
+Documentation = "https://github.com/Karabush/cv-score-predict#readme"

cv_score_predict-0.1.1/setup.cfg ADDED Viewed

@@ -0,0 +1,4 @@
+[egg_info]
+tag_build =
+tag_date = 0

cv_score_predict-0.1.1/tests/test_cv_score_predict.py ADDED Viewed

@@ -0,0 +1,44 @@
+def test_classification_full_pipeline():
+    """End-to-end classification run with a processor, two models and two seeds.
+
+    Calls ``cv_score_predict`` on a tiny data set (one numeric column, one
+    string column) with a ``ColumnTransformer`` processor, the 'lgb' and 'xgb'
+    models, two seeds and two folds, then checks the output lengths, the
+    probability range of the test predictions, the number of trained models
+    returned, and how the returned encoder maps a category that does not
+    occur in the training frame.
+    """
+    import pandas as pd
+    from sklearn.preprocessing import StandardScaler
+    from sklearn.compose import ColumnTransformer
+    from cv_score_predict import cv_score_predict
+    # Data with one numeric and one categorical (string) column.
+    # NOTE: no missing values are actually present in this fixture.
+    X = pd.DataFrame({
+        "num": [1.0, 2.5, 3.1, 4.8, 5.2, 6.0, 7.3, 8.9],
+        "cat": ["X", "Y", "X", "Z", "Y", "X", "Z", "W"]
+    })
+    y = [0, 1, 0, 1, 1, 0, 1, 0]
+    X_test = pd.DataFrame({"num": [9.1, 10.2], "cat": ["Y", "V"]})  # V is unseen
+    # Scale the numeric column, pass the categorical column through unchanged;
+    # set_output(transform="pandas") makes the transformer return DataFrames.
+    processor = ColumnTransformer([
+        ("num", StandardScaler(), ["num"]),
+        ("cat", "passthrough", ["cat"])
+    ]).set_output(transform="pandas")
+    oof, test_pred, trained, oe = cv_score_predict(
+        X=X,
+        y=y,
+        X_test=X_test,
+        pred_type="classification",
+        processor=processor,
+        process_categorical=True,
+        models=["lgb", "xgb"],
+        random_state=[42, 99],
+        n_splits=2,
+        return_trained=True,
+        return_oe=True,
+        verbose=0
+    )
+    # Assertions: one OOF value per training row, one prediction per test row
+    assert len(oof) == len(X)
+    assert len(test_pred) == len(X_test)
+    assert test_pred.min() >= 0 and test_pred.max() <= 1  # probabilities
+    assert len(trained) == 2 * 2 * 2  # 2 models × 2 folds × 2 seeds
+    assert oe is not None
+    # Check that unseen category 'V' was encoded as -1
+    # NOTE(review): .iloc assumes the returned encoder outputs a DataFrame
+    # (i.e. pandas output is configured on it) — confirm against core.py.
+    X_enc = oe.transform(X_test[["cat"]])
+    assert X_enc.iloc[1, 0] == -1  # 'V' → -1

cv_score_predict-0.1.1/tests/test_regression_no_processor_binary_output.py ADDED Viewed

@@ -0,0 +1,27 @@
+def test_regression_no_processor_binary_output():
+    """Regression run without a processor and with ``predict_proba=False``.
+
+    Calls ``cv_score_predict`` in regression mode on random numeric data with
+    the 'lgb' and 'cb' models, three seeds and three folds, and checks that
+    the OOF and test outputs have the expected lengths and contain ``float``
+    instances (passing ``predict_proba=False`` must not break regression).
+    """
+    import pandas as pd
+    import numpy as np
+    from cv_score_predict import cv_score_predict
+    # Fix the global NumPy seed so the generated fixture is reproducible
+    np.random.seed(0)
+    X = pd.DataFrame(np.random.randn(20, 3), columns=["a", "b", "c"])
+    # Target is the row sum of the features plus a small amount of noise
+    y = X.sum(axis=1) + np.random.randn(20) * 0.1
+    X_test = pd.DataFrame(np.random.randn(5, 3), columns=["a", "b", "c"])
+    oof, test_pred, _, _ = cv_score_predict(
+        X=X,
+        y=y,
+        X_test=X_test,
+        pred_type="regression",
+        processor=None,
+        models=["lgb", "cb"],
+        random_state=[1, 2, 3],  # 3 seeds
+        n_splits=3,
+        predict_proba=False,  # irrelevant for regression, but should not break
+        verbose=0
+    )
+    assert len(oof) == 20
+    assert len(test_pred) == 5
+    # NOTE(review): np.float64 subclasses Python float, so these checks pass
+    # for float64 arrays; presumably the outputs are float64 — confirm.
+    assert isinstance(oof[0], float)
+    assert isinstance(test_pred[0], float)