PyPI - ins-pricing - Versions diffs - 0.4.4__py3-none-any.whl → 0.5.0__py3-none-any.whl - Mend

ins-pricing 0.4.4__py3-none-any.whl → 0.5.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (96)

ins_pricing/README.md +74 -56
ins_pricing/__init__.py +142 -90
ins_pricing/cli/BayesOpt_entry.py +52 -50
ins_pricing/cli/BayesOpt_incremental.py +832 -898
ins_pricing/cli/Explain_Run.py +31 -23
ins_pricing/cli/Explain_entry.py +532 -579
ins_pricing/cli/Pricing_Run.py +31 -23
ins_pricing/cli/bayesopt_entry_runner.py +1440 -1438
ins_pricing/cli/utils/cli_common.py +256 -256
ins_pricing/cli/utils/cli_config.py +375 -375
ins_pricing/cli/utils/import_resolver.py +382 -365
ins_pricing/cli/utils/notebook_utils.py +340 -340
ins_pricing/cli/watchdog_run.py +209 -201
ins_pricing/frontend/README.md +573 -419
ins_pricing/frontend/__init__.py +10 -10
ins_pricing/frontend/config_builder.py +1 -0
ins_pricing/frontend/example_workflows.py +1 -1
ins_pricing/governance/__init__.py +20 -20
ins_pricing/governance/release.py +159 -159
ins_pricing/modelling/README.md +67 -0
ins_pricing/modelling/__init__.py +147 -92
ins_pricing/modelling/bayesopt/README.md +59 -0
ins_pricing/modelling/{core/bayesopt → bayesopt}/__init__.py +64 -102
ins_pricing/modelling/{core/bayesopt → bayesopt}/config_preprocess.py +562 -550
ins_pricing/modelling/{core/bayesopt → bayesopt}/core.py +965 -962
ins_pricing/modelling/{core/bayesopt → bayesopt}/model_explain_mixin.py +296 -296
ins_pricing/modelling/{core/bayesopt → bayesopt}/model_plotting_mixin.py +482 -548
ins_pricing/modelling/{core/bayesopt → bayesopt}/models/__init__.py +27 -27
ins_pricing/modelling/{core/bayesopt → bayesopt}/models/model_ft_trainer.py +915 -913
ins_pricing/modelling/{core/bayesopt → bayesopt}/models/model_gnn.py +788 -785
ins_pricing/modelling/{core/bayesopt → bayesopt}/models/model_resn.py +448 -446
ins_pricing/modelling/bayesopt/trainers/__init__.py +19 -0
ins_pricing/modelling/{core/bayesopt → bayesopt}/trainers/trainer_base.py +1308 -1308
ins_pricing/modelling/{core/bayesopt → bayesopt}/trainers/trainer_ft.py +3 -3
ins_pricing/modelling/{core/bayesopt → bayesopt}/trainers/trainer_glm.py +197 -198
ins_pricing/modelling/{core/bayesopt → bayesopt}/trainers/trainer_gnn.py +344 -344
ins_pricing/modelling/{core/bayesopt → bayesopt}/trainers/trainer_resn.py +283 -283
ins_pricing/modelling/{core/bayesopt → bayesopt}/trainers/trainer_xgb.py +346 -347
ins_pricing/modelling/bayesopt/utils/__init__.py +67 -0
ins_pricing/modelling/bayesopt/utils/constants.py +21 -0
ins_pricing/modelling/bayesopt/utils/io_utils.py +7 -0
ins_pricing/modelling/bayesopt/utils/losses.py +27 -0
ins_pricing/modelling/bayesopt/utils/metrics_and_devices.py +17 -0
ins_pricing/modelling/{core/bayesopt → bayesopt}/utils/torch_trainer_mixin.py +623 -623
ins_pricing/modelling/{core/evaluation.py → evaluation.py} +113 -104
ins_pricing/modelling/explain/__init__.py +55 -55
ins_pricing/modelling/explain/metrics.py +27 -174
ins_pricing/modelling/explain/permutation.py +237 -237
ins_pricing/modelling/plotting/__init__.py +40 -36
ins_pricing/modelling/plotting/compat.py +228 -0
ins_pricing/modelling/plotting/curves.py +572 -572
ins_pricing/modelling/plotting/diagnostics.py +163 -163
ins_pricing/modelling/plotting/geo.py +362 -362
ins_pricing/modelling/plotting/importance.py +121 -121
ins_pricing/pricing/__init__.py +27 -27
ins_pricing/production/__init__.py +35 -25
ins_pricing/production/{predict.py → inference.py} +140 -57
ins_pricing/production/monitoring.py +8 -21
ins_pricing/reporting/__init__.py +11 -11
ins_pricing/setup.py +1 -1
ins_pricing/tests/production/test_inference.py +90 -0
ins_pricing/utils/__init__.py +116 -83
ins_pricing/utils/device.py +255 -255
ins_pricing/utils/features.py +53 -0
ins_pricing/utils/io.py +72 -0
ins_pricing/{modelling/core/bayesopt/utils → utils}/losses.py +125 -129
ins_pricing/utils/metrics.py +158 -24
ins_pricing/utils/numerics.py +76 -0
ins_pricing/utils/paths.py +9 -1
{ins_pricing-0.4.4.dist-info → ins_pricing-0.5.0.dist-info}/METADATA +55 -35
ins_pricing-0.5.0.dist-info/RECORD +131 -0
ins_pricing/CHANGELOG.md +0 -272
ins_pricing/RELEASE_NOTES_0.2.8.md +0 -344
ins_pricing/docs/LOSS_FUNCTIONS.md +0 -78
ins_pricing/docs/modelling/BayesOpt_USAGE.md +0 -945
ins_pricing/docs/modelling/README.md +0 -34
ins_pricing/frontend/QUICKSTART.md +0 -152
ins_pricing/modelling/core/BayesOpt.py +0 -146
ins_pricing/modelling/core/__init__.py +0 -1
ins_pricing/modelling/core/bayesopt/PHASE2_REFACTORING_SUMMARY.md +0 -449
ins_pricing/modelling/core/bayesopt/PHASE3_REFACTORING_SUMMARY.md +0 -406
ins_pricing/modelling/core/bayesopt/REFACTORING_SUMMARY.md +0 -247
ins_pricing/modelling/core/bayesopt/trainers/__init__.py +0 -19
ins_pricing/modelling/core/bayesopt/utils/__init__.py +0 -86
ins_pricing/modelling/core/bayesopt/utils/constants.py +0 -183
ins_pricing/modelling/core/bayesopt/utils/io_utils.py +0 -126
ins_pricing/modelling/core/bayesopt/utils/metrics_and_devices.py +0 -555
ins_pricing/modelling/core/bayesopt/utils.py +0 -105
ins_pricing/modelling/core/bayesopt/utils_backup.py +0 -1503
ins_pricing/tests/production/test_predict.py +0 -233
ins_pricing-0.4.4.dist-info/RECORD +0 -137
/ins_pricing/modelling/{core/bayesopt → bayesopt}/config_components.py +0 -0
/ins_pricing/modelling/{core/bayesopt → bayesopt}/models/model_ft_components.py +0 -0
/ins_pricing/modelling/{core/bayesopt → bayesopt}/utils/distributed_utils.py +0 -0
{ins_pricing-0.4.4.dist-info → ins_pricing-0.5.0.dist-info}/WHEEL +0 -0
{ins_pricing-0.4.4.dist-info → ins_pricing-0.5.0.dist-info}/top_level.txt +0 -0

ins_pricing/modelling/core/bayesopt/utils/metrics_and_devices.py DELETED Viewed

@@ -1,555 +0,0 @@
-"""Metrics computation, GPU management, device selection, CV utilities, and plotting.
-This module contains:
-- get_logger() for package-level logging
-- MetricFactory for consistent metric computation
-- GPUMemoryManager for CUDA memory management (imported from package utils)
-- DeviceManager for device selection and model placement (imported from package utils)
-- CVStrategyResolver for cross-validation strategy selection
-- PlotUtils for lift chart plotting
-- Backward compatibility wrappers for plotting functions
-"""
-from __future__ import annotations
-import gc
-import logging
-import os
-from contextlib import contextmanager
-from functools import lru_cache
-from typing import Any, Dict, List, Optional, Tuple
-import numpy as np
-import pandas as pd
-import torch
-import torch.nn as nn
-from torch.nn.parallel import DistributedDataParallel as DDP
-from sklearn.metrics import log_loss, mean_absolute_error, mean_squared_error, mean_tweedie_deviance
-from sklearn.model_selection import KFold, GroupKFold, TimeSeriesSplit, StratifiedKFold
-# Try to import plotting dependencies
-try:
-    import matplotlib
-    if os.name != "nt" and not os.environ.get("DISPLAY") and not os.environ.get("MPLBACKEND"):
-        matplotlib.use("Agg")
-    import matplotlib.pyplot as plt
-    _MPL_IMPORT_ERROR: Optional[BaseException] = None
-except Exception as exc:
-    matplotlib = None
-    plt = None
-    _MPL_IMPORT_ERROR = exc
-try:
-    from ....plotting import curves as plot_curves_common
-except Exception:
-    try:
-        from ins_pricing.plotting import curves as plot_curves_common
-    except Exception:
-        plot_curves_common = None
-from .constants import EPS
-# Import DeviceManager and GPUMemoryManager from package-level utils
-# (Eliminates ~230 lines of code duplication)
-from ins_pricing.utils import DeviceManager, GPUMemoryManager
-from .io_utils import IOUtils
-# =============================================================================
-# Logging System
-# =============================================================================
-@lru_cache(maxsize=1)
-def _get_package_logger() -> logging.Logger:
-    """Get or create the package-level logger with consistent formatting."""
-    logger = logging.getLogger("ins_pricing")
-    if not logger.handlers:
-        handler = logging.StreamHandler()
-        formatter = logging.Formatter(
-            "[%(levelname)s][%(name)s] %(message)s"
-        )
-        handler.setFormatter(formatter)
-        logger.addHandler(handler)
-        # Default to INFO, can be changed via environment variable
-        level = os.environ.get("INS_PRICING_LOG_LEVEL", "INFO").upper()
-        logger.setLevel(getattr(logging, level, logging.INFO))
-    return logger
-def get_logger(name: str = "ins_pricing") -> logging.Logger:
-    """Get a logger with the given name, inheriting package-level settings.
-    Args:
-        name: Logger name, typically module name like 'ins_pricing.trainer'
-    Returns:
-        Configured logger instance
-    Example:
-        >>> logger = get_logger("ins_pricing.trainer.ft")
-        >>> logger.info("Training started")
-    """
-    _get_package_logger()
-    return logging.getLogger(name)
-# =============================================================================
-# Metric Computation Factory
-# =============================================================================
-class MetricFactory:
-    """Factory for computing evaluation metrics consistently across all trainers.
-    This class centralizes metric computation logic that was previously duplicated
-    across FTTrainer, ResNetTrainer, GNNTrainer, XGBTrainer, and GLMTrainer.
-    Example:
-        >>> factory = MetricFactory(task_type='regression', tweedie_power=1.5)
-        >>> score = factory.compute(y_true, y_pred, sample_weight)
-    """
-    def __init__(
-        self,
-        task_type: str = "regression",
-        tweedie_power: float = 1.5,
-        loss_name: str = "tweedie",
-        clip_min: float = 1e-8,
-        clip_max: float = 1 - 1e-8,
-    ):
-        """Initialize the metric factory.
-        Args:
-            task_type: Either 'regression' or 'classification'
-            tweedie_power: Power parameter for Tweedie deviance (1.0-2.0)
-            loss_name: Regression loss name ('tweedie', 'poisson', 'gamma', 'mse', 'mae')
-            clip_min: Minimum value for clipping predictions
-            clip_max: Maximum value for clipping predictions (for classification)
-        """
-        self.task_type = task_type
-        self.tweedie_power = tweedie_power
-        self.loss_name = loss_name
-        self.clip_min = clip_min
-        self.clip_max = clip_max
-    def compute(
-        self,
-        y_true: np.ndarray,
-        y_pred: np.ndarray,
-        sample_weight: Optional[np.ndarray] = None,
-    ) -> float:
-        """Compute the appropriate metric based on task type.
-        Args:
-            y_true: Ground truth values
-            y_pred: Predicted values
-            sample_weight: Optional sample weights
-        Returns:
-            Computed metric value (lower is better)
-        """
-        y_pred = np.asarray(y_pred)
-        y_true = np.asarray(y_true)
-        if self.task_type == "classification":
-            y_pred_clipped = np.clip(y_pred, self.clip_min, self.clip_max)
-            return float(log_loss(y_true, y_pred_clipped, sample_weight=sample_weight))
-        loss_name = str(self.loss_name or "tweedie").strip().lower()
-        if loss_name in {"mse", "mae"}:
-            if loss_name == "mse":
-                return float(mean_squared_error(
-                    y_true, y_pred, sample_weight=sample_weight))
-            return float(mean_absolute_error(
-                y_true, y_pred, sample_weight=sample_weight))
-        y_pred_safe = np.maximum(y_pred, self.clip_min)
-        power = self.tweedie_power
-        if loss_name == "poisson":
-            power = 1.0
-        elif loss_name == "gamma":
-            power = 2.0
-        return float(mean_tweedie_deviance(
-            y_true,
-            y_pred_safe,
-            sample_weight=sample_weight,
-            power=power,
-        ))
-    def update_power(self, power: float) -> None:
-        """Update the Tweedie power parameter.
-        Args:
-            power: New power value (1.0-2.0)
-        """
-        self.tweedie_power = power
-# =============================================================================
-# GPU Memory Manager and Device Manager
-# =============================================================================
-# NOTE: These classes are imported from ins_pricing.utils (see top of file)
-# This eliminates ~230 lines of duplicate code while maintaining backward compatibility
-# =============================================================================
-# Cross-Validation Strategy Resolver
-# =============================================================================
-class CVStrategyResolver:
-    """Resolver for cross-validation splitting strategies.
-    This class consolidates CV strategy resolution logic that was previously
-    duplicated across trainer_base.py and trainer_ft.py.
-    Supported strategies:
-        - 'random': Standard KFold
-        - 'stratified': StratifiedKFold (for classification)
-        - 'group': GroupKFold (requires group column)
-        - 'time': TimeSeriesSplit (requires time column)
-    Example:
-        >>> resolver = CVStrategyResolver(
-        ...     strategy='group',
-        ...     n_splits=5,
-        ...     group_col='policy_id',
-        ...     data=train_df,
-        ... )
-        >>> splitter, groups = resolver.get_splitter()
-        >>> for train_idx, val_idx in splitter.split(X, y, groups):
-        ...     pass
-    """
-    VALID_STRATEGIES = {"random", "stratified", "group", "grouped", "time", "timeseries", "temporal"}
-    def __init__(
-        self,
-        strategy: str = "random",
-        n_splits: int = 5,
-        shuffle: bool = True,
-        random_state: Optional[int] = None,
-        group_col: Optional[str] = None,
-        time_col: Optional[str] = None,
-        time_ascending: bool = True,
-        data: Optional[pd.DataFrame] = None,
-    ):
-        """Initialize the CV strategy resolver.
-        Args:
-            strategy: CV strategy name
-            n_splits: Number of CV folds
-            shuffle: Whether to shuffle for random/stratified
-            random_state: Random seed for reproducibility
-            group_col: Column name for group-based splitting
-            time_col: Column name for time-based splitting
-            time_ascending: Sort order for time-based splitting
-            data: DataFrame containing group/time columns
-        """
-        self.strategy = strategy.strip().lower()
-        self.n_splits = max(2, int(n_splits))
-        self.shuffle = shuffle
-        self.random_state = random_state
-        self.group_col = group_col
-        self.time_col = time_col
-        self.time_ascending = time_ascending
-        self.data = data
-        if self.strategy not in self.VALID_STRATEGIES:
-            raise ValueError(
-                f"Invalid strategy '{strategy}'. "
-                f"Valid options: {sorted(self.VALID_STRATEGIES)}"
-            )
-    def get_splitter(self) -> Tuple[Any, Optional[pd.Series]]:
-        """Get the appropriate splitter and groups.
-        Returns:
-            Tuple of (splitter, groups) where groups may be None
-        Raises:
-            ValueError: If required columns are missing
-        """
-        if self.strategy in {"group", "grouped"}:
-            return self._get_group_splitter()
-        elif self.strategy in {"time", "timeseries", "temporal"}:
-            return self._get_time_splitter()
-        elif self.strategy == "stratified":
-            return self._get_stratified_splitter()
-        else:
-            return self._get_random_splitter()
-    def _get_random_splitter(self) -> Tuple[KFold, None]:
-        """Get a random KFold splitter."""
-        splitter = KFold(
-            n_splits=self.n_splits,
-            shuffle=self.shuffle,
-            random_state=self.random_state if self.shuffle else None,
-        )
-        return splitter, None
-    def _get_stratified_splitter(self) -> Tuple[StratifiedKFold, None]:
-        """Get a stratified KFold splitter."""
-        splitter = StratifiedKFold(
-            n_splits=self.n_splits,
-            shuffle=self.shuffle,
-            random_state=self.random_state if self.shuffle else None,
-        )
-        return splitter, None
-    def _get_group_splitter(self) -> Tuple[GroupKFold, pd.Series]:
-        """Get a group-based KFold splitter."""
-        if not self.group_col:
-            raise ValueError("group_col is required for group strategy")
-        if self.data is None:
-            raise ValueError("data DataFrame is required for group strategy")
-        if self.group_col not in self.data.columns:
-            raise KeyError(f"group_col '{self.group_col}' not found in data")
-        groups = self.data[self.group_col]
-        splitter = GroupKFold(n_splits=self.n_splits)
-        return splitter, groups
-    def _get_time_splitter(self) -> Tuple[Any, None]:
-        """Get a time-series splitter."""
-        if not self.time_col:
-            raise ValueError("time_col is required for time strategy")
-        if self.data is None:
-            raise ValueError("data DataFrame is required for time strategy")
-        if self.time_col not in self.data.columns:
-            raise KeyError(f"time_col '{self.time_col}' not found in data")
-        splitter = TimeSeriesSplit(n_splits=self.n_splits)
-        # Create an ordered wrapper that sorts by time column
-        order_index = self.data[self.time_col].sort_values(
-            ascending=self.time_ascending
-        ).index
-        order = self.data.index.get_indexer(order_index)
-        return _OrderedSplitter(splitter, order), None
-class _OrderedSplitter:
-    """Wrapper for splitters that need to respect a specific ordering."""
-    def __init__(self, base_splitter, order: np.ndarray):
-        self.base_splitter = base_splitter
-        self.order = order
-    def split(self, X, y=None, groups=None):
-        """Split with ordering applied."""
-        n = len(X)
-        X_ordered = np.arange(n)[self.order]
-        for train_idx, val_idx in self.base_splitter.split(X_ordered):
-            yield self.order[train_idx], self.order[val_idx]
-    def get_n_splits(self, X=None, y=None, groups=None):
-        return self.base_splitter.get_n_splits()
-# =============================================================================
-# Plot Utils
-# =============================================================================
-def _plot_skip(label: str) -> None:
-    """Print message when plot is skipped due to missing matplotlib."""
-    if _MPL_IMPORT_ERROR is not None:
-        print(f"[Plot] Skip {label}: matplotlib unavailable ({_MPL_IMPORT_ERROR}).", flush=True)
-    else:
-        print(f"[Plot] Skip {label}: matplotlib unavailable.", flush=True)
-class PlotUtils:
-    """Plotting utilities for lift charts."""
-    @staticmethod
-    def split_data(data: pd.DataFrame, col_nme: str, wgt_nme: str, n_bins: int = 10) -> pd.DataFrame:
-        """Split data into bins by cumulative weight."""
-        data_sorted = data.sort_values(by=col_nme, ascending=True).copy()
-        data_sorted['cum_weight'] = data_sorted[wgt_nme].cumsum()
-        w_sum = data_sorted[wgt_nme].sum()
-        if w_sum <= EPS:
-            data_sorted['bins'] = 0
-        else:
-            data_sorted['bins'] = np.floor(
-                data_sorted['cum_weight'] * float(n_bins) / w_sum
-            )
-            data_sorted.loc[(data_sorted['bins'] == n_bins),
-                            'bins'] = n_bins - 1
-        return data_sorted.groupby(['bins'], observed=True).sum(numeric_only=True)
-    @staticmethod
-    def plot_lift_ax(ax, plot_data, title, pred_label='Predicted', act_label='Actual', weight_label='Earned Exposure'):
-        """Plot lift chart on given axes."""
-        ax.plot(plot_data.index, plot_data['act_v'],
-                label=act_label, color='red')
-        ax.plot(plot_data.index, plot_data['exp_v'],
-                label=pred_label, color='blue')
-        ax.set_title(title, fontsize=8)
-        ax.set_xticks(plot_data.index)
-        ax.set_xticklabels(plot_data.index, rotation=90, fontsize=6)
-        ax.tick_params(axis='y', labelsize=6)
-        ax.legend(loc='upper left', fontsize=5, frameon=False)
-        ax.margins(0.05)
-        ax2 = ax.twinx()
-        ax2.bar(plot_data.index, plot_data['weight'],
-                alpha=0.5, color='seagreen',
-                label=weight_label)
-        ax2.tick_params(axis='y', labelsize=6)
-        ax2.legend(loc='upper right', fontsize=5, frameon=False)
-    @staticmethod
-    def plot_dlift_ax(ax, plot_data, title, label1, label2, act_label='Actual', weight_label='Earned Exposure'):
-        """Plot double lift chart on given axes."""
-        ax.plot(plot_data.index, plot_data['act_v'],
-                label=act_label, color='red')
-        ax.plot(plot_data.index, plot_data['exp_v1'],
-                label=label1, color='blue')
-        ax.plot(plot_data.index, plot_data['exp_v2'],
-                label=label2, color='black')
-        ax.set_title(title, fontsize=8)
-        ax.set_xticks(plot_data.index)
-        ax.set_xticklabels(plot_data.index, rotation=90, fontsize=6)
-        ax.set_xlabel(f'{label1} / {label2}', fontsize=6)
-        ax.tick_params(axis='y', labelsize=6)
-        ax.legend(loc='upper left', fontsize=5, frameon=False)
-        ax.margins(0.1)
-        ax2 = ax.twinx()
-        ax2.bar(plot_data.index, plot_data['weight'],
-                alpha=0.5, color='seagreen',
-                label=weight_label)
-        ax2.tick_params(axis='y', labelsize=6)
-        ax2.legend(loc='upper right', fontsize=5, frameon=False)
-    @staticmethod
-    def plot_lift_list(pred_model, w_pred_list, w_act_list,
-                       weight_list, tgt_nme, n_bins: int = 10,
-                       fig_nme: str = 'Lift Chart'):
-        """Plot lift chart for model predictions."""
-        if plot_curves_common is not None:
-            save_path = os.path.join(
-                os.getcwd(), 'plot', f'05_{tgt_nme}_{fig_nme}.png')
-            plot_curves_common.plot_lift_curve(
-                pred_model,
-                w_act_list,
-                weight_list,
-                n_bins=n_bins,
-                title=f'Lift Chart of {tgt_nme}',
-                pred_label='Predicted',
-                act_label='Actual',
-                weight_label='Earned Exposure',
-                pred_weighted=False,
-                actual_weighted=True,
-                save_path=save_path,
-                show=False,
-            )
-            return
-        if plt is None:
-            _plot_skip("lift plot")
-            return
-        lift_data = pd.DataFrame({
-            'pred': pred_model,
-            'w_pred': w_pred_list,
-            'act': w_act_list,
-            'weight': weight_list
-        })
-        plot_data = PlotUtils.split_data(lift_data, 'pred', 'weight', n_bins)
-        plot_data['exp_v'] = plot_data['w_pred'] / plot_data['weight']
-        plot_data['act_v'] = plot_data['act'] / plot_data['weight']
-        plot_data.reset_index(inplace=True)
-        fig = plt.figure(figsize=(7, 5))
-        ax = fig.add_subplot(111)
-        PlotUtils.plot_lift_ax(ax, plot_data, f'Lift Chart of {tgt_nme}')
-        plt.subplots_adjust(wspace=0.3)
-        save_path = os.path.join(
-            os.getcwd(), 'plot', f'05_{tgt_nme}_{fig_nme}.png')
-        IOUtils.ensure_parent_dir(save_path)
-        plt.savefig(save_path, dpi=300)
-        plt.close(fig)
-    @staticmethod
-    def plot_dlift_list(pred_model_1, pred_model_2,
-                        model_nme_1, model_nme_2,
-                        tgt_nme,
-                        w_list, w_act_list, n_bins: int = 10,
-                        fig_nme: str = 'Double Lift Chart'):
-        """Plot double lift chart comparing two models."""
-        if plot_curves_common is not None:
-            save_path = os.path.join(
-                os.getcwd(), 'plot', f'06_{tgt_nme}_{fig_nme}.png')
-            plot_curves_common.plot_double_lift_curve(
-                pred_model_1,
-                pred_model_2,
-                w_act_list,
-                w_list,
-                n_bins=n_bins,
-                title=f'Double Lift Chart of {tgt_nme}',
-                label1=model_nme_1,
-                label2=model_nme_2,
-                pred1_weighted=False,
-                pred2_weighted=False,
-                actual_weighted=True,
-                save_path=save_path,
-                show=False,
-            )
-            return
-        if plt is None:
-            _plot_skip("double lift plot")
-            return
-        lift_data = pd.DataFrame({
-            'pred1': pred_model_1,
-            'pred2': pred_model_2,
-            'act': w_act_list,
-            'weight': w_list
-        })
-        lift_data['diff_ly'] = lift_data['pred1'] / lift_data['pred2']
-        lift_data['w_pred1'] = lift_data['pred1'] * lift_data['weight']
-        lift_data['w_pred2'] = lift_data['pred2'] * lift_data['weight']
-        plot_data = PlotUtils.split_data(
-            lift_data, 'diff_ly', 'weight', n_bins)
-        plot_data['exp_v1'] = plot_data['w_pred1'] / plot_data['act']
-        plot_data['exp_v2'] = plot_data['w_pred2'] / plot_data['act']
-        plot_data['act_v'] = plot_data['act']/plot_data['act']
-        plot_data.reset_index(inplace=True)
-        fig = plt.figure(figsize=(7, 5))
-        ax = fig.add_subplot(111)
-        PlotUtils.plot_dlift_ax(
-            ax, plot_data, f'Double Lift Chart of {tgt_nme}', model_nme_1, model_nme_2)
-        plt.subplots_adjust(bottom=0.25, top=0.95, right=0.8)
-        save_path = os.path.join(
-            os.getcwd(), 'plot', f'06_{tgt_nme}_{fig_nme}.png')
-        IOUtils.ensure_parent_dir(save_path)
-        plt.savefig(save_path, dpi=300)
-        plt.close(fig)
-# =============================================================================
-# Backward Compatibility Wrappers
-# =============================================================================
-def split_data(data, col_nme, wgt_nme, n_bins=10):
-    """Legacy function wrapper for PlotUtils.split_data()."""
-    return PlotUtils.split_data(data, col_nme, wgt_nme, n_bins)
-def plot_lift_list(pred_model, w_pred_list, w_act_list,
-                   weight_list, tgt_nme, n_bins=10,
-                   fig_nme='Lift Chart'):
-    """Legacy function wrapper for PlotUtils.plot_lift_list()."""
-    return PlotUtils.plot_lift_list(pred_model, w_pred_list, w_act_list,
-                                    weight_list, tgt_nme, n_bins, fig_nme)
-def plot_dlift_list(pred_model_1, pred_model_2,
-                    model_nme_1, model_nme_2,
-                    tgt_nme,
-                    w_list, w_act_list, n_bins=10,
-                    fig_nme='Double Lift Chart'):
-    """Legacy function wrapper for PlotUtils.plot_dlift_list()."""
-    return PlotUtils.plot_dlift_list(pred_model_1, pred_model_2,
-                                     model_nme_1, model_nme_2,
-                                     tgt_nme, w_list, w_act_list,
-                                     n_bins, fig_nme)

ins_pricing/modelling/core/bayesopt/utils.py DELETED Viewed

@@ -1,105 +0,0 @@
-"""DEPRECATED: Backward compatibility wrapper.
-This module is kept for backward compatibility but will be removed in v0.4.0.
-The monolithic utils.py (1,503 lines) has been split into focused modules:
-    utils/
-    ├── constants.py          - EPS, set_global_seed, etc.
-    ├── io_utils.py           - IOUtils for file operations
-    ├── distributed_utils.py  - DistributedUtils, TrainingUtils
-    ├── torch_trainer_mixin.py - TorchTrainerMixin for PyTorch
-    └── metrics_and_devices.py - Metrics, GPU, device, CV, plotting
-All imports still work the same way:
-    from ins_pricing.modelling.core.bayesopt.utils import EPS, IOUtils
-Or use the new package directly:
-    from ins_pricing.modelling.core.bayesopt.utils import EPS, IOUtils
-    from ins_pricing.modelling.core.bayesopt.utils.constants import EPS
-Both will work identically. The old single-file import will show a deprecation
-warning but continues to function.
-"""
-from __future__ import annotations
-import os
-import warnings
-# Show deprecation warning
-warnings.warn(
-    "Importing from bayesopt.utils (single file) is deprecated. "
-    "This file will be removed in v0.4.0. "
-    "The utils module has been split into focused submodules for better maintainability. "
-    "Imports will continue to work from the utils package without changes.",
-    DeprecationWarning,
-    stacklevel=2
-)
-# Treat this module as a package so submodules resolve even if this file is loaded.
-__path__ = [os.path.join(os.path.dirname(__file__), "utils")]
-# Re-export from refactored utils package for backward compatibility
-from .utils.constants import (
-    EPS,
-    set_global_seed,
-    ensure_parent_dir,
-    compute_batch_size,
-    tweedie_loss,
-    infer_factor_and_cate_list,
-)
-from .utils.io_utils import (
-    IOUtils,
-    csv_to_dict,
-)
-from .utils.distributed_utils import (
-    DistributedUtils,
-    TrainingUtils,
-    free_cuda,
-)
-from .utils.torch_trainer_mixin import (
-    TorchTrainerMixin,
-)
-from .utils.metrics_and_devices import (
-    get_logger,
-    MetricFactory,
-    GPUMemoryManager,
-    DeviceManager,
-    CVStrategyResolver,
-    PlotUtils,
-    split_data,
-    plot_lift_list,
-    plot_dlift_list,
-    _OrderedSplitter,
-)
-# Explicitly list all exports to support IDE auto-completion
-__all__ = [
-    # Constants
-    'EPS',
-    'set_global_seed',
-    'ensure_parent_dir',
-    'compute_batch_size',
-    'tweedie_loss',
-    'infer_factor_and_cate_list',
-    # I/O
-    'IOUtils',
-    'csv_to_dict',
-    # Distributed
-    'DistributedUtils',
-    'TrainingUtils',
-    'free_cuda',
-    # PyTorch
-    'TorchTrainerMixin',
-    # Utilities
-    'get_logger',
-    'MetricFactory',
-    'GPUMemoryManager',
-    'DeviceManager',
-    'CVStrategyResolver',
-    'PlotUtils',
-    'split_data',
-    'plot_lift_list',
-    'plot_dlift_list',
-    '_OrderedSplitter',
-]

ins-pricing 0.4.4__py3-none-any.whl → 0.5.0__py3-none-any.whl

ins-pricing 0.4.4__py3-none-any.whl → 0.5.0__py3-none-any.whl