ins-pricing 0.4.5-py3-none-any.whl → 0.5.1-py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- ins_pricing/README.md +48 -22
- ins_pricing/__init__.py +142 -90
- ins_pricing/cli/BayesOpt_entry.py +58 -46
- ins_pricing/cli/BayesOpt_incremental.py +77 -110
- ins_pricing/cli/Explain_Run.py +42 -23
- ins_pricing/cli/Explain_entry.py +551 -577
- ins_pricing/cli/Pricing_Run.py +42 -23
- ins_pricing/cli/bayesopt_entry_runner.py +51 -16
- ins_pricing/cli/utils/bootstrap.py +23 -0
- ins_pricing/cli/utils/cli_common.py +256 -256
- ins_pricing/cli/utils/cli_config.py +379 -360
- ins_pricing/cli/utils/import_resolver.py +375 -358
- ins_pricing/cli/utils/notebook_utils.py +256 -242
- ins_pricing/cli/watchdog_run.py +216 -198
- ins_pricing/frontend/__init__.py +10 -10
- ins_pricing/frontend/app.py +132 -61
- ins_pricing/frontend/config_builder.py +33 -0
- ins_pricing/frontend/example_config.json +11 -0
- ins_pricing/frontend/example_workflows.py +1 -1
- ins_pricing/frontend/runner.py +340 -388
- ins_pricing/governance/__init__.py +20 -20
- ins_pricing/governance/release.py +159 -159
- ins_pricing/modelling/README.md +1 -1
- ins_pricing/modelling/__init__.py +147 -92
- ins_pricing/modelling/{core/bayesopt → bayesopt}/README.md +31 -13
- ins_pricing/modelling/{core/bayesopt → bayesopt}/__init__.py +64 -102
- ins_pricing/modelling/{core/bayesopt → bayesopt}/config_components.py +12 -0
- ins_pricing/modelling/{core/bayesopt → bayesopt}/config_preprocess.py +589 -552
- ins_pricing/modelling/{core/bayesopt → bayesopt}/core.py +987 -958
- ins_pricing/modelling/{core/bayesopt → bayesopt}/model_explain_mixin.py +296 -296
- ins_pricing/modelling/{core/bayesopt → bayesopt}/model_plotting_mixin.py +488 -548
- ins_pricing/modelling/{core/bayesopt → bayesopt}/models/__init__.py +27 -27
- ins_pricing/modelling/{core/bayesopt → bayesopt}/models/model_ft_components.py +349 -342
- ins_pricing/modelling/{core/bayesopt → bayesopt}/models/model_ft_trainer.py +921 -913
- ins_pricing/modelling/{core/bayesopt → bayesopt}/models/model_gnn.py +794 -785
- ins_pricing/modelling/{core/bayesopt → bayesopt}/models/model_resn.py +454 -446
- ins_pricing/modelling/bayesopt/trainers/__init__.py +19 -0
- ins_pricing/modelling/{core/bayesopt → bayesopt}/trainers/trainer_base.py +1294 -1282
- ins_pricing/modelling/{core/bayesopt → bayesopt}/trainers/trainer_ft.py +64 -56
- ins_pricing/modelling/{core/bayesopt → bayesopt}/trainers/trainer_glm.py +203 -198
- ins_pricing/modelling/{core/bayesopt → bayesopt}/trainers/trainer_gnn.py +333 -325
- ins_pricing/modelling/{core/bayesopt → bayesopt}/trainers/trainer_resn.py +279 -267
- ins_pricing/modelling/{core/bayesopt → bayesopt}/trainers/trainer_xgb.py +515 -313
- ins_pricing/modelling/bayesopt/utils/__init__.py +67 -0
- ins_pricing/modelling/bayesopt/utils/constants.py +21 -0
- ins_pricing/modelling/{core/bayesopt → bayesopt}/utils/distributed_utils.py +193 -186
- ins_pricing/modelling/bayesopt/utils/io_utils.py +7 -0
- ins_pricing/modelling/bayesopt/utils/losses.py +27 -0
- ins_pricing/modelling/bayesopt/utils/metrics_and_devices.py +17 -0
- ins_pricing/modelling/{core/bayesopt → bayesopt}/utils/torch_trainer_mixin.py +636 -623
- ins_pricing/modelling/{core/evaluation.py → evaluation.py} +113 -104
- ins_pricing/modelling/explain/__init__.py +55 -55
- ins_pricing/modelling/explain/metrics.py +27 -174
- ins_pricing/modelling/explain/permutation.py +237 -237
- ins_pricing/modelling/plotting/__init__.py +40 -36
- ins_pricing/modelling/plotting/compat.py +228 -0
- ins_pricing/modelling/plotting/curves.py +572 -572
- ins_pricing/modelling/plotting/diagnostics.py +163 -163
- ins_pricing/modelling/plotting/geo.py +362 -362
- ins_pricing/modelling/plotting/importance.py +121 -121
- ins_pricing/pricing/__init__.py +27 -27
- ins_pricing/pricing/factors.py +67 -56
- ins_pricing/production/__init__.py +35 -25
- ins_pricing/production/{predict.py → inference.py} +140 -57
- ins_pricing/production/monitoring.py +8 -21
- ins_pricing/reporting/__init__.py +11 -11
- ins_pricing/setup.py +1 -1
- ins_pricing/tests/production/test_inference.py +90 -0
- ins_pricing/utils/__init__.py +112 -78
- ins_pricing/utils/device.py +258 -237
- ins_pricing/utils/features.py +53 -0
- ins_pricing/utils/io.py +72 -0
- ins_pricing/utils/logging.py +34 -1
- ins_pricing/{modelling/core/bayesopt/utils → utils}/losses.py +125 -129
- ins_pricing/utils/metrics.py +158 -24
- ins_pricing/utils/numerics.py +76 -0
- ins_pricing/utils/paths.py +9 -1
- ins_pricing/utils/profiling.py +8 -4
- {ins_pricing-0.4.5.dist-info → ins_pricing-0.5.1.dist-info}/METADATA +1 -1
- ins_pricing-0.5.1.dist-info/RECORD +132 -0
- ins_pricing/modelling/core/BayesOpt.py +0 -146
- ins_pricing/modelling/core/__init__.py +0 -1
- ins_pricing/modelling/core/bayesopt/trainers/__init__.py +0 -19
- ins_pricing/modelling/core/bayesopt/utils/__init__.py +0 -86
- ins_pricing/modelling/core/bayesopt/utils/constants.py +0 -183
- ins_pricing/modelling/core/bayesopt/utils/io_utils.py +0 -126
- ins_pricing/modelling/core/bayesopt/utils/metrics_and_devices.py +0 -555
- ins_pricing/modelling/core/bayesopt/utils.py +0 -105
- ins_pricing/modelling/core/bayesopt/utils_backup.py +0 -1503
- ins_pricing/tests/production/test_predict.py +0 -233
- ins_pricing-0.4.5.dist-info/RECORD +0 -130
- {ins_pricing-0.4.5.dist-info → ins_pricing-0.5.1.dist-info}/WHEEL +0 -0
- {ins_pricing-0.4.5.dist-info → ins_pricing-0.5.1.dist-info}/top_level.txt +0 -0
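
The most visible changes in 0.5.1 are structural: `modelling/core/bayesopt` is flattened to `modelling/bayesopt`, and `production/predict.py` is renamed to `production/inference.py` (its test moves from `test_predict.py` to `test_inference.py`). A hedged sketch of how downstream imports might change, using only module paths that appear in the listing above; whether the old paths remain importable through compatibility shims is not shown here:

```python
# Hypothetical call-site migration; paths are taken from the file listing above.

# 0.4.5 layout (old paths, shown for comparison):
# from ins_pricing.modelling.core.bayesopt import core
# from ins_pricing.production import predict

# 0.5.1 layout (new paths):
from ins_pricing.modelling.bayesopt import core    # modelling/bayesopt/core.py
from ins_pricing.production import inference       # production/inference.py
```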
ins_pricing/modelling/bayesopt/utils/__init__.py (new file)
@@ -0,0 +1,67 @@
+"""Backward compatibility re-exports for bayesopt utilities.
+
+This module keeps legacy imports working while routing general helpers
+through ins_pricing.utils and leaving bayesopt-specific utilities in place.
+"""
+
+from __future__ import annotations
+
+# Constants and simple utilities
+from ins_pricing.modelling.bayesopt.utils.constants import (
+    EPS,
+    set_global_seed,
+    ensure_parent_dir,
+    compute_batch_size,
+    tweedie_loss,
+    infer_factor_and_cate_list,
+)
+
+# I/O utilities
+from ins_pricing.modelling.bayesopt.utils.io_utils import (
+    IOUtils,
+    csv_to_dict,
+)
+
+# Distributed training
+from ins_pricing.modelling.bayesopt.utils.distributed_utils import (
+    DistributedUtils,
+    TrainingUtils,
+    free_cuda,
+)
+
+# PyTorch training mixin
+from ins_pricing.modelling.bayesopt.utils.torch_trainer_mixin import (
+    TorchTrainerMixin,
+)
+
+# Metrics and device helpers (shared utilities)
+from ins_pricing.modelling.bayesopt.utils.metrics_and_devices import (
+    get_logger,
+    MetricFactory,
+    GPUMemoryManager,
+    DeviceManager,
+)
+
+__all__ = [
+    # Constants
+    'EPS',
+    'set_global_seed',
+    'ensure_parent_dir',
+    'compute_batch_size',
+    'tweedie_loss',
+    'infer_factor_and_cate_list',
+    # I/O
+    'IOUtils',
+    'csv_to_dict',
+    # Distributed
+    'DistributedUtils',
+    'TrainingUtils',
+    'free_cuda',
+    # PyTorch
+    'TorchTrainerMixin',
+    # Utilities
+    'get_logger',
+    'MetricFactory',
+    'GPUMemoryManager',
+    'DeviceManager',
+]
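
The new `bayesopt/utils/__init__.py` above is a pure re-export shim, so call sites written against the old utilities package should keep resolving. A minimal sketch, assuming the package is installed and that `set_global_seed` takes a single integer seed (its signature is not shown in this diff):

```python
# Legacy-style import path; the shim forwards these names from their new homes.
from ins_pricing.modelling.bayesopt.utils import EPS, set_global_seed, free_cuda

set_global_seed(42)   # assumed signature: a single integer seed
print(EPS)            # constant re-exported from ins_pricing.utils.numerics
```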
ins_pricing/modelling/bayesopt/utils/constants.py (new file)
@@ -0,0 +1,21 @@
+"""Backward-compatible re-exports for numerical utilities."""
+
+from __future__ import annotations
+
+from ins_pricing.utils.features import infer_factor_and_cate_list
+from ins_pricing.utils.io import ensure_parent_dir
+from ins_pricing.utils.numerics import (
+    EPS,
+    compute_batch_size,
+    set_global_seed,
+    tweedie_loss,
+)
+
+__all__ = [
+    "EPS",
+    "set_global_seed",
+    "ensure_parent_dir",
+    "compute_batch_size",
+    "tweedie_loss",
+    "infer_factor_and_cate_list",
+]
ins_pricing/modelling/{core/bayesopt → bayesopt}/utils/distributed_utils.py
@@ -1,186 +1,193 @@
(The 186 lines removed from the previous core/bayesopt copy are not legible in this view; only the 193-line replacement is shown.)
+"""Distributed training utilities for PyTorch DDP.
+
+This module contains:
+- DistributedUtils for DDP setup and process coordination
+- TrainingUtils for CUDA memory management
+- free_cuda() for legacy compatibility
+"""
+
+from __future__ import annotations
+
+import gc
+import os
+from datetime import timedelta
+from typing import Optional
+
+import torch
+import torch.distributed as dist
+from ins_pricing.utils import get_logger, log_print
+
+_logger = get_logger("ins_pricing.modelling.bayesopt.utils.distributed_utils")
+
+
+def _log(*args, **kwargs) -> None:
+    log_print(_logger, *args, **kwargs)
+
+
+def _select_ddp_backend() -> str:
+    """Select the appropriate DDP backend based on system capabilities.
+
+    Returns:
+        "nccl" if CUDA is available and NCCL is supported (non-Windows),
+        otherwise "gloo"
+    """
+    if not torch.cuda.is_available():
+        return "gloo"
+
+    if os.name == "nt":  # Windows doesn't support NCCL
+        return "gloo"
+
+    try:
+        nccl_available = getattr(dist, "is_nccl_available", lambda: False)()
+        return "nccl" if nccl_available else "gloo"
+    except Exception:
+        return "gloo"
+
+
+def _get_ddp_timeout() -> timedelta:
+    """Get the DDP timeout from environment variable.
+
+    Returns:
+        timedelta for DDP timeout (default: 1800 seconds)
+    """
+    timeout_seconds = int(os.environ.get("BAYESOPT_DDP_TIMEOUT_SECONDS", "1800"))
+    return timedelta(seconds=max(1, timeout_seconds))
+
+
+def _cache_ddp_state(local_rank: int, rank: int, world_size: int) -> tuple:
+    """Cache and return DDP state tuple."""
+    state = (True, local_rank, rank, world_size)
+    DistributedUtils._cached_state = state
+    return state
+
+
+class DistributedUtils:
+    """Utilities for distributed data parallel training.
+
+    This class provides methods for:
+    - Initializing DDP process groups
+    - Checking process rank and world size
+    - Cleanup after distributed training
+    """
+
+    _cached_state: Optional[tuple] = None
+
+    @staticmethod
+    def setup_ddp():
+        """Initialize the DDP process group for distributed training.
+
+        Returns:
+            Tuple of (success, local_rank, rank, world_size)
+        """
+        # Return cached state if already initialized
+        if dist.is_initialized():
+            if DistributedUtils._cached_state is None:
+                DistributedUtils._cached_state = _cache_ddp_state(
+                    int(os.environ.get("LOCAL_RANK", 0)),
+                    dist.get_rank(),
+                    dist.get_world_size(),
+                )
+            return DistributedUtils._cached_state
+
+        # Check for required environment variables
+        if 'RANK' not in os.environ or 'WORLD_SIZE' not in os.environ:
+            _log(
+                f">>> DDP Setup Failed: RANK or WORLD_SIZE not found in env. "
+                f"Keys found: {list(os.environ.keys())}"
+            )
+            _log(">>> Hint: launch with torchrun --nproc_per_node=<N> <script.py>")
+            return False, 0, 0, 1
+
+        rank = int(os.environ["RANK"])
+        world_size = int(os.environ["WORLD_SIZE"])
+        local_rank = int(os.environ.get("LOCAL_RANK", 0))
+
+        # Windows CUDA DDP is not supported
+        if os.name == "nt" and torch.cuda.is_available() and world_size > 1:
+            _log(
+                ">>> DDP Setup Disabled: Windows CUDA DDP is not supported. "
+                "Falling back to single process."
+            )
+            return False, 0, 0, 1
+
+        # Set CUDA device for this process
+        if torch.cuda.is_available():
+            torch.cuda.set_device(local_rank)
+
+        # Initialize process group
+        backend = _select_ddp_backend()
+        timeout = _get_ddp_timeout()
+
+        dist.init_process_group(backend=backend, init_method="env://", timeout=timeout)
+        _log(
+            f">>> DDP Initialized ({backend}, timeout={timeout.total_seconds():.0f}s): "
+            f"Rank {rank}/{world_size}, Local Rank {local_rank}"
+        )
+
+        return _cache_ddp_state(local_rank, rank, world_size)
+
+    @staticmethod
+    def cleanup_ddp():
+        """Destroy the DDP process group and clear cached state."""
+        if dist.is_initialized():
+            dist.destroy_process_group()
+        DistributedUtils._cached_state = None
+
+    @staticmethod
+    def is_main_process():
+        """Check if current process is rank 0 (main process).
+
+        Returns:
+            True if main process or DDP not initialized
+        """
+        return not dist.is_initialized() or dist.get_rank() == 0
+
+    @staticmethod
+    def world_size() -> int:
+        """Get the total number of processes in the distributed group.
+
+        Returns:
+            World size (1 if DDP not initialized)
+        """
+        return dist.get_world_size() if dist.is_initialized() else 1
+
+
+class TrainingUtils:
+    """General training utilities including CUDA management."""
+
+    @staticmethod
+    def free_cuda() -> None:
+        """Release CUDA memory and clear cache.
+
+        This performs aggressive cleanup:
+        1. Move all PyTorch models to CPU
+        2. Run garbage collection
+        3. Clear CUDA cache
+        """
+        _log(">>> Moving all models to CPU...")
+        for obj in gc.get_objects():
+            try:
+                if hasattr(obj, "to") and callable(obj.to):
+                    obj.to("cpu")
+            except Exception:
+                pass
+
+        _log(">>> Releasing tensor/optimizer/DataLoader references...")
+        gc.collect()
+
+        _log(">>> Clearing CUDA cache...")
+        if torch.cuda.is_available():
+            torch.cuda.empty_cache()
+            torch.cuda.synchronize()
+            _log(">>> CUDA memory released.")
+        else:
+            _log(">>> CUDA not available; cleanup skipped.")
+
+
+# Backward compatibility function wrapper
+def free_cuda():
+    """Legacy function wrapper for CUDA memory cleanup.
+
+    This function calls TrainingUtils.free_cuda() for backward compatibility.
+    """
+    TrainingUtils.free_cuda()
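
For context, a minimal sketch of driving `DistributedUtils` from a script launched with torchrun (the launch hint comes from the module's own log message); the training-loop body is a placeholder and not part of the package:

```python
# sketch: run with `torchrun --nproc_per_node=2 train.py`
from ins_pricing.modelling.bayesopt.utils.distributed_utils import DistributedUtils

ok, local_rank, rank, world_size = DistributedUtils.setup_ddp()
try:
    if DistributedUtils.is_main_process():
        print(f"DDP active: {ok}, world size: {world_size}")
    # ... build the model, wrap it in DistributedDataParallel when ok is True,
    # and run the training loop here (placeholder) ...
finally:
    DistributedUtils.cleanup_ddp()
```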
ins_pricing/modelling/bayesopt/utils/losses.py (new file)
@@ -0,0 +1,27 @@
+"""Backward-compatible re-exports for loss utilities."""
+
+from __future__ import annotations
+
+from ins_pricing.utils.losses import (
+    CLASSIFICATION_LOSSES,
+    LOSS_ALIASES,
+    REGRESSION_LOSSES,
+    infer_loss_name_from_model_name,
+    loss_requires_positive,
+    normalize_loss_name,
+    regression_loss,
+    resolve_tweedie_power,
+    resolve_xgb_objective,
+)
+
+__all__ = [
+    "LOSS_ALIASES",
+    "REGRESSION_LOSSES",
+    "CLASSIFICATION_LOSSES",
+    "normalize_loss_name",
+    "infer_loss_name_from_model_name",
+    "resolve_tweedie_power",
+    "resolve_xgb_objective",
+    "regression_loss",
+    "loss_requires_positive",
+]
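
Like the other shims in this release, `bayesopt/utils/losses.py` only forwards names from `ins_pricing.utils.losses`, so the legacy and canonical paths should expose the same objects. A small sanity check, assuming both modules import cleanly:

```python
from ins_pricing.utils import losses as canonical
from ins_pricing.modelling.bayesopt.utils import losses as legacy

# Re-exports are the same objects, not copies, so identity should hold.
assert legacy.normalize_loss_name is canonical.normalize_loss_name
assert legacy.LOSS_ALIASES is canonical.LOSS_ALIASES
```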
ins_pricing/modelling/bayesopt/utils/metrics_and_devices.py (new file)
@@ -0,0 +1,17 @@
+"""Backward-compatible re-exports for metrics and device utilities."""
+
+from __future__ import annotations
+
+from ins_pricing.utils import (
+    DeviceManager,
+    GPUMemoryManager,
+    MetricFactory,
+    get_logger,
+)
+
+__all__ = [
+    "get_logger",
+    "MetricFactory",
+    "GPUMemoryManager",
+    "DeviceManager",
+]