ins-pricing 0.4.5__py3-none-any.whl → 0.5.1__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (93)
  1. ins_pricing/README.md +48 -22
  2. ins_pricing/__init__.py +142 -90
  3. ins_pricing/cli/BayesOpt_entry.py +58 -46
  4. ins_pricing/cli/BayesOpt_incremental.py +77 -110
  5. ins_pricing/cli/Explain_Run.py +42 -23
  6. ins_pricing/cli/Explain_entry.py +551 -577
  7. ins_pricing/cli/Pricing_Run.py +42 -23
  8. ins_pricing/cli/bayesopt_entry_runner.py +51 -16
  9. ins_pricing/cli/utils/bootstrap.py +23 -0
  10. ins_pricing/cli/utils/cli_common.py +256 -256
  11. ins_pricing/cli/utils/cli_config.py +379 -360
  12. ins_pricing/cli/utils/import_resolver.py +375 -358
  13. ins_pricing/cli/utils/notebook_utils.py +256 -242
  14. ins_pricing/cli/watchdog_run.py +216 -198
  15. ins_pricing/frontend/__init__.py +10 -10
  16. ins_pricing/frontend/app.py +132 -61
  17. ins_pricing/frontend/config_builder.py +33 -0
  18. ins_pricing/frontend/example_config.json +11 -0
  19. ins_pricing/frontend/example_workflows.py +1 -1
  20. ins_pricing/frontend/runner.py +340 -388
  21. ins_pricing/governance/__init__.py +20 -20
  22. ins_pricing/governance/release.py +159 -159
  23. ins_pricing/modelling/README.md +1 -1
  24. ins_pricing/modelling/__init__.py +147 -92
  25. ins_pricing/modelling/{core/bayesopt → bayesopt}/README.md +31 -13
  26. ins_pricing/modelling/{core/bayesopt → bayesopt}/__init__.py +64 -102
  27. ins_pricing/modelling/{core/bayesopt → bayesopt}/config_components.py +12 -0
  28. ins_pricing/modelling/{core/bayesopt → bayesopt}/config_preprocess.py +589 -552
  29. ins_pricing/modelling/{core/bayesopt → bayesopt}/core.py +987 -958
  30. ins_pricing/modelling/{core/bayesopt → bayesopt}/model_explain_mixin.py +296 -296
  31. ins_pricing/modelling/{core/bayesopt → bayesopt}/model_plotting_mixin.py +488 -548
  32. ins_pricing/modelling/{core/bayesopt → bayesopt}/models/__init__.py +27 -27
  33. ins_pricing/modelling/{core/bayesopt → bayesopt}/models/model_ft_components.py +349 -342
  34. ins_pricing/modelling/{core/bayesopt → bayesopt}/models/model_ft_trainer.py +921 -913
  35. ins_pricing/modelling/{core/bayesopt → bayesopt}/models/model_gnn.py +794 -785
  36. ins_pricing/modelling/{core/bayesopt → bayesopt}/models/model_resn.py +454 -446
  37. ins_pricing/modelling/bayesopt/trainers/__init__.py +19 -0
  38. ins_pricing/modelling/{core/bayesopt → bayesopt}/trainers/trainer_base.py +1294 -1282
  39. ins_pricing/modelling/{core/bayesopt → bayesopt}/trainers/trainer_ft.py +64 -56
  40. ins_pricing/modelling/{core/bayesopt → bayesopt}/trainers/trainer_glm.py +203 -198
  41. ins_pricing/modelling/{core/bayesopt → bayesopt}/trainers/trainer_gnn.py +333 -325
  42. ins_pricing/modelling/{core/bayesopt → bayesopt}/trainers/trainer_resn.py +279 -267
  43. ins_pricing/modelling/{core/bayesopt → bayesopt}/trainers/trainer_xgb.py +515 -313
  44. ins_pricing/modelling/bayesopt/utils/__init__.py +67 -0
  45. ins_pricing/modelling/bayesopt/utils/constants.py +21 -0
  46. ins_pricing/modelling/{core/bayesopt → bayesopt}/utils/distributed_utils.py +193 -186
  47. ins_pricing/modelling/bayesopt/utils/io_utils.py +7 -0
  48. ins_pricing/modelling/bayesopt/utils/losses.py +27 -0
  49. ins_pricing/modelling/bayesopt/utils/metrics_and_devices.py +17 -0
  50. ins_pricing/modelling/{core/bayesopt → bayesopt}/utils/torch_trainer_mixin.py +636 -623
  51. ins_pricing/modelling/{core/evaluation.py → evaluation.py} +113 -104
  52. ins_pricing/modelling/explain/__init__.py +55 -55
  53. ins_pricing/modelling/explain/metrics.py +27 -174
  54. ins_pricing/modelling/explain/permutation.py +237 -237
  55. ins_pricing/modelling/plotting/__init__.py +40 -36
  56. ins_pricing/modelling/plotting/compat.py +228 -0
  57. ins_pricing/modelling/plotting/curves.py +572 -572
  58. ins_pricing/modelling/plotting/diagnostics.py +163 -163
  59. ins_pricing/modelling/plotting/geo.py +362 -362
  60. ins_pricing/modelling/plotting/importance.py +121 -121
  61. ins_pricing/pricing/__init__.py +27 -27
  62. ins_pricing/pricing/factors.py +67 -56
  63. ins_pricing/production/__init__.py +35 -25
  64. ins_pricing/production/{predict.py → inference.py} +140 -57
  65. ins_pricing/production/monitoring.py +8 -21
  66. ins_pricing/reporting/__init__.py +11 -11
  67. ins_pricing/setup.py +1 -1
  68. ins_pricing/tests/production/test_inference.py +90 -0
  69. ins_pricing/utils/__init__.py +112 -78
  70. ins_pricing/utils/device.py +258 -237
  71. ins_pricing/utils/features.py +53 -0
  72. ins_pricing/utils/io.py +72 -0
  73. ins_pricing/utils/logging.py +34 -1
  74. ins_pricing/{modelling/core/bayesopt/utils → utils}/losses.py +125 -129
  75. ins_pricing/utils/metrics.py +158 -24
  76. ins_pricing/utils/numerics.py +76 -0
  77. ins_pricing/utils/paths.py +9 -1
  78. ins_pricing/utils/profiling.py +8 -4
  79. {ins_pricing-0.4.5.dist-info → ins_pricing-0.5.1.dist-info}/METADATA +1 -1
  80. ins_pricing-0.5.1.dist-info/RECORD +132 -0
  81. ins_pricing/modelling/core/BayesOpt.py +0 -146
  82. ins_pricing/modelling/core/__init__.py +0 -1
  83. ins_pricing/modelling/core/bayesopt/trainers/__init__.py +0 -19
  84. ins_pricing/modelling/core/bayesopt/utils/__init__.py +0 -86
  85. ins_pricing/modelling/core/bayesopt/utils/constants.py +0 -183
  86. ins_pricing/modelling/core/bayesopt/utils/io_utils.py +0 -126
  87. ins_pricing/modelling/core/bayesopt/utils/metrics_and_devices.py +0 -555
  88. ins_pricing/modelling/core/bayesopt/utils.py +0 -105
  89. ins_pricing/modelling/core/bayesopt/utils_backup.py +0 -1503
  90. ins_pricing/tests/production/test_predict.py +0 -233
  91. ins_pricing-0.4.5.dist-info/RECORD +0 -130
  92. {ins_pricing-0.4.5.dist-info → ins_pricing-0.5.1.dist-info}/WHEEL +0 -0
  93. {ins_pricing-0.4.5.dist-info → ins_pricing-0.5.1.dist-info}/top_level.txt +0 -0
@@ -17,16 +17,31 @@ from ins_pricing.frontend.ft_workflow import FTWorkflowHelper
17
17
  from ins_pricing.frontend.runner import TaskRunner
18
18
  from ins_pricing.frontend.config_builder import ConfigBuilder
19
19
  import json
20
+ import tempfile
20
21
  import sys
21
22
  import inspect
23
+ import importlib.util
22
24
  from pathlib import Path
23
- from typing import Optional, Dict, Any, Callable, Iterable, Tuple
25
+ from typing import Optional, Dict, Any, Callable, Iterable, Tuple, Generator
24
26
  import threading
25
27
  import queue
26
28
  import time
27
29
 
28
- # Add parent directory to path to import ins_pricing modules
29
- sys.path.insert(0, str(Path(__file__).parent.parent.parent))
30
+ def _ensure_repo_root() -> None:
31
+ if __package__ not in {None, ""}:
32
+ return
33
+ if importlib.util.find_spec("ins_pricing") is not None:
34
+ return
35
+ bootstrap_path = Path(__file__).resolve().parents[1] / "cli" / "utils" / "bootstrap.py"
36
+ spec = importlib.util.spec_from_file_location("ins_pricing.cli.utils.bootstrap", bootstrap_path)
37
+ if spec is None or spec.loader is None:
38
+ return
39
+ module = importlib.util.module_from_spec(spec)
40
+ spec.loader.exec_module(module)
41
+ module.ensure_repo_root()
42
+
43
+
44
+ _ensure_repo_root()
30
45
 
31
46
  os.environ.setdefault("GRADIO_ANALYTICS_ENABLED", "False")
32
47
  os.environ.setdefault("GRADIO_TELEMETRY_ENABLED", "False")
@@ -112,10 +127,21 @@ class PricingApp:
112
127
  output_dir: str,
113
128
  use_gpu: bool,
114
129
  model_keys: str,
115
- max_evals: int,
116
- xgb_max_depth_max: int,
117
- xgb_n_estimators_max: int,
118
- ) -> tuple[str, str]:
130
+ max_evals: int,
131
+ xgb_max_depth_max: int,
132
+ xgb_n_estimators_max: int,
133
+ xgb_gpu_id: int,
134
+ xgb_cleanup_per_fold: bool,
135
+ xgb_cleanup_synchronize: bool,
136
+ xgb_use_dmatrix: bool,
137
+ ft_cleanup_per_fold: bool,
138
+ ft_cleanup_synchronize: bool,
139
+ resn_cleanup_per_fold: bool,
140
+ resn_cleanup_synchronize: bool,
141
+ gnn_cleanup_per_fold: bool,
142
+ gnn_cleanup_synchronize: bool,
143
+ optuna_cleanup_synchronize: bool,
144
+ ) -> tuple[str, str]:
119
145
  """Build configuration from UI parameters."""
120
146
  try:
121
147
  # Parse comma-separated lists
@@ -148,10 +174,21 @@ class PricingApp:
148
174
  output_dir=output_dir,
149
175
  use_gpu=use_gpu,
150
176
  model_keys=model_keys,
151
- max_evals=max_evals,
152
- xgb_max_depth_max=xgb_max_depth_max,
153
- xgb_n_estimators_max=xgb_n_estimators_max,
154
- )
177
+ max_evals=max_evals,
178
+ xgb_max_depth_max=xgb_max_depth_max,
179
+ xgb_n_estimators_max=xgb_n_estimators_max,
180
+ xgb_gpu_id=xgb_gpu_id,
181
+ xgb_cleanup_per_fold=xgb_cleanup_per_fold,
182
+ xgb_cleanup_synchronize=xgb_cleanup_synchronize,
183
+ xgb_use_dmatrix=xgb_use_dmatrix,
184
+ ft_cleanup_per_fold=ft_cleanup_per_fold,
185
+ ft_cleanup_synchronize=ft_cleanup_synchronize,
186
+ resn_cleanup_per_fold=resn_cleanup_per_fold,
187
+ resn_cleanup_synchronize=resn_cleanup_synchronize,
188
+ gnn_cleanup_per_fold=gnn_cleanup_per_fold,
189
+ gnn_cleanup_synchronize=gnn_cleanup_synchronize,
190
+ optuna_cleanup_synchronize=optuna_cleanup_synchronize,
191
+ )
155
192
 
156
193
  is_valid, msg = self.config_builder.validate_config(config)
157
194
  if not is_valid:
@@ -180,54 +217,60 @@ class PricingApp:
180
217
  except Exception as e:
181
218
  return f"Error saving config: {str(e)}"
182
219
 
183
- def run_training(self, config_json: str) -> tuple[str, str]:
220
+ def run_training(self, config_json: str) -> Generator[tuple[str, str], None, None]:
184
221
  """
185
222
  Run task (training, explain, plotting, etc.) with the current configuration.
186
223
 
187
224
  The task type is automatically detected from config.runner.mode.
188
225
  Supported modes: entry (training), explain, incremental, watchdog, etc.
189
226
  """
190
- try:
191
- temp_config_path = None
192
- if config_json:
193
- config = json.loads(config_json)
194
- task_mode = config.get('runner', {}).get('mode', 'entry')
195
- base_dir = self.current_config_dir or Path.cwd()
196
- temp_config_path = (base_dir / "temp_config.json").resolve()
197
- with open(temp_config_path, 'w', encoding='utf-8') as f:
198
- json.dump(config, f, indent=2)
199
- config_path = temp_config_path
200
- elif self.current_config_path and self.current_config_path.exists():
201
- config_path = self.current_config_path
202
- config = json.loads(config_path.read_text(encoding="utf-8"))
203
- task_mode = config.get('runner', {}).get('mode', 'entry')
204
- elif self.current_config:
205
- config = self.current_config
206
- task_mode = config.get('runner', {}).get('mode', 'entry')
207
- temp_config_path = (Path.cwd() / "temp_config.json").resolve()
208
- with open(temp_config_path, 'w', encoding='utf-8') as f:
209
- json.dump(config, f, indent=2)
210
- config_path = temp_config_path
211
- else:
212
- return "No configuration provided", ""
213
-
214
- log_generator = self.runner.run_task(str(config_path))
215
-
216
- # Collect logs
217
- full_log = ""
218
- for log_line in log_generator:
219
- full_log += log_line + "\n"
220
- yield f"Task [{task_mode}] in progress...", full_log
221
-
222
- # Clean up
223
- if temp_config_path and temp_config_path.exists():
224
- temp_config_path.unlink()
225
-
226
- yield f"Task [{task_mode}] completed!", full_log
227
-
228
- except Exception as e:
229
- error_msg = f"Error during task execution: {str(e)}"
230
- yield error_msg, error_msg
227
+ temp_config_path: Optional[Path] = None
228
+ try:
229
+ if config_json:
230
+ config = json.loads(config_json)
231
+ task_mode = config.get('runner', {}).get('mode', 'entry')
232
+ base_dir = self.current_config_dir or Path.cwd()
233
+ fd, temp_path = tempfile.mkstemp(prefix="temp_config_", suffix=".json", dir=base_dir)
234
+ temp_config_path = Path(temp_path)
235
+ with os.fdopen(fd, 'w', encoding='utf-8') as f:
236
+ json.dump(config, f, indent=2)
237
+ config_path = temp_config_path
238
+ elif self.current_config_path and self.current_config_path.exists():
239
+ config_path = self.current_config_path
240
+ config = json.loads(config_path.read_text(encoding="utf-8"))
241
+ task_mode = config.get('runner', {}).get('mode', 'entry')
242
+ elif self.current_config:
243
+ config = self.current_config
244
+ task_mode = config.get('runner', {}).get('mode', 'entry')
245
+ base_dir = Path.cwd()
246
+ fd, temp_path = tempfile.mkstemp(prefix="temp_config_", suffix=".json", dir=base_dir)
247
+ temp_config_path = Path(temp_path)
248
+ with os.fdopen(fd, 'w', encoding='utf-8') as f:
249
+ json.dump(config, f, indent=2)
250
+ config_path = temp_config_path
251
+ else:
252
+ yield "No configuration provided", ""
253
+ return
254
+
255
+ log_generator = self.runner.run_task(str(config_path))
256
+
257
+ # Collect logs
258
+ full_log = ""
259
+ for log_line in log_generator:
260
+ full_log += log_line + "\n"
261
+ yield f"Task [{task_mode}] in progress...", full_log
262
+
263
+ yield f"Task [{task_mode}] completed!", full_log
264
+
265
+ except Exception as e:
266
+ error_msg = f"Error during task execution: {str(e)}"
267
+ yield error_msg, error_msg
268
+ finally:
269
+ if temp_config_path is not None:
270
+ try:
271
+ temp_config_path.unlink(missing_ok=True)
272
+ except Exception:
273
+ pass
231
274
 
232
275
  def prepare_ft_step1(self, config_json: str, use_ddp: bool, nproc: int) -> tuple[str, str]:
233
276
  """Prepare FT Step 1 configuration."""
@@ -551,11 +594,34 @@ def create_ui():
551
594
  label="Max Evaluations", value=50, precision=0)
552
595
 
553
596
  with gr.Column():
554
- gr.Markdown("#### XGBoost Settings")
555
- xgb_max_depth_max = gr.Number(
556
- label="XGB Max Depth", value=25, precision=0)
557
- xgb_n_estimators_max = gr.Number(
558
- label="XGB Max Estimators", value=500, precision=0)
597
+ gr.Markdown("#### XGBoost Settings")
598
+ xgb_max_depth_max = gr.Number(
599
+ label="XGB Max Depth", value=25, precision=0)
600
+ xgb_n_estimators_max = gr.Number(
601
+ label="XGB Max Estimators", value=500, precision=0)
602
+ xgb_gpu_id = gr.Number(
603
+ label="XGB GPU ID", value=0, precision=0)
604
+ xgb_cleanup_per_fold = gr.Checkbox(
605
+ label="XGB Cleanup Per Fold", value=False)
606
+ xgb_cleanup_synchronize = gr.Checkbox(
607
+ label="XGB Cleanup Synchronize", value=False)
608
+ xgb_use_dmatrix = gr.Checkbox(
609
+ label="XGB Use DMatrix", value=True)
610
+ gr.Markdown("#### Fold Cleanup")
611
+ ft_cleanup_per_fold = gr.Checkbox(
612
+ label="FT Cleanup Per Fold", value=False)
613
+ ft_cleanup_synchronize = gr.Checkbox(
614
+ label="FT Cleanup Synchronize", value=False)
615
+ resn_cleanup_per_fold = gr.Checkbox(
616
+ label="ResNet Cleanup Per Fold", value=False)
617
+ resn_cleanup_synchronize = gr.Checkbox(
618
+ label="ResNet Cleanup Synchronize", value=False)
619
+ gnn_cleanup_per_fold = gr.Checkbox(
620
+ label="GNN Cleanup Per Fold", value=False)
621
+ gnn_cleanup_synchronize = gr.Checkbox(
622
+ label="GNN Cleanup Synchronize", value=False)
623
+ optuna_cleanup_synchronize = gr.Checkbox(
624
+ label="Optuna Cleanup Synchronize", value=False)
559
625
 
560
626
  with gr.Row():
561
627
  build_btn = gr.Button(
@@ -836,9 +902,14 @@ def create_ui():
836
902
  data_dir, model_list, model_categories, target, weight,
837
903
  feature_list, categorical_features, task_type, prop_test,
838
904
  holdout_ratio, val_ratio, split_strategy, rand_seed, epochs,
839
- output_dir, use_gpu, model_keys, max_evals,
840
- xgb_max_depth_max, xgb_n_estimators_max
841
- ],
905
+ output_dir, use_gpu, model_keys, max_evals,
906
+ xgb_max_depth_max, xgb_n_estimators_max,
907
+ xgb_gpu_id, xgb_cleanup_per_fold, xgb_cleanup_synchronize,
908
+ xgb_use_dmatrix, ft_cleanup_per_fold, ft_cleanup_synchronize,
909
+ resn_cleanup_per_fold, resn_cleanup_synchronize,
910
+ gnn_cleanup_per_fold, gnn_cleanup_synchronize,
911
+ optuna_cleanup_synchronize
912
+ ],
842
913
  outputs=[build_status, config_json]
843
914
  )
844
915
 
@@ -148,6 +148,17 @@ class ConfigBuilder:
148
148
  max_evals: int = 50,
149
149
  xgb_max_depth_max: int = 25,
150
150
  xgb_n_estimators_max: int = 500,
151
+ xgb_gpu_id: Optional[int] = None,
152
+ xgb_cleanup_per_fold: bool = False,
153
+ xgb_cleanup_synchronize: bool = False,
154
+ xgb_use_dmatrix: bool = True,
155
+ ft_cleanup_per_fold: bool = False,
156
+ ft_cleanup_synchronize: bool = False,
157
+ resn_cleanup_per_fold: bool = False,
158
+ resn_cleanup_synchronize: bool = False,
159
+ gnn_cleanup_per_fold: bool = False,
160
+ gnn_cleanup_synchronize: bool = False,
161
+ optuna_cleanup_synchronize: bool = False,
151
162
  nproc_per_node: int = 2,
152
163
  ) -> Dict[str, Any]:
153
164
  """
@@ -174,6 +185,17 @@ class ConfigBuilder:
174
185
  max_evals: Maximum number of evaluations for optimization
175
186
  xgb_max_depth_max: Maximum depth for XGBoost
176
187
  xgb_n_estimators_max: Maximum estimators for XGBoost
188
+ xgb_gpu_id: XGBoost GPU device id (None = default)
189
+ xgb_cleanup_per_fold: Cleanup GPU memory per XGBoost fold
190
+ xgb_cleanup_synchronize: Synchronize CUDA during XGBoost cleanup
191
+ xgb_use_dmatrix: Use xgb.train with DMatrix/QuantileDMatrix
192
+ ft_cleanup_per_fold: Cleanup GPU memory per FT fold
193
+ ft_cleanup_synchronize: Synchronize CUDA during FT cleanup
194
+ resn_cleanup_per_fold: Cleanup GPU memory per ResNet fold
195
+ resn_cleanup_synchronize: Synchronize CUDA during ResNet cleanup
196
+ gnn_cleanup_per_fold: Cleanup GPU memory per GNN fold
197
+ gnn_cleanup_synchronize: Synchronize CUDA during GNN cleanup
198
+ optuna_cleanup_synchronize: Synchronize CUDA during Optuna cleanup
177
199
  nproc_per_node: Number of processes per node
178
200
 
179
201
  Returns:
@@ -204,6 +226,17 @@ class ConfigBuilder:
204
226
  "use_gpu": use_gpu,
205
227
  "xgb_max_depth_max": xgb_max_depth_max,
206
228
  "xgb_n_estimators_max": xgb_n_estimators_max,
229
+ "xgb_gpu_id": xgb_gpu_id,
230
+ "xgb_cleanup_per_fold": xgb_cleanup_per_fold,
231
+ "xgb_cleanup_synchronize": xgb_cleanup_synchronize,
232
+ "xgb_use_dmatrix": xgb_use_dmatrix,
233
+ "ft_cleanup_per_fold": ft_cleanup_per_fold,
234
+ "ft_cleanup_synchronize": ft_cleanup_synchronize,
235
+ "resn_cleanup_per_fold": resn_cleanup_per_fold,
236
+ "resn_cleanup_synchronize": resn_cleanup_synchronize,
237
+ "gnn_cleanup_per_fold": gnn_cleanup_per_fold,
238
+ "gnn_cleanup_synchronize": gnn_cleanup_synchronize,
239
+ "optuna_cleanup_synchronize": optuna_cleanup_synchronize,
207
240
  "optuna_storage": f"{output_dir}/optuna/bayesopt.sqlite3",
208
241
  "stack_model_keys": model_keys,
209
242
  })
@@ -26,6 +26,17 @@
26
26
  "use_gpu": true,
27
27
  "xgb_max_depth_max": 25,
28
28
  "xgb_n_estimators_max": 500,
29
+ "xgb_gpu_id": 0,
30
+ "xgb_cleanup_per_fold": false,
31
+ "xgb_cleanup_synchronize": false,
32
+ "xgb_use_dmatrix": true,
33
+ "ft_cleanup_per_fold": false,
34
+ "ft_cleanup_synchronize": false,
35
+ "resn_cleanup_per_fold": false,
36
+ "resn_cleanup_synchronize": false,
37
+ "gnn_cleanup_per_fold": false,
38
+ "gnn_cleanup_synchronize": false,
39
+ "optuna_cleanup_synchronize": false,
29
40
  "optuna_storage": "./Results/optuna/bayesopt.sqlite3",
30
41
  "runner": {
31
42
  "mode": "entry",
@@ -19,7 +19,7 @@ from ins_pricing.modelling.plotting import (
19
19
  plot_oneway,
20
20
  )
21
21
  from ins_pricing.modelling.plotting.common import finalize_figure, plt
22
- from ins_pricing.production.predict import load_predictor_from_config
22
+ from ins_pricing.production.inference import load_predictor_from_config
23
23
 
24
24
 
25
25
  def _parse_csv_list(value: str) -> List[str]: