ins-pricing 0.4.5__py3-none-any.whl → 0.5.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (84) hide show
  1. ins_pricing/README.md +48 -22
  2. ins_pricing/__init__.py +142 -90
  3. ins_pricing/cli/BayesOpt_entry.py +52 -50
  4. ins_pricing/cli/BayesOpt_incremental.py +39 -105
  5. ins_pricing/cli/Explain_Run.py +31 -23
  6. ins_pricing/cli/Explain_entry.py +532 -579
  7. ins_pricing/cli/Pricing_Run.py +31 -23
  8. ins_pricing/cli/bayesopt_entry_runner.py +11 -9
  9. ins_pricing/cli/utils/cli_common.py +256 -256
  10. ins_pricing/cli/utils/cli_config.py +375 -375
  11. ins_pricing/cli/utils/import_resolver.py +382 -365
  12. ins_pricing/cli/utils/notebook_utils.py +340 -340
  13. ins_pricing/cli/watchdog_run.py +209 -201
  14. ins_pricing/frontend/__init__.py +10 -10
  15. ins_pricing/frontend/example_workflows.py +1 -1
  16. ins_pricing/governance/__init__.py +20 -20
  17. ins_pricing/governance/release.py +159 -159
  18. ins_pricing/modelling/__init__.py +147 -92
  19. ins_pricing/modelling/{core/bayesopt → bayesopt}/README.md +2 -2
  20. ins_pricing/modelling/{core/bayesopt → bayesopt}/__init__.py +64 -102
  21. ins_pricing/modelling/{core/bayesopt → bayesopt}/config_preprocess.py +562 -562
  22. ins_pricing/modelling/{core/bayesopt → bayesopt}/core.py +965 -964
  23. ins_pricing/modelling/{core/bayesopt → bayesopt}/model_explain_mixin.py +296 -296
  24. ins_pricing/modelling/{core/bayesopt → bayesopt}/model_plotting_mixin.py +482 -548
  25. ins_pricing/modelling/{core/bayesopt → bayesopt}/models/__init__.py +27 -27
  26. ins_pricing/modelling/{core/bayesopt → bayesopt}/models/model_ft_trainer.py +915 -913
  27. ins_pricing/modelling/{core/bayesopt → bayesopt}/models/model_gnn.py +788 -785
  28. ins_pricing/modelling/{core/bayesopt → bayesopt}/models/model_resn.py +448 -446
  29. ins_pricing/modelling/bayesopt/trainers/__init__.py +19 -0
  30. ins_pricing/modelling/{core/bayesopt → bayesopt}/trainers/trainer_base.py +1308 -1308
  31. ins_pricing/modelling/{core/bayesopt → bayesopt}/trainers/trainer_ft.py +3 -3
  32. ins_pricing/modelling/{core/bayesopt → bayesopt}/trainers/trainer_glm.py +197 -198
  33. ins_pricing/modelling/{core/bayesopt → bayesopt}/trainers/trainer_gnn.py +344 -344
  34. ins_pricing/modelling/{core/bayesopt → bayesopt}/trainers/trainer_resn.py +283 -283
  35. ins_pricing/modelling/{core/bayesopt → bayesopt}/trainers/trainer_xgb.py +346 -347
  36. ins_pricing/modelling/bayesopt/utils/__init__.py +67 -0
  37. ins_pricing/modelling/bayesopt/utils/constants.py +21 -0
  38. ins_pricing/modelling/bayesopt/utils/io_utils.py +7 -0
  39. ins_pricing/modelling/bayesopt/utils/losses.py +27 -0
  40. ins_pricing/modelling/bayesopt/utils/metrics_and_devices.py +17 -0
  41. ins_pricing/modelling/{core/bayesopt → bayesopt}/utils/torch_trainer_mixin.py +623 -623
  42. ins_pricing/modelling/{core/evaluation.py → evaluation.py} +113 -104
  43. ins_pricing/modelling/explain/__init__.py +55 -55
  44. ins_pricing/modelling/explain/metrics.py +27 -174
  45. ins_pricing/modelling/explain/permutation.py +237 -237
  46. ins_pricing/modelling/plotting/__init__.py +40 -36
  47. ins_pricing/modelling/plotting/compat.py +228 -0
  48. ins_pricing/modelling/plotting/curves.py +572 -572
  49. ins_pricing/modelling/plotting/diagnostics.py +163 -163
  50. ins_pricing/modelling/plotting/geo.py +362 -362
  51. ins_pricing/modelling/plotting/importance.py +121 -121
  52. ins_pricing/pricing/__init__.py +27 -27
  53. ins_pricing/production/__init__.py +35 -25
  54. ins_pricing/production/{predict.py → inference.py} +140 -57
  55. ins_pricing/production/monitoring.py +8 -21
  56. ins_pricing/reporting/__init__.py +11 -11
  57. ins_pricing/setup.py +1 -1
  58. ins_pricing/tests/production/test_inference.py +90 -0
  59. ins_pricing/utils/__init__.py +116 -83
  60. ins_pricing/utils/device.py +255 -255
  61. ins_pricing/utils/features.py +53 -0
  62. ins_pricing/utils/io.py +72 -0
  63. ins_pricing/{modelling/core/bayesopt/utils → utils}/losses.py +125 -129
  64. ins_pricing/utils/metrics.py +158 -24
  65. ins_pricing/utils/numerics.py +76 -0
  66. ins_pricing/utils/paths.py +9 -1
  67. {ins_pricing-0.4.5.dist-info → ins_pricing-0.5.0.dist-info}/METADATA +182 -182
  68. ins_pricing-0.5.0.dist-info/RECORD +131 -0
  69. ins_pricing/modelling/core/BayesOpt.py +0 -146
  70. ins_pricing/modelling/core/__init__.py +0 -1
  71. ins_pricing/modelling/core/bayesopt/trainers/__init__.py +0 -19
  72. ins_pricing/modelling/core/bayesopt/utils/__init__.py +0 -86
  73. ins_pricing/modelling/core/bayesopt/utils/constants.py +0 -183
  74. ins_pricing/modelling/core/bayesopt/utils/io_utils.py +0 -126
  75. ins_pricing/modelling/core/bayesopt/utils/metrics_and_devices.py +0 -555
  76. ins_pricing/modelling/core/bayesopt/utils.py +0 -105
  77. ins_pricing/modelling/core/bayesopt/utils_backup.py +0 -1503
  78. ins_pricing/tests/production/test_predict.py +0 -233
  79. ins_pricing-0.4.5.dist-info/RECORD +0 -130
  80. /ins_pricing/modelling/{core/bayesopt → bayesopt}/config_components.py +0 -0
  81. /ins_pricing/modelling/{core/bayesopt → bayesopt}/models/model_ft_components.py +0 -0
  82. /ins_pricing/modelling/{core/bayesopt → bayesopt}/utils/distributed_utils.py +0 -0
  83. {ins_pricing-0.4.5.dist-info → ins_pricing-0.5.0.dist-info}/WHEEL +0 -0
  84. {ins_pricing-0.4.5.dist-info → ins_pricing-0.5.0.dist-info}/top_level.txt +0 -0
@@ -0,0 +1,228 @@
1
+ from __future__ import annotations
2
+
3
+ from typing import Iterable, List, Mapping, Optional, Sequence, Tuple
4
+
5
+ import numpy as np
6
+ import pandas as pd
7
+
8
+ from ins_pricing.modelling.plotting.common import PlotStyle, plt
9
+ from ins_pricing.modelling.plotting.curves import (
10
+ plot_double_lift_curve,
11
+ plot_lift_curve,
12
+ )
13
+
14
+
15
+ def _safe_tag(value: str) -> str:
16
+ return "".join(ch if ch.isalnum() or ch in "-_." else "_" for ch in str(value))
17
+
18
+
19
+ def _to_array(values: Sequence[float], name: str) -> np.ndarray:
20
+ if values is None:
21
+ raise ValueError(f"{name} is required.")
22
+ return np.asarray(values, dtype=float).reshape(-1)
23
+
24
+
25
+ def _resolve_pred_pairs_from_df(
26
+ df: pd.DataFrame,
27
+ pred_cols: Optional[Sequence[str] | Mapping[str, object]],
28
+ pred_labels: Optional[Sequence[str]],
29
+ ) -> List[Tuple[str, np.ndarray]]:
30
+ if pred_cols is None:
31
+ raise ValueError("pred_cols is required when data is a DataFrame.")
32
+
33
+ pairs: List[Tuple[str, np.ndarray]] = []
34
+ if isinstance(pred_cols, Mapping):
35
+ for label, col in pred_cols.items():
36
+ if isinstance(col, str) and col in df.columns:
37
+ arr = df[col].to_numpy()
38
+ else:
39
+ arr = np.asarray(col, dtype=float).reshape(-1)
40
+ pairs.append((str(label), arr))
41
+ return pairs
42
+
43
+ if isinstance(pred_cols, str):
44
+ label = pred_cols if not pred_labels else str(pred_labels[0])
45
+ return [(label, df[pred_cols].to_numpy())]
46
+
47
+ labels = list(pred_labels) if pred_labels else [str(c) for c in pred_cols]
48
+ for col, label in zip(pred_cols, labels):
49
+ if isinstance(col, str) and col in df.columns:
50
+ arr = df[col].to_numpy()
51
+ else:
52
+ arr = np.asarray(col, dtype=float).reshape(-1)
53
+ pairs.append((str(label), arr))
54
+ return pairs
55
+
56
+
57
+ def _resolve_pred_pairs_from_arrays(
58
+ preds: object,
59
+ pred_labels: Optional[Sequence[str]],
60
+ ) -> List[Tuple[str, np.ndarray]]:
61
+ if isinstance(preds, Mapping):
62
+ return [(str(k), np.asarray(v, dtype=float).reshape(-1)) for k, v in preds.items()]
63
+
64
+ if isinstance(preds, (list, tuple)):
65
+ labels = list(pred_labels) if pred_labels else [f"model_{idx + 1}" for idx in range(len(preds))]
66
+ return [
67
+ (str(label), np.asarray(arr, dtype=float).reshape(-1))
68
+ for label, arr in zip(labels, preds)
69
+ ]
70
+
71
+ return [("model_1", np.asarray(preds, dtype=float).reshape(-1))]
72
+
73
+
74
+ def plot_lift_list(
75
+ data_or_preds: pd.DataFrame | Mapping[str, object] | Sequence[object],
76
+ pred_cols: Optional[Sequence[str] | Mapping[str, object]] = None,
77
+ actual: Optional[Sequence[float]] = None,
78
+ weight: Optional[Sequence[float]] = None,
79
+ *,
80
+ actual_col: str = "w_act",
81
+ weight_col: str = "weight",
82
+ pred_labels: Optional[Sequence[str]] = None,
83
+ n_bins: int = 10,
84
+ pred_weighted: bool = False,
85
+ actual_weighted: bool = True,
86
+ show: bool = False,
87
+ save_dir: Optional[str] = None,
88
+ filename_prefix: str = "lift",
89
+ style: Optional[PlotStyle] = None,
90
+ ) -> List[plt.Figure]:
91
+ """Compatibility helper: plot multiple lift curves in one call."""
92
+ if isinstance(data_or_preds, pd.DataFrame):
93
+ df = data_or_preds
94
+ pairs = _resolve_pred_pairs_from_df(df, pred_cols, pred_labels)
95
+ actual_arr = _to_array(df[actual_col], actual_col) if actual is None else _to_array(actual, "actual")
96
+ weight_arr = None
97
+ if weight is not None:
98
+ weight_arr = _to_array(weight, "weight")
99
+ elif weight_col in df.columns:
100
+ weight_arr = _to_array(df[weight_col], weight_col)
101
+ else:
102
+ pairs = _resolve_pred_pairs_from_arrays(data_or_preds, pred_labels)
103
+ actual_arr = _to_array(actual, "actual")
104
+ weight_arr = _to_array(weight, "weight") if weight is not None else None
105
+
106
+ figs: List[plt.Figure] = []
107
+ for label, pred in pairs:
108
+ save_path = None
109
+ if save_dir:
110
+ safe_dir = save_dir.rstrip("/\\")
111
+ save_path = f"{safe_dir}/{filename_prefix}_{_safe_tag(label)}.png"
112
+ fig = plot_lift_curve(
113
+ pred,
114
+ actual_arr,
115
+ weight_arr,
116
+ n_bins=n_bins,
117
+ title=f"{label} Lift Chart",
118
+ pred_label="Predicted",
119
+ act_label="Actual",
120
+ weight_label="Earned Exposure",
121
+ pred_weighted=pred_weighted,
122
+ actual_weighted=actual_weighted,
123
+ show=show,
124
+ save_path=save_path,
125
+ style=style,
126
+ )
127
+ figs.append(fig)
128
+ return figs
129
+
130
+
131
+ def plot_dlift_list(
132
+ data_or_preds: pd.DataFrame | Mapping[str, object] | Sequence[object],
133
+ pred_cols: Optional[Sequence[str] | Mapping[str, object]] = None,
134
+ actual: Optional[Sequence[float]] = None,
135
+ weight: Optional[Sequence[float]] = None,
136
+ *,
137
+ actual_col: str = "w_act",
138
+ weight_col: str = "weight",
139
+ pred_labels: Optional[Sequence[str]] = None,
140
+ pairs: Optional[Iterable[Tuple[object, object]]] = None,
141
+ n_bins: int = 10,
142
+ pred_weighted: bool = False,
143
+ actual_weighted: bool = True,
144
+ show: bool = False,
145
+ save_dir: Optional[str] = None,
146
+ filename_prefix: str = "double_lift",
147
+ style: Optional[PlotStyle] = None,
148
+ ) -> List[plt.Figure]:
149
+ """Compatibility helper: plot double-lift curves for multiple model pairs."""
150
+ if isinstance(data_or_preds, pd.DataFrame):
151
+ df = data_or_preds
152
+ pairs_list = _resolve_pred_pairs_from_df(df, pred_cols, pred_labels)
153
+ actual_arr = _to_array(df[actual_col], actual_col) if actual is None else _to_array(actual, "actual")
154
+ weight_arr = None
155
+ if weight is not None:
156
+ weight_arr = _to_array(weight, "weight")
157
+ elif weight_col in df.columns:
158
+ weight_arr = _to_array(df[weight_col], weight_col)
159
+ else:
160
+ pairs_list = _resolve_pred_pairs_from_arrays(data_or_preds, pred_labels)
161
+ actual_arr = _to_array(actual, "actual")
162
+ weight_arr = _to_array(weight, "weight") if weight is not None else None
163
+
164
+ pred_map = {label: arr for label, arr in pairs_list}
165
+ labels = [label for label, _ in pairs_list]
166
+
167
+ pair_labels: List[Tuple[str, str]] = []
168
+ if pairs is None:
169
+ for idx, first in enumerate(labels):
170
+ for second in labels[idx + 1 :]:
171
+ pair_labels.append((first, second))
172
+ else:
173
+ for left, right in pairs:
174
+ if isinstance(left, int):
175
+ left_label = labels[left]
176
+ else:
177
+ left_label = str(left)
178
+ if isinstance(right, int):
179
+ right_label = labels[right]
180
+ else:
181
+ right_label = str(right)
182
+ pair_labels.append((left_label, right_label))
183
+
184
+ figs: List[plt.Figure] = []
185
+ for label1, label2 in pair_labels:
186
+ pred1 = pred_map.get(label1)
187
+ pred2 = pred_map.get(label2)
188
+ if pred1 is None or pred2 is None:
189
+ continue
190
+ save_path = None
191
+ if save_dir:
192
+ safe_dir = save_dir.rstrip("/\\")
193
+ tag = f"{_safe_tag(label1)}_vs_{_safe_tag(label2)}"
194
+ save_path = f"{safe_dir}/{filename_prefix}_{tag}.png"
195
+ fig = plot_double_lift_curve(
196
+ pred1,
197
+ pred2,
198
+ actual_arr,
199
+ weight_arr,
200
+ n_bins=n_bins,
201
+ title=f"Double Lift: {label1} vs {label2}",
202
+ label1=label1,
203
+ label2=label2,
204
+ pred1_weighted=pred_weighted,
205
+ pred2_weighted=pred_weighted,
206
+ actual_weighted=actual_weighted,
207
+ show=show,
208
+ save_path=save_path,
209
+ style=style,
210
+ )
211
+ figs.append(fig)
212
+ return figs
213
+
214
+
215
+ class PlotUtils:
216
+ """Compatibility wrapper for legacy plotting helpers."""
217
+
218
+ plot_lift_curve = staticmethod(plot_lift_curve)
219
+ plot_double_lift_curve = staticmethod(plot_double_lift_curve)
220
+ plot_lift_list = staticmethod(plot_lift_list)
221
+ plot_dlift_list = staticmethod(plot_dlift_list)
222
+
223
+
224
+ __all__ = [
225
+ "PlotUtils",
226
+ "plot_lift_list",
227
+ "plot_dlift_list",
228
+ ]