wavetrainer 0.0.50__tar.gz → 0.0.51__tar.gz
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- {wavetrainer-0.0.50/wavetrainer.egg-info → wavetrainer-0.0.51}/PKG-INFO +1 -1
- {wavetrainer-0.0.50 → wavetrainer-0.0.51}/setup.py +1 -1
- {wavetrainer-0.0.50 → wavetrainer-0.0.51}/wavetrainer/__init__.py +1 -1
- {wavetrainer-0.0.50 → wavetrainer-0.0.51}/wavetrainer/model/model_router.py +52 -2
- {wavetrainer-0.0.50 → wavetrainer-0.0.51}/wavetrainer/model/xgboost/xgboost_model.py +4 -1
- {wavetrainer-0.0.50 → wavetrainer-0.0.51/wavetrainer.egg-info}/PKG-INFO +1 -1
- {wavetrainer-0.0.50 → wavetrainer-0.0.51}/LICENSE +0 -0
- {wavetrainer-0.0.50 → wavetrainer-0.0.51}/MANIFEST.in +0 -0
- {wavetrainer-0.0.50 → wavetrainer-0.0.51}/README.md +0 -0
- {wavetrainer-0.0.50 → wavetrainer-0.0.51}/requirements.txt +0 -0
- {wavetrainer-0.0.50 → wavetrainer-0.0.51}/setup.cfg +0 -0
- {wavetrainer-0.0.50 → wavetrainer-0.0.51}/tests/__init__.py +0 -0
- {wavetrainer-0.0.50 → wavetrainer-0.0.51}/tests/model/__init__.py +0 -0
- {wavetrainer-0.0.50 → wavetrainer-0.0.51}/tests/model/catboost_kwargs_test.py +0 -0
- {wavetrainer-0.0.50 → wavetrainer-0.0.51}/tests/trainer_test.py +0 -0
- {wavetrainer-0.0.50 → wavetrainer-0.0.51}/wavetrainer/calibrator/__init__.py +0 -0
- {wavetrainer-0.0.50 → wavetrainer-0.0.51}/wavetrainer/calibrator/calibrator.py +0 -0
- {wavetrainer-0.0.50 → wavetrainer-0.0.51}/wavetrainer/calibrator/calibrator_router.py +0 -0
- {wavetrainer-0.0.50 → wavetrainer-0.0.51}/wavetrainer/calibrator/mapie_calibrator.py +0 -0
- {wavetrainer-0.0.50 → wavetrainer-0.0.51}/wavetrainer/calibrator/vennabers_calibrator.py +0 -0
- {wavetrainer-0.0.50 → wavetrainer-0.0.51}/wavetrainer/create.py +0 -0
- {wavetrainer-0.0.50 → wavetrainer-0.0.51}/wavetrainer/exceptions.py +0 -0
- {wavetrainer-0.0.50 → wavetrainer-0.0.51}/wavetrainer/fit.py +0 -0
- {wavetrainer-0.0.50 → wavetrainer-0.0.51}/wavetrainer/model/__init__.py +0 -0
- {wavetrainer-0.0.50 → wavetrainer-0.0.51}/wavetrainer/model/catboost/__init__.py +0 -0
- {wavetrainer-0.0.50 → wavetrainer-0.0.51}/wavetrainer/model/catboost/catboost_classifier_wrap.py +0 -0
- {wavetrainer-0.0.50 → wavetrainer-0.0.51}/wavetrainer/model/catboost/catboost_kwargs.py +0 -0
- {wavetrainer-0.0.50 → wavetrainer-0.0.51}/wavetrainer/model/catboost/catboost_model.py +0 -0
- {wavetrainer-0.0.50 → wavetrainer-0.0.51}/wavetrainer/model/catboost/catboost_regressor_wrap.py +0 -0
- {wavetrainer-0.0.50 → wavetrainer-0.0.51}/wavetrainer/model/model.py +0 -0
- {wavetrainer-0.0.50 → wavetrainer-0.0.51}/wavetrainer/model/tabpfn/__init__.py +0 -0
- {wavetrainer-0.0.50 → wavetrainer-0.0.51}/wavetrainer/model/tabpfn/tabpfn_model.py +0 -0
- {wavetrainer-0.0.50 → wavetrainer-0.0.51}/wavetrainer/model/xgboost/__init__.py +0 -0
- {wavetrainer-0.0.50 → wavetrainer-0.0.51}/wavetrainer/model/xgboost/early_stopper.py +0 -0
- {wavetrainer-0.0.50 → wavetrainer-0.0.51}/wavetrainer/model/xgboost/xgboost_logger.py +0 -0
- {wavetrainer-0.0.50 → wavetrainer-0.0.51}/wavetrainer/model_type.py +0 -0
- {wavetrainer-0.0.50 → wavetrainer-0.0.51}/wavetrainer/params.py +0 -0
- {wavetrainer-0.0.50 → wavetrainer-0.0.51}/wavetrainer/reducer/__init__.py +0 -0
- {wavetrainer-0.0.50 → wavetrainer-0.0.51}/wavetrainer/reducer/base_selector_reducer.py +0 -0
- {wavetrainer-0.0.50 → wavetrainer-0.0.51}/wavetrainer/reducer/combined_reducer.py +0 -0
- {wavetrainer-0.0.50 → wavetrainer-0.0.51}/wavetrainer/reducer/constant_reducer.py +0 -0
- {wavetrainer-0.0.50 → wavetrainer-0.0.51}/wavetrainer/reducer/correlation_reducer.py +0 -0
- {wavetrainer-0.0.50 → wavetrainer-0.0.51}/wavetrainer/reducer/duplicate_reducer.py +0 -0
- {wavetrainer-0.0.50 → wavetrainer-0.0.51}/wavetrainer/reducer/non_categorical_numeric_columns.py +0 -0
- {wavetrainer-0.0.50 → wavetrainer-0.0.51}/wavetrainer/reducer/nonnumeric_reducer.py +0 -0
- {wavetrainer-0.0.50 → wavetrainer-0.0.51}/wavetrainer/reducer/pca_reducer.py +0 -0
- {wavetrainer-0.0.50 → wavetrainer-0.0.51}/wavetrainer/reducer/reducer.py +0 -0
- {wavetrainer-0.0.50 → wavetrainer-0.0.51}/wavetrainer/reducer/select_by_single_feature_performance_reducer.py +0 -0
- {wavetrainer-0.0.50 → wavetrainer-0.0.51}/wavetrainer/reducer/smart_correlation_reducer.py +0 -0
- {wavetrainer-0.0.50 → wavetrainer-0.0.51}/wavetrainer/reducer/unseen_reducer.py +0 -0
- {wavetrainer-0.0.50 → wavetrainer-0.0.51}/wavetrainer/selector/__init__.py +0 -0
- {wavetrainer-0.0.50 → wavetrainer-0.0.51}/wavetrainer/selector/selector.py +0 -0
- {wavetrainer-0.0.50 → wavetrainer-0.0.51}/wavetrainer/trainer.py +0 -0
- {wavetrainer-0.0.50 → wavetrainer-0.0.51}/wavetrainer/weights/__init__.py +0 -0
- {wavetrainer-0.0.50 → wavetrainer-0.0.51}/wavetrainer/weights/class_weights.py +0 -0
- {wavetrainer-0.0.50 → wavetrainer-0.0.51}/wavetrainer/weights/combined_weights.py +0 -0
- {wavetrainer-0.0.50 → wavetrainer-0.0.51}/wavetrainer/weights/exponential_weights.py +0 -0
- {wavetrainer-0.0.50 → wavetrainer-0.0.51}/wavetrainer/weights/linear_weights.py +0 -0
- {wavetrainer-0.0.50 → wavetrainer-0.0.51}/wavetrainer/weights/noop_weights.py +0 -0
- {wavetrainer-0.0.50 → wavetrainer-0.0.51}/wavetrainer/weights/sigmoid_weights.py +0 -0
- {wavetrainer-0.0.50 → wavetrainer-0.0.51}/wavetrainer/weights/weights.py +0 -0
- {wavetrainer-0.0.50 → wavetrainer-0.0.51}/wavetrainer/weights/weights_router.py +0 -0
- {wavetrainer-0.0.50 → wavetrainer-0.0.51}/wavetrainer/windower/__init__.py +0 -0
- {wavetrainer-0.0.50 → wavetrainer-0.0.51}/wavetrainer/windower/windower.py +0 -0
- {wavetrainer-0.0.50 → wavetrainer-0.0.51}/wavetrainer.egg-info/SOURCES.txt +0 -0
- {wavetrainer-0.0.50 → wavetrainer-0.0.51}/wavetrainer.egg-info/dependency_links.txt +0 -0
- {wavetrainer-0.0.50 → wavetrainer-0.0.51}/wavetrainer.egg-info/not-zip-safe +0 -0
- {wavetrainer-0.0.50 → wavetrainer-0.0.51}/wavetrainer.egg-info/requires.txt +0 -0
- {wavetrainer-0.0.50 → wavetrainer-0.0.51}/wavetrainer.egg-info/top_level.txt +0 -0
@@ -23,7 +23,7 @@ def install_requires() -> typing.List[str]:
|
|
23
23
|
|
24
24
|
setup(
|
25
25
|
name='wavetrainer',
|
26
|
-
version='0.0.
|
26
|
+
version='0.0.51',
|
27
27
|
description='A library for automatically finding the optimal model within feature and hyperparameter space.',
|
28
28
|
long_description=long_description,
|
29
29
|
long_description_content_type='text/markdown',
|
@@ -1,19 +1,23 @@
|
|
1
1
|
"""A model class that routes to other models."""
|
2
2
|
|
3
|
+
import functools
|
3
4
|
import json
|
4
5
|
import os
|
5
6
|
from typing import Self
|
6
7
|
|
7
8
|
import optuna
|
8
9
|
import pandas as pd
|
10
|
+
from sklearn.metrics import accuracy_score # type: ignore
|
9
11
|
|
12
|
+
from ..model_type import ModelType, determine_model_type
|
10
13
|
from .catboost.catboost_model import CatboostModel
|
11
|
-
from .model import Model
|
14
|
+
from .model import PREDICTION_COLUMN, PROBABILITY_COLUMN_PREFIX, Model
|
12
15
|
from .tabpfn.tabpfn_model import TabPFNModel
|
13
16
|
from .xgboost.xgboost_model import XGBoostModel
|
14
17
|
|
15
18
|
_MODEL_ROUTER_FILE = "model_router.json"
|
16
19
|
_MODEL_KEY = "model"
|
20
|
+
_FALSE_POSITIVE_REDUCTION_STEPS_KEY = "false_positive_reduction_steps"
|
17
21
|
_MODELS = {
|
18
22
|
CatboostModel.name(): CatboostModel,
|
19
23
|
TabPFNModel.name(): TabPFNModel,
|
@@ -27,10 +31,12 @@ class ModelRouter(Model):
|
|
27
31
|
# pylint: disable=too-many-positional-arguments,too-many-arguments
|
28
32
|
|
29
33
|
_model: Model | None
|
34
|
+
_false_positive_reduction_steps: int | None
|
30
35
|
|
31
36
|
def __init__(self) -> None:
|
32
37
|
super().__init__()
|
33
38
|
self._model = None
|
39
|
+
self._false_positive_reduction_steps = None
|
34
40
|
|
35
41
|
@classmethod
|
36
42
|
def name(cls) -> str:
|
@@ -81,6 +87,9 @@ class ModelRouter(Model):
|
|
81
87
|
def set_options(
|
82
88
|
self, trial: optuna.Trial | optuna.trial.FrozenTrial, df: pd.DataFrame
|
83
89
|
) -> None:
|
90
|
+
self._false_positive_reduction_steps = trial.suggest_int(
|
91
|
+
_FALSE_POSITIVE_REDUCTION_STEPS_KEY, 0, 5
|
92
|
+
)
|
84
93
|
model_name = trial.suggest_categorical(
|
85
94
|
"model", [k for k, v in _MODELS.items() if v.supports_x(df)]
|
86
95
|
)
|
@@ -122,7 +131,48 @@ class ModelRouter(Model):
|
|
122
131
|
model = self._model
|
123
132
|
if model is None:
|
124
133
|
raise ValueError("model is null")
|
125
|
-
|
134
|
+
false_positive_reduction_steps = self._false_positive_reduction_steps
|
135
|
+
if false_positive_reduction_steps is None:
|
136
|
+
false_positive_reduction_steps = 0
|
137
|
+
for i in range(max(false_positive_reduction_steps, 1)):
|
138
|
+
print(f"False Positive Reduction Step: {i + 1}")
|
139
|
+
pred = model.fit_transform(df, y=y, w=w, eval_x=eval_x, eval_y=eval_y)
|
140
|
+
if (
|
141
|
+
w is None
|
142
|
+
or y is None
|
143
|
+
or determine_model_type(y) == ModelType.REGRESSION
|
144
|
+
):
|
145
|
+
break
|
146
|
+
print(f"Accuracy: {accuracy_score(y, pred[PREDICTION_COLUMN])}")
|
147
|
+
pred["__wavetrain_correct"] = pred[PREDICTION_COLUMN] != y
|
148
|
+
pred["__wavetrain_error_weight"] = pred["__wavetrain_correct"].astype(float)
|
149
|
+
prob_columns = sorted(
|
150
|
+
[
|
151
|
+
x
|
152
|
+
for x in pred.columns.values.tolist()
|
153
|
+
if x.startswith(PROBABILITY_COLUMN_PREFIX)
|
154
|
+
]
|
155
|
+
)
|
156
|
+
if prob_columns:
|
157
|
+
|
158
|
+
def determine_error_weight(
|
159
|
+
row: pd.Series, prob_columns: list[str]
|
160
|
+
) -> float:
|
161
|
+
nonlocal y
|
162
|
+
if not row["__wavetrain_correct"]:
|
163
|
+
return abs(row[prob_columns[1 - int(y.loc[row.name])]]) # type: ignore
|
164
|
+
return 0.0
|
165
|
+
|
166
|
+
pred["__wavetrain_error_weight"] = pred.apply(
|
167
|
+
functools.partial(
|
168
|
+
determine_error_weight,
|
169
|
+
prob_columns=prob_columns,
|
170
|
+
),
|
171
|
+
axis=1,
|
172
|
+
)
|
173
|
+
w += pred["__wavetrain_error_weight"]
|
174
|
+
w = w.clip(lower=0.0)
|
175
|
+
|
126
176
|
return self
|
127
177
|
|
128
178
|
def transform(self, df: pd.DataFrame) -> pd.DataFrame:
|
@@ -125,7 +125,10 @@ class XGBoostModel(Model):
|
|
125
125
|
try:
|
126
126
|
score_dict = bst.get_booster().get_score(importance_type="weight") # type: ignore
|
127
127
|
total = sum(score_dict.values()) # type: ignore
|
128
|
-
return {
|
128
|
+
return {
|
129
|
+
k: 0.0 if total == 0.0 else v / total # type: ignore
|
130
|
+
for k, v in score_dict.items() # type: ignore
|
131
|
+
} # type: ignore
|
129
132
|
except XGBoostError as exc:
|
130
133
|
print(str(exc))
|
131
134
|
return {}
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
{wavetrainer-0.0.50 → wavetrainer-0.0.51}/wavetrainer/model/catboost/catboost_classifier_wrap.py
RENAMED
File without changes
|
File without changes
|
File without changes
|
{wavetrainer-0.0.50 → wavetrainer-0.0.51}/wavetrainer/model/catboost/catboost_regressor_wrap.py
RENAMED
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
{wavetrainer-0.0.50 → wavetrainer-0.0.51}/wavetrainer/reducer/non_categorical_numeric_columns.py
RENAMED
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|