wavetrainer 0.1.6__tar.gz → 0.1.8__tar.gz
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- {wavetrainer-0.1.6/wavetrainer.egg-info → wavetrainer-0.1.8}/PKG-INFO +1 -1
- {wavetrainer-0.1.6 → wavetrainer-0.1.8}/setup.py +1 -1
- {wavetrainer-0.1.6 → wavetrainer-0.1.8}/wavetrainer/__init__.py +1 -1
- {wavetrainer-0.1.6 → wavetrainer-0.1.8}/wavetrainer/create.py +2 -0
- {wavetrainer-0.1.6 → wavetrainer-0.1.8}/wavetrainer/model/catboost/catboost_model.py +1 -1
- {wavetrainer-0.1.6 → wavetrainer-0.1.8}/wavetrainer/model/model_router.py +10 -2
- {wavetrainer-0.1.6 → wavetrainer-0.1.8}/wavetrainer/reducer/pca_reducer.py +1 -1
- {wavetrainer-0.1.6 → wavetrainer-0.1.8}/wavetrainer/trainer.py +5 -3
- {wavetrainer-0.1.6 → wavetrainer-0.1.8/wavetrainer.egg-info}/PKG-INFO +1 -1
- {wavetrainer-0.1.6 → wavetrainer-0.1.8}/LICENSE +0 -0
- {wavetrainer-0.1.6 → wavetrainer-0.1.8}/MANIFEST.in +0 -0
- {wavetrainer-0.1.6 → wavetrainer-0.1.8}/README.md +0 -0
- {wavetrainer-0.1.6 → wavetrainer-0.1.8}/requirements.txt +0 -0
- {wavetrainer-0.1.6 → wavetrainer-0.1.8}/setup.cfg +0 -0
- {wavetrainer-0.1.6 → wavetrainer-0.1.8}/tests/__init__.py +0 -0
- {wavetrainer-0.1.6 → wavetrainer-0.1.8}/tests/model/__init__.py +0 -0
- {wavetrainer-0.1.6 → wavetrainer-0.1.8}/tests/model/catboost_kwargs_test.py +0 -0
- {wavetrainer-0.1.6 → wavetrainer-0.1.8}/tests/trainer_test.py +0 -0
- {wavetrainer-0.1.6 → wavetrainer-0.1.8}/wavetrainer/calibrator/__init__.py +0 -0
- {wavetrainer-0.1.6 → wavetrainer-0.1.8}/wavetrainer/calibrator/calibrator.py +0 -0
- {wavetrainer-0.1.6 → wavetrainer-0.1.8}/wavetrainer/calibrator/calibrator_router.py +0 -0
- {wavetrainer-0.1.6 → wavetrainer-0.1.8}/wavetrainer/calibrator/vennabers_calibrator.py +0 -0
- {wavetrainer-0.1.6 → wavetrainer-0.1.8}/wavetrainer/exceptions.py +0 -0
- {wavetrainer-0.1.6 → wavetrainer-0.1.8}/wavetrainer/fit.py +0 -0
- {wavetrainer-0.1.6 → wavetrainer-0.1.8}/wavetrainer/model/__init__.py +0 -0
- {wavetrainer-0.1.6 → wavetrainer-0.1.8}/wavetrainer/model/catboost/__init__.py +0 -0
- {wavetrainer-0.1.6 → wavetrainer-0.1.8}/wavetrainer/model/catboost/catboost_classifier_wrap.py +0 -0
- {wavetrainer-0.1.6 → wavetrainer-0.1.8}/wavetrainer/model/catboost/catboost_kwargs.py +0 -0
- {wavetrainer-0.1.6 → wavetrainer-0.1.8}/wavetrainer/model/catboost/catboost_regressor_wrap.py +0 -0
- {wavetrainer-0.1.6 → wavetrainer-0.1.8}/wavetrainer/model/model.py +0 -0
- {wavetrainer-0.1.6 → wavetrainer-0.1.8}/wavetrainer/model/tabpfn/__init__.py +0 -0
- {wavetrainer-0.1.6 → wavetrainer-0.1.8}/wavetrainer/model/tabpfn/tabpfn_model.py +0 -0
- {wavetrainer-0.1.6 → wavetrainer-0.1.8}/wavetrainer/model/xgboost/__init__.py +0 -0
- {wavetrainer-0.1.6 → wavetrainer-0.1.8}/wavetrainer/model/xgboost/early_stopper.py +0 -0
- {wavetrainer-0.1.6 → wavetrainer-0.1.8}/wavetrainer/model/xgboost/xgboost_logger.py +0 -0
- {wavetrainer-0.1.6 → wavetrainer-0.1.8}/wavetrainer/model/xgboost/xgboost_model.py +0 -0
- {wavetrainer-0.1.6 → wavetrainer-0.1.8}/wavetrainer/model_type.py +0 -0
- {wavetrainer-0.1.6 → wavetrainer-0.1.8}/wavetrainer/params.py +0 -0
- {wavetrainer-0.1.6 → wavetrainer-0.1.8}/wavetrainer/reducer/__init__.py +0 -0
- {wavetrainer-0.1.6 → wavetrainer-0.1.8}/wavetrainer/reducer/base_selector_reducer.py +0 -0
- {wavetrainer-0.1.6 → wavetrainer-0.1.8}/wavetrainer/reducer/combined_reducer.py +0 -0
- {wavetrainer-0.1.6 → wavetrainer-0.1.8}/wavetrainer/reducer/constant_reducer.py +0 -0
- {wavetrainer-0.1.6 → wavetrainer-0.1.8}/wavetrainer/reducer/correlation_reducer.py +0 -0
- {wavetrainer-0.1.6 → wavetrainer-0.1.8}/wavetrainer/reducer/duplicate_reducer.py +0 -0
- {wavetrainer-0.1.6 → wavetrainer-0.1.8}/wavetrainer/reducer/non_categorical_numeric_columns.py +0 -0
- {wavetrainer-0.1.6 → wavetrainer-0.1.8}/wavetrainer/reducer/nonnumeric_reducer.py +0 -0
- {wavetrainer-0.1.6 → wavetrainer-0.1.8}/wavetrainer/reducer/reducer.py +0 -0
- {wavetrainer-0.1.6 → wavetrainer-0.1.8}/wavetrainer/reducer/select_by_single_feature_performance_reducer.py +0 -0
- {wavetrainer-0.1.6 → wavetrainer-0.1.8}/wavetrainer/reducer/smart_correlation_reducer.py +0 -0
- {wavetrainer-0.1.6 → wavetrainer-0.1.8}/wavetrainer/reducer/unseen_reducer.py +0 -0
- {wavetrainer-0.1.6 → wavetrainer-0.1.8}/wavetrainer/selector/__init__.py +0 -0
- {wavetrainer-0.1.6 → wavetrainer-0.1.8}/wavetrainer/selector/selector.py +0 -0
- {wavetrainer-0.1.6 → wavetrainer-0.1.8}/wavetrainer/weights/__init__.py +0 -0
- {wavetrainer-0.1.6 → wavetrainer-0.1.8}/wavetrainer/weights/class_weights.py +0 -0
- {wavetrainer-0.1.6 → wavetrainer-0.1.8}/wavetrainer/weights/combined_weights.py +0 -0
- {wavetrainer-0.1.6 → wavetrainer-0.1.8}/wavetrainer/weights/exponential_weights.py +0 -0
- {wavetrainer-0.1.6 → wavetrainer-0.1.8}/wavetrainer/weights/linear_weights.py +0 -0
- {wavetrainer-0.1.6 → wavetrainer-0.1.8}/wavetrainer/weights/noop_weights.py +0 -0
- {wavetrainer-0.1.6 → wavetrainer-0.1.8}/wavetrainer/weights/sigmoid_weights.py +0 -0
- {wavetrainer-0.1.6 → wavetrainer-0.1.8}/wavetrainer/weights/weights.py +0 -0
- {wavetrainer-0.1.6 → wavetrainer-0.1.8}/wavetrainer/weights/weights_router.py +0 -0
- {wavetrainer-0.1.6 → wavetrainer-0.1.8}/wavetrainer/windower/__init__.py +0 -0
- {wavetrainer-0.1.6 → wavetrainer-0.1.8}/wavetrainer/windower/windower.py +0 -0
- {wavetrainer-0.1.6 → wavetrainer-0.1.8}/wavetrainer.egg-info/SOURCES.txt +0 -0
- {wavetrainer-0.1.6 → wavetrainer-0.1.8}/wavetrainer.egg-info/dependency_links.txt +0 -0
- {wavetrainer-0.1.6 → wavetrainer-0.1.8}/wavetrainer.egg-info/not-zip-safe +0 -0
- {wavetrainer-0.1.6 → wavetrainer-0.1.8}/wavetrainer.egg-info/requires.txt +0 -0
- {wavetrainer-0.1.6 → wavetrainer-0.1.8}/wavetrainer.egg-info/top_level.txt +0 -0
@@ -23,7 +23,7 @@ def install_requires() -> typing.List[str]:
|
|
23
23
|
|
24
24
|
setup(
|
25
25
|
name='wavetrainer',
|
26
|
-
version='0.1.
|
26
|
+
version='0.1.8',
|
27
27
|
description='A library for automatically finding the optimal model within feature and hyperparameter space.',
|
28
28
|
long_description=long_description,
|
29
29
|
long_description_content_type='text/markdown',
|
@@ -16,6 +16,7 @@ def create(
|
|
16
16
|
max_train_timeout: datetime.timedelta | None = None,
|
17
17
|
cutoff_dt: datetime.datetime | None = None,
|
18
18
|
embedding_cols: list[list[str]] | None = None,
|
19
|
+
allowed_models: set[str] | None = None,
|
19
20
|
) -> Trainer:
|
20
21
|
"""Create a trainer."""
|
21
22
|
return Trainer(
|
@@ -27,4 +28,5 @@ def create(
|
|
27
28
|
max_train_timeout=max_train_timeout,
|
28
29
|
cutoff_dt=cutoff_dt,
|
29
30
|
embedding_cols=embedding_cols,
|
31
|
+
allowed_models=allowed_models,
|
30
32
|
)
|
@@ -123,7 +123,7 @@ class CatboostModel(Model):
|
|
123
123
|
self._early_stopping_rounds = trial.suggest_int(_EARLY_STOPPING_ROUNDS, 10, 500)
|
124
124
|
self._best_iteration = trial.user_attrs.get(_BEST_ITERATION_KEY)
|
125
125
|
loss_functions = [_DEFAULT_LOSS_FUNCTION]
|
126
|
-
if torch.cuda.is_available():
|
126
|
+
if not torch.cuda.is_available():
|
127
127
|
loss_functions.append(_FOCALLOSS_LOSS_FUNCTION)
|
128
128
|
loss_function = trial.suggest_categorical(_LOSS_FUNCTION_KEY, loss_functions)
|
129
129
|
self._loss_function = loss_function
|
@@ -33,10 +33,13 @@ class ModelRouter(Model):
|
|
33
33
|
_model: Model | None
|
34
34
|
_false_positive_reduction_steps: int | None
|
35
35
|
|
36
|
-
def __init__(self) -> None:
|
36
|
+
def __init__(self, allowed_models: set[str] | None) -> None:
|
37
37
|
super().__init__()
|
38
38
|
self._model = None
|
39
39
|
self._false_positive_reduction_steps = None
|
40
|
+
self._allowed_models = (
|
41
|
+
allowed_models if allowed_models is not None else set(_MODELS.keys())
|
42
|
+
)
|
40
43
|
|
41
44
|
@classmethod
|
42
45
|
def name(cls) -> str:
|
@@ -91,7 +94,12 @@ class ModelRouter(Model):
|
|
91
94
|
_FALSE_POSITIVE_REDUCTION_STEPS_KEY, 0, 5
|
92
95
|
)
|
93
96
|
model_name = trial.suggest_categorical(
|
94
|
-
"model",
|
97
|
+
"model",
|
98
|
+
[
|
99
|
+
k
|
100
|
+
for k, v in _MODELS.items()
|
101
|
+
if v.supports_x(df) and k in self._allowed_models
|
102
|
+
],
|
95
103
|
)
|
96
104
|
print(f"Using {model_name} model")
|
97
105
|
model = _MODELS[model_name]()
|
@@ -72,7 +72,7 @@ class PCAReducer(Reducer):
|
|
72
72
|
for k, v in self._pcas.items():
|
73
73
|
cols = self._embedding_dict[k]
|
74
74
|
compressed_embedding = v.transform(df[cols].fillna(0.0))
|
75
|
-
embedding_len = compressed_embedding.shape[
|
75
|
+
embedding_len = compressed_embedding.shape[1]
|
76
76
|
df[cols[:embedding_len]] = compressed_embedding
|
77
77
|
df = df.drop(columns=cols[embedding_len:])
|
78
78
|
return df
|
@@ -64,6 +64,7 @@ class Trainer(Fit):
|
|
64
64
|
max_train_timeout: datetime.timedelta | None = None,
|
65
65
|
cutoff_dt: datetime.datetime | None = None,
|
66
66
|
embedding_cols: list[list[str]] | None = None,
|
67
|
+
allowed_models: set[str] | None = None,
|
67
68
|
):
|
68
69
|
tqdm.tqdm.pandas()
|
69
70
|
|
@@ -155,6 +156,7 @@ class Trainer(Fit):
|
|
155
156
|
self._max_train_timeout = max_train_timeout
|
156
157
|
self._cutoff_dt = cutoff_dt
|
157
158
|
self.embedding_cols = embedding_cols
|
159
|
+
self._allowed_models = allowed_models
|
158
160
|
|
159
161
|
def _provide_study(self, column: str) -> optuna.Study:
|
160
162
|
storage_name = f"sqlite:///{self._folder}/{column}/{_STUDYDB_FILENAME}"
|
@@ -265,7 +267,7 @@ class Trainer(Fit):
|
|
265
267
|
print(f"Row weights took {time.time() - start_row_weights}")
|
266
268
|
|
267
269
|
# Create model
|
268
|
-
model = ModelRouter()
|
270
|
+
model = ModelRouter(self._allowed_models)
|
269
271
|
model.set_options(trial, x)
|
270
272
|
|
271
273
|
# Train
|
@@ -517,7 +519,7 @@ class Trainer(Fit):
|
|
517
519
|
reducer = CombinedReducer(self.embedding_cols)
|
518
520
|
reducer.load(folder)
|
519
521
|
|
520
|
-
model = ModelRouter()
|
522
|
+
model = ModelRouter(None)
|
521
523
|
model.load(folder)
|
522
524
|
|
523
525
|
selector = Selector(model)
|
@@ -570,7 +572,7 @@ class Trainer(Fit):
|
|
570
572
|
if not os.path.isdir(date_path):
|
571
573
|
continue
|
572
574
|
try:
|
573
|
-
model = ModelRouter()
|
575
|
+
model = ModelRouter(None)
|
574
576
|
model.load(date_path)
|
575
577
|
feature_importances[date_str] = model.feature_importances
|
576
578
|
except FileNotFoundError as exc:
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
{wavetrainer-0.1.6 → wavetrainer-0.1.8}/wavetrainer/model/catboost/catboost_classifier_wrap.py
RENAMED
File without changes
|
File without changes
|
{wavetrainer-0.1.6 → wavetrainer-0.1.8}/wavetrainer/model/catboost/catboost_regressor_wrap.py
RENAMED
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
{wavetrainer-0.1.6 → wavetrainer-0.1.8}/wavetrainer/reducer/non_categorical_numeric_columns.py
RENAMED
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|