upgini 1.2.9a1__py3-none-any.whl → 1.2.9a3__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Potentially problematic release.
This version of upgini might be problematic. Click here for more details.
- upgini/__about__.py +1 -1
- upgini/__init__.py +2 -2
- upgini/features_enricher.py +2 -2
- upgini/metrics.py +1 -1
- upgini/utils/features_validator.py +3 -2
- {upgini-1.2.9a1.dist-info → upgini-1.2.9a3.dist-info}/METADATA +1 -2
- {upgini-1.2.9a1.dist-info → upgini-1.2.9a3.dist-info}/RECORD +9 -9
- {upgini-1.2.9a1.dist-info → upgini-1.2.9a3.dist-info}/WHEEL +0 -0
- {upgini-1.2.9a1.dist-info → upgini-1.2.9a3.dist-info}/licenses/LICENSE +0 -0
upgini/__about__.py
CHANGED
|
@@ -1 +1 @@
|
|
|
1
|
-
__version__ = "1.2.9a1"
|
|
1
|
+
__version__ = "1.2.9a3"
|
upgini/__init__.py
CHANGED
|
@@ -1,7 +1,7 @@
|
|
|
1
1
|
import os
|
|
2
2
|
|
|
3
|
-
|
|
4
|
-
|
|
3
|
+
from upgini.features_enricher import FeaturesEnricher # noqa: F401
|
|
4
|
+
from upgini.metadata import SearchKey, CVType, RuntimeParameters, ModelTaskType # noqa: F401
|
|
5
5
|
# from .lazy_import import LazyImport
|
|
6
6
|
|
|
7
7
|
os.environ["SETUPTOOLS_USE_DISTUTILS"] = "stdlib"
|
upgini/features_enricher.py
CHANGED
|
@@ -2531,7 +2531,7 @@ class FeaturesEnricher(TransformerMixin):
|
|
|
2531
2531
|
features_columns = [c for c in df.columns if c not in non_feature_columns]
|
|
2532
2532
|
|
|
2533
2533
|
features_to_drop = FeaturesValidator(self.logger).validate(
|
|
2534
|
-
df, features_columns, self.generate_features, self.warning_counter
|
|
2534
|
+
df, features_columns, self.generate_features, columns_renaming, self.warning_counter
|
|
2535
2535
|
)
|
|
2536
2536
|
self.fit_dropped_features.update(features_to_drop)
|
|
2537
2537
|
df = df.drop(columns=features_to_drop)
|
|
@@ -2657,7 +2657,7 @@ class FeaturesEnricher(TransformerMixin):
|
|
|
2657
2657
|
and len(self._search_task.unused_features_for_generation) > 0
|
|
2658
2658
|
):
|
|
2659
2659
|
unused_features_for_generation = [
|
|
2660
|
-
|
|
2660
|
+
columns_renaming.get(col) or col for col in self._search_task.unused_features_for_generation
|
|
2661
2661
|
]
|
|
2662
2662
|
msg = self.bundle.get("features_not_generated").format(unused_features_for_generation)
|
|
2663
2663
|
self.logger.warning(msg)
|
upgini/metrics.py
CHANGED
|
@@ -10,7 +10,6 @@ import catboost
|
|
|
10
10
|
import numpy as np
|
|
11
11
|
import pandas as pd
|
|
12
12
|
from catboost import CatBoostClassifier, CatBoostRegressor
|
|
13
|
-
from lightgbm import LGBMClassifier, LGBMRegressor
|
|
14
13
|
from numpy import log1p
|
|
15
14
|
from pandas.api.types import is_numeric_dtype
|
|
16
15
|
from sklearn.metrics import check_scoring, get_scorer, make_scorer, roc_auc_score
|
|
@@ -406,6 +405,7 @@ class EstimatorWrapper:
|
|
|
406
405
|
estimator = CatBoostWrapper(**kwargs)
|
|
407
406
|
else:
|
|
408
407
|
try:
|
|
408
|
+
from lightgbm import LGBMClassifier, LGBMRegressor
|
|
409
409
|
if isinstance(estimator, (LGBMClassifier, LGBMRegressor)):
|
|
410
410
|
estimator = LightGBMWrapper(**kwargs)
|
|
411
411
|
else:
|
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
import logging
|
|
2
2
|
from logging import Logger
|
|
3
|
-
from typing import List, Optional
|
|
3
|
+
from typing import Dict, List, Optional
|
|
4
4
|
|
|
5
5
|
import pandas as pd
|
|
6
6
|
from pandas.api.types import is_integer_dtype, is_object_dtype, is_string_dtype
|
|
@@ -22,6 +22,7 @@ class FeaturesValidator:
|
|
|
22
22
|
df: pd.DataFrame,
|
|
23
23
|
features: List[str],
|
|
24
24
|
features_for_generate: Optional[List[str]],
|
|
25
|
+
columns_renaming: Dict[str, str],
|
|
25
26
|
warning_counter: WarningCounter,
|
|
26
27
|
) -> List[str]:
|
|
27
28
|
# one_hot_encoded_features = []
|
|
@@ -63,7 +64,7 @@ class FeaturesValidator:
|
|
|
63
64
|
|
|
64
65
|
high_cardinality_features = self.find_high_cardinality(df[features])
|
|
65
66
|
if features_for_generate:
|
|
66
|
-
high_cardinality_features = [f for f in high_cardinality_features if f not in features_for_generate]
|
|
67
|
+
high_cardinality_features = [f for f in high_cardinality_features if columns_renaming[f] not in features_for_generate]
|
|
67
68
|
if high_cardinality_features:
|
|
68
69
|
msg = bundle.get("high_cardinality_features").format(high_cardinality_features)
|
|
69
70
|
print(msg)
|
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
Metadata-Version: 2.3
|
|
2
2
|
Name: upgini
|
|
3
|
-
Version: 1.2.9a1
|
|
3
|
+
Version: 1.2.9a3
|
|
4
4
|
Summary: Intelligent data search & enrichment for Machine Learning
|
|
5
5
|
Project-URL: Bug Reports, https://github.com/upgini/upgini/issues
|
|
6
6
|
Project-URL: Homepage, https://upgini.com/
|
|
@@ -28,7 +28,6 @@ Requires-Dist: fastparquet>=0.8.1
|
|
|
28
28
|
Requires-Dist: ipywidgets>=8.1.0
|
|
29
29
|
Requires-Dist: jarowinkler>=2.0.0
|
|
30
30
|
Requires-Dist: levenshtein>=0.25.1
|
|
31
|
-
Requires-Dist: lightgbm>=3.3.2
|
|
32
31
|
Requires-Dist: numpy<=1.26.4,>=1.19.0
|
|
33
32
|
Requires-Dist: pandas<3.0.0,>=1.1.0
|
|
34
33
|
Requires-Dist: pydantic<3.0.0,>1.0.0
|
|
@@ -1,13 +1,13 @@
|
|
|
1
|
-
upgini/__about__.py,sha256=
|
|
2
|
-
upgini/__init__.py,sha256=
|
|
1
|
+
upgini/__about__.py,sha256=r3QIbFOSJMAs6ONA-HrOMmqgGlWw7zq9CfF__Tf43EE,24
|
|
2
|
+
upgini/__init__.py,sha256=M64LwQTBa-5Jz24Zm2h8rWwlKQQ1J8nP7gGgIciS0WU,589
|
|
3
3
|
upgini/ads.py,sha256=nvuRxRx5MHDMgPr9SiU-fsqRdFaBv8p4_v1oqiysKpc,2714
|
|
4
4
|
upgini/dataset.py,sha256=olZ-OHSfBNoBSCo7R5t7uCLukI2nO7afpx_A-HCiJLk,31067
|
|
5
5
|
upgini/errors.py,sha256=2b_Wbo0OYhLUbrZqdLIx5jBnAsiD1Mcenh-VjR4HCTw,950
|
|
6
|
-
upgini/features_enricher.py,sha256=
|
|
6
|
+
upgini/features_enricher.py,sha256=cnNZ5e_uyU5f3cHumeeVBI1PZFn3DKcuTNBz0XRCEDU,188144
|
|
7
7
|
upgini/http.py,sha256=21asexflvavydzCOONJDGQBtQanCElrbnqLXakJ9Cu8,42880
|
|
8
8
|
upgini/lazy_import.py,sha256=74gQ8JuA48BGRLxAo7lNHNKY2D2emMxrUxKGdxVGhuY,1012
|
|
9
9
|
upgini/metadata.py,sha256=osmzdNESeh7yP3BZday6N9Q3eaIHfzhhRM1d6NSgcf0,11223
|
|
10
|
-
upgini/metrics.py,sha256=
|
|
10
|
+
upgini/metrics.py,sha256=AYVvcqSqO_UWwFIby0gcqSDNLiIoy6EU3pa8aUBUQ4k,30946
|
|
11
11
|
upgini/search_task.py,sha256=qxUxAD-bed-FpZYmTB_4orW7YJsW_O6a1TcgnZIRFr4,17307
|
|
12
12
|
upgini/spinner.py,sha256=4iMd-eIe_BnkqFEMIliULTbj6rNI2HkN_VJ4qYe0cUc,1118
|
|
13
13
|
upgini/version_validator.py,sha256=ddSKUK_-eGJB3NgrqOMoWJU-OxQ253WsNLp8aqJkaIM,1389
|
|
@@ -47,7 +47,7 @@ upgini/utils/deduplicate_utils.py,sha256=Zvs7zW4QzaERQmJNPrTVf2ZTVBkBLOycFCzyMwt
|
|
|
47
47
|
upgini/utils/display_utils.py,sha256=A2ouB5eiZ-Kyt9ykYxkLQwyoRPrdYeJymwNTiajtFXs,10990
|
|
48
48
|
upgini/utils/email_utils.py,sha256=j0Ug1R_0AnCg1Y92zIZ4XMwvKo3G5_pcOlBN1OH_gZs,5191
|
|
49
49
|
upgini/utils/fallback_progress_bar.py,sha256=PDaKb8dYpVZaWMroNcOHsTc3pSjgi9mOm0--cOFTwJ0,1074
|
|
50
|
-
upgini/utils/features_validator.py,sha256=
|
|
50
|
+
upgini/utils/features_validator.py,sha256=Vu-zQ-QoxDG0tQfkqQy_il9dQDkyiZadKBpr6izKAe0,3373
|
|
51
51
|
upgini/utils/format.py,sha256=Yv5cvvSs2bOLUzzNu96Pu33VMDNbabio92QepUj41jU,243
|
|
52
52
|
upgini/utils/ip_utils.py,sha256=Q6vb7Sr5Khx3Sq3eENjW2qCXKej_S5jZbneH6zEOkzQ,5171
|
|
53
53
|
upgini/utils/phone_utils.py,sha256=IrbztLuOJBiePqqxllfABWfYlfAjYevPhXKipl95wUI,10432
|
|
@@ -57,7 +57,7 @@ upgini/utils/sklearn_ext.py,sha256=13jQS_k7v0aUtudXV6nGUEWjttPQzAW9AFYL5wgEz9k,4
|
|
|
57
57
|
upgini/utils/target_utils.py,sha256=BVtDmrmFMKerSUWaNOIEdzsYHIFiODdpnWbE50QDPDc,7864
|
|
58
58
|
upgini/utils/track_info.py,sha256=G5Lu1xxakg2_TQjKZk4b5SvrHsATTXNVV3NbvWtT8k8,5663
|
|
59
59
|
upgini/utils/warning_counter.py,sha256=dIWBB4dI5XRRJZudvIlqlIYKEiwLLPcXarsZuYRt338,227
|
|
60
|
-
upgini-1.2.
|
|
61
|
-
upgini-1.2.
|
|
62
|
-
upgini-1.2.
|
|
63
|
-
upgini-1.2.
|
|
60
|
+
upgini-1.2.9a3.dist-info/METADATA,sha256=bpMUUAhh6v9AbRs2WD7Ns4PGK2kR61jPm8ITvr8-pwE,48578
|
|
61
|
+
upgini-1.2.9a3.dist-info/WHEEL,sha256=1yFddiXMmvYK7QYTqtRNtX66WJ0Mz8PYEiEUoOUUxRY,87
|
|
62
|
+
upgini-1.2.9a3.dist-info/licenses/LICENSE,sha256=5RRzgvdJUu3BUDfv4bzVU6FqKgwHlIay63pPCSmSgzw,1514
|
|
63
|
+
upgini-1.2.9a3.dist-info/RECORD,,
|
|
File without changes
|
|
File without changes
|