upgini 1.2.9a1__py3-none-any.whl → 1.2.9a3__py3-none-any.whl

This diff shows the changes between publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the package versions as they appear in their respective public registries.

Potentially problematic release.


This version of upgini might be problematic. Click here for more details.

upgini/__about__.py CHANGED
@@ -1 +1 @@
1
- __version__ = "1.2.9a1"
1
+ __version__ = "1.2.9a3"
upgini/__init__.py CHANGED
@@ -1,7 +1,7 @@
1
1
  import os
2
2
 
3
- # from upgini.features_enricher import FeaturesEnricher # noqa: F401
4
- # from upgini.metadata import SearchKey, CVType, RuntimeParameters, ModelTaskType # noqa: F401
3
+ from upgini.features_enricher import FeaturesEnricher # noqa: F401
4
+ from upgini.metadata import SearchKey, CVType, RuntimeParameters, ModelTaskType # noqa: F401
5
5
  # from .lazy_import import LazyImport
6
6
 
7
7
  os.environ["SETUPTOOLS_USE_DISTUTILS"] = "stdlib"
upgini/features_enricher.py CHANGED
@@ -2531,7 +2531,7 @@ class FeaturesEnricher(TransformerMixin):
2531
2531
  features_columns = [c for c in df.columns if c not in non_feature_columns]
2532
2532
 
2533
2533
  features_to_drop = FeaturesValidator(self.logger).validate(
2534
- df, features_columns, self.generate_features, self.warning_counter
2534
+ df, features_columns, self.generate_features, columns_renaming, self.warning_counter
2535
2535
  )
2536
2536
  self.fit_dropped_features.update(features_to_drop)
2537
2537
  df = df.drop(columns=features_to_drop)
@@ -2657,7 +2657,7 @@ class FeaturesEnricher(TransformerMixin):
2657
2657
  and len(self._search_task.unused_features_for_generation) > 0
2658
2658
  ):
2659
2659
  unused_features_for_generation = [
2660
- dataset.columns_renaming.get(col) or col for col in self._search_task.unused_features_for_generation
2660
+ columns_renaming.get(col) or col for col in self._search_task.unused_features_for_generation
2661
2661
  ]
2662
2662
  msg = self.bundle.get("features_not_generated").format(unused_features_for_generation)
2663
2663
  self.logger.warning(msg)
upgini/metrics.py CHANGED
@@ -10,7 +10,6 @@ import catboost
10
10
  import numpy as np
11
11
  import pandas as pd
12
12
  from catboost import CatBoostClassifier, CatBoostRegressor
13
- from lightgbm import LGBMClassifier, LGBMRegressor
14
13
  from numpy import log1p
15
14
  from pandas.api.types import is_numeric_dtype
16
15
  from sklearn.metrics import check_scoring, get_scorer, make_scorer, roc_auc_score
@@ -406,6 +405,7 @@ class EstimatorWrapper:
406
405
  estimator = CatBoostWrapper(**kwargs)
407
406
  else:
408
407
  try:
408
+ from lightgbm import LGBMClassifier, LGBMRegressor
409
409
  if isinstance(estimator, (LGBMClassifier, LGBMRegressor)):
410
410
  estimator = LightGBMWrapper(**kwargs)
411
411
  else:
upgini/utils/features_validator.py CHANGED
@@ -1,6 +1,6 @@
1
1
  import logging
2
2
  from logging import Logger
3
- from typing import List, Optional
3
+ from typing import Dict, List, Optional
4
4
 
5
5
  import pandas as pd
6
6
  from pandas.api.types import is_integer_dtype, is_object_dtype, is_string_dtype
@@ -22,6 +22,7 @@ class FeaturesValidator:
22
22
  df: pd.DataFrame,
23
23
  features: List[str],
24
24
  features_for_generate: Optional[List[str]],
25
+ columns_renaming: Dict[str, str],
25
26
  warning_counter: WarningCounter,
26
27
  ) -> List[str]:
27
28
  # one_hot_encoded_features = []
@@ -63,7 +64,7 @@ class FeaturesValidator:
63
64
 
64
65
  high_cardinality_features = self.find_high_cardinality(df[features])
65
66
  if features_for_generate:
66
- high_cardinality_features = [f for f in high_cardinality_features if f not in features_for_generate]
67
+ high_cardinality_features = [f for f in high_cardinality_features if columns_renaming[f] not in features_for_generate]
67
68
  if high_cardinality_features:
68
69
  msg = bundle.get("high_cardinality_features").format(high_cardinality_features)
69
70
  print(msg)
{upgini-1.2.9a1.dist-info → upgini-1.2.9a3.dist-info}/METADATA CHANGED
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.3
2
2
  Name: upgini
3
- Version: 1.2.9a1
3
+ Version: 1.2.9a3
4
4
  Summary: Intelligent data search & enrichment for Machine Learning
5
5
  Project-URL: Bug Reports, https://github.com/upgini/upgini/issues
6
6
  Project-URL: Homepage, https://upgini.com/
@@ -28,7 +28,6 @@ Requires-Dist: fastparquet>=0.8.1
28
28
  Requires-Dist: ipywidgets>=8.1.0
29
29
  Requires-Dist: jarowinkler>=2.0.0
30
30
  Requires-Dist: levenshtein>=0.25.1
31
- Requires-Dist: lightgbm>=3.3.2
32
31
  Requires-Dist: numpy<=1.26.4,>=1.19.0
33
32
  Requires-Dist: pandas<3.0.0,>=1.1.0
34
33
  Requires-Dist: pydantic<3.0.0,>1.0.0
{upgini-1.2.9a1.dist-info → upgini-1.2.9a3.dist-info}/RECORD CHANGED
@@ -1,13 +1,13 @@
1
- upgini/__about__.py,sha256=7Gzi_eVq3ultTr1051v0KFVS_6MD6QhmeLycn0AEEm4,24
2
- upgini/__init__.py,sha256=3WLf0J2JF5xhTYOKbReBzkRmmvXTl_V7JKZm7b-cpTo,593
1
+ upgini/__about__.py,sha256=r3QIbFOSJMAs6ONA-HrOMmqgGlWw7zq9CfF__Tf43EE,24
2
+ upgini/__init__.py,sha256=M64LwQTBa-5Jz24Zm2h8rWwlKQQ1J8nP7gGgIciS0WU,589
3
3
  upgini/ads.py,sha256=nvuRxRx5MHDMgPr9SiU-fsqRdFaBv8p4_v1oqiysKpc,2714
4
4
  upgini/dataset.py,sha256=olZ-OHSfBNoBSCo7R5t7uCLukI2nO7afpx_A-HCiJLk,31067
5
5
  upgini/errors.py,sha256=2b_Wbo0OYhLUbrZqdLIx5jBnAsiD1Mcenh-VjR4HCTw,950
6
- upgini/features_enricher.py,sha256=J5-bn07iaJSXVN8COeu2RbDqZ4NTPd1L27HePaNh52o,188134
6
+ upgini/features_enricher.py,sha256=cnNZ5e_uyU5f3cHumeeVBI1PZFn3DKcuTNBz0XRCEDU,188144
7
7
  upgini/http.py,sha256=21asexflvavydzCOONJDGQBtQanCElrbnqLXakJ9Cu8,42880
8
8
  upgini/lazy_import.py,sha256=74gQ8JuA48BGRLxAo7lNHNKY2D2emMxrUxKGdxVGhuY,1012
9
9
  upgini/metadata.py,sha256=osmzdNESeh7yP3BZday6N9Q3eaIHfzhhRM1d6NSgcf0,11223
10
- upgini/metrics.py,sha256=Tu5cN8RlhOSSMWUTXRSkdl8SWBqR1N_2eJpBum9pZxc,30926
10
+ upgini/metrics.py,sha256=AYVvcqSqO_UWwFIby0gcqSDNLiIoy6EU3pa8aUBUQ4k,30946
11
11
  upgini/search_task.py,sha256=qxUxAD-bed-FpZYmTB_4orW7YJsW_O6a1TcgnZIRFr4,17307
12
12
  upgini/spinner.py,sha256=4iMd-eIe_BnkqFEMIliULTbj6rNI2HkN_VJ4qYe0cUc,1118
13
13
  upgini/version_validator.py,sha256=ddSKUK_-eGJB3NgrqOMoWJU-OxQ253WsNLp8aqJkaIM,1389
@@ -47,7 +47,7 @@ upgini/utils/deduplicate_utils.py,sha256=Zvs7zW4QzaERQmJNPrTVf2ZTVBkBLOycFCzyMwt
47
47
  upgini/utils/display_utils.py,sha256=A2ouB5eiZ-Kyt9ykYxkLQwyoRPrdYeJymwNTiajtFXs,10990
48
48
  upgini/utils/email_utils.py,sha256=j0Ug1R_0AnCg1Y92zIZ4XMwvKo3G5_pcOlBN1OH_gZs,5191
49
49
  upgini/utils/fallback_progress_bar.py,sha256=PDaKb8dYpVZaWMroNcOHsTc3pSjgi9mOm0--cOFTwJ0,1074
50
- upgini/utils/features_validator.py,sha256=PgKNt5dyqfErTvjtRNNUS9g7GFqHBtAtnsfA-V5UO1A,3307
50
+ upgini/utils/features_validator.py,sha256=Vu-zQ-QoxDG0tQfkqQy_il9dQDkyiZadKBpr6izKAe0,3373
51
51
  upgini/utils/format.py,sha256=Yv5cvvSs2bOLUzzNu96Pu33VMDNbabio92QepUj41jU,243
52
52
  upgini/utils/ip_utils.py,sha256=Q6vb7Sr5Khx3Sq3eENjW2qCXKej_S5jZbneH6zEOkzQ,5171
53
53
  upgini/utils/phone_utils.py,sha256=IrbztLuOJBiePqqxllfABWfYlfAjYevPhXKipl95wUI,10432
@@ -57,7 +57,7 @@ upgini/utils/sklearn_ext.py,sha256=13jQS_k7v0aUtudXV6nGUEWjttPQzAW9AFYL5wgEz9k,4
57
57
  upgini/utils/target_utils.py,sha256=BVtDmrmFMKerSUWaNOIEdzsYHIFiODdpnWbE50QDPDc,7864
58
58
  upgini/utils/track_info.py,sha256=G5Lu1xxakg2_TQjKZk4b5SvrHsATTXNVV3NbvWtT8k8,5663
59
59
  upgini/utils/warning_counter.py,sha256=dIWBB4dI5XRRJZudvIlqlIYKEiwLLPcXarsZuYRt338,227
60
- upgini-1.2.9a1.dist-info/METADATA,sha256=jA10qVCiAGbOFKn0gbV4t9V9a4gPDvVN-P18TsiAGnc,48609
61
- upgini-1.2.9a1.dist-info/WHEEL,sha256=1yFddiXMmvYK7QYTqtRNtX66WJ0Mz8PYEiEUoOUUxRY,87
62
- upgini-1.2.9a1.dist-info/licenses/LICENSE,sha256=5RRzgvdJUu3BUDfv4bzVU6FqKgwHlIay63pPCSmSgzw,1514
63
- upgini-1.2.9a1.dist-info/RECORD,,
60
+ upgini-1.2.9a3.dist-info/METADATA,sha256=bpMUUAhh6v9AbRs2WD7Ns4PGK2kR61jPm8ITvr8-pwE,48578
61
+ upgini-1.2.9a3.dist-info/WHEEL,sha256=1yFddiXMmvYK7QYTqtRNtX66WJ0Mz8PYEiEUoOUUxRY,87
62
+ upgini-1.2.9a3.dist-info/licenses/LICENSE,sha256=5RRzgvdJUu3BUDfv4bzVU6FqKgwHlIay63pPCSmSgzw,1514
63
+ upgini-1.2.9a3.dist-info/RECORD,,