upgini 1.2.129__py3-none-any.whl → 1.2.131__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.


This version of upgini might be problematic. Click here for more details.

upgini/__about__.py CHANGED
@@ -1 +1 @@
1
- __version__ = "1.2.129"
1
+ __version__ = "1.2.131"
@@ -2786,7 +2786,7 @@ if response.status_code == 200:
2786
2786
  df_without_features = df.drop(columns=features_not_to_pass, errors="ignore")
2787
2787
 
2788
2788
  df_without_features, full_duplicates_warning = clean_full_duplicates(
2789
- df_without_features, self.logger, bundle=self.bundle
2789
+ df_without_features, is_transform=True, logger=self.logger, bundle=self.bundle
2790
2790
  )
2791
2791
  if not silent_mode and full_duplicates_warning:
2792
2792
  self.__log_warning(full_duplicates_warning)
@@ -4470,7 +4470,6 @@ if response.status_code == 200:
4470
4470
  is_client_feature = original_name in clients_features_df.columns and not is_generated_feature
4471
4471
 
4472
4472
  if selected_features is not None and feature_meta.name not in selected_features:
4473
- self.logger.info(f"Feature {feature_meta.name} is not selected before and skipped")
4474
4473
  continue
4475
4474
 
4476
4475
  selected_features_meta.append(feature_meta)
@@ -31,7 +31,7 @@ def remove_fintech_duplicates(
31
31
  logger = logging.getLogger()
32
32
  logger.setLevel(logging.FATAL)
33
33
  date_col = _get_column_by_key(search_keys, [SearchKey.DATE, SearchKey.DATETIME])
34
- if define_task(df[TARGET], date_col is not None, silent=True) != ModelTaskType.BINARY:
34
+ if define_task(df[TARGET], date_col is not None, logger=logger, silent=True) != ModelTaskType.BINARY:
35
35
  return df, []
36
36
 
37
37
  if date_col is None:
@@ -160,7 +160,10 @@ def remove_fintech_duplicates(
160
160
 
161
161
 
162
162
  def clean_full_duplicates(
163
- df: pd.DataFrame, logger: Optional[Logger] = None, bundle: Optional[ResourceBundle] = None
163
+ df: pd.DataFrame,
164
+ is_transform: bool = False,
165
+ logger: Optional[Logger] = None,
166
+ bundle: Optional[ResourceBundle] = None,
164
167
  ) -> Tuple[pd.DataFrame, Optional[str]]:
165
168
  if logger is None:
166
169
  logger = logging.getLogger()
@@ -193,7 +196,7 @@ def clean_full_duplicates(
193
196
  logger.warning(bundle.get("dataset_full_duplicates").format(share_full_dedup))
194
197
 
195
198
  msg = None
196
- if TARGET in df.columns:
199
+ if not is_transform and TARGET in df.columns:
197
200
  unique_columns.remove(TARGET)
198
201
 
199
202
  # Separate rows to exclude from deduplication:
@@ -31,6 +31,7 @@ def define_task(
31
31
  ) -> ModelTaskType:
32
32
  if logger is None:
33
33
  logger = logging.getLogger()
34
+ logger.setLevel(logging.FATAL)
34
35
 
35
36
  # Replace inf and -inf with NaN to handle extreme values correctly
36
37
  y = y.replace([np.inf, -np.inf], np.nan, inplace=False)
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.3
2
2
  Name: upgini
3
- Version: 1.2.129
3
+ Version: 1.2.131
4
4
  Summary: Intelligent data search & enrichment for Machine Learning
5
5
  Project-URL: Bug Reports, https://github.com/upgini/upgini/issues
6
6
  Project-URL: Homepage, https://upgini.com/
@@ -1,9 +1,9 @@
1
- upgini/__about__.py,sha256=SttPTxjmglNvCYf-RaBamJR5xyLR_He2hSyQw4Kd6PM,24
1
+ upgini/__about__.py,sha256=-xQ6-PylS50NjUgd2Mk1UC4AWxxnecclkmuHdilo22Q,24
2
2
  upgini/__init__.py,sha256=LXSfTNU0HnlOkE69VCxkgIKDhWP-JFo_eBQ71OxTr5Y,261
3
3
  upgini/ads.py,sha256=nvuRxRx5MHDMgPr9SiU-fsqRdFaBv8p4_v1oqiysKpc,2714
4
4
  upgini/dataset.py,sha256=Nm2ZmwyQqvTnymYpGUwyJWy7y2ebXlHMyYmGeGcyA_s,31652
5
5
  upgini/errors.py,sha256=2b_Wbo0OYhLUbrZqdLIx5jBnAsiD1Mcenh-VjR4HCTw,950
6
- upgini/features_enricher.py,sha256=s3anZTANdnK_3ff-78qYOf89q2q2AoV9_0VAjUaeDTo,234470
6
+ upgini/features_enricher.py,sha256=Tw0LqlOPUWU0lMc3ekfW0qKV9iCyNtHS0dnQFAUNnxg,234396
7
7
  upgini/http.py,sha256=-J_wOpnwVnT0ebPC6sOs6fN3AWtCD0LJLu6nlYmxaqk,44348
8
8
  upgini/metadata.py,sha256=H3wiN37k-yqWZgbPD0tJzx8DzaCIkgmX5cybhByQWLg,12619
9
9
  upgini/metrics.py,sha256=KCPE_apPN-9BIdv6GqASbJVaB_gBcy8wzNApAcyaGo4,46020
@@ -53,7 +53,7 @@ upgini/utils/country_utils.py,sha256=lY-eXWwFVegdVENFttbvLcgGDjFO17Sex8hd2PyJaRk
53
53
  upgini/utils/custom_loss_utils.py,sha256=kieNZYBYZm5ZGBltF1F_jOSF4ea6C29rYuCyiDcqVNY,3857
54
54
  upgini/utils/cv_utils.py,sha256=w6FQb9nO8BWDx88EF83NpjPLarK4eR4ia0Wg0kLBJC4,3525
55
55
  upgini/utils/datetime_utils.py,sha256=l85UzSQLhtMeI2G6m-m8y8bCColCLSXNHb2-G6fKpLM,16988
56
- upgini/utils/deduplicate_utils.py,sha256=6czbn1q0p-lOmrNvbAzueBpDHmfIP4TfV4poWqbjX5w,11255
56
+ upgini/utils/deduplicate_utils.py,sha256=CLX0QapRxB-ZVQT7yGvv1vSd2zac5SwRjCJavujdCps,11332
57
57
  upgini/utils/display_utils.py,sha256=p6o0VlYtGpU6bXv3B-fjQM9PeZEkl05OylHXSRyP0us,13219
58
58
  upgini/utils/email_utils.py,sha256=pZ2vCfNxLIPUhxr0-OlABNXm12jjU44isBk8kGmqQzA,5277
59
59
  upgini/utils/fallback_progress_bar.py,sha256=PDaKb8dYpVZaWMroNcOHsTc3pSjgi9mOm0--cOFTwJ0,1074
@@ -70,11 +70,11 @@ upgini/utils/psi.py,sha256=D_DMMBVkU4nwMospTwdMpYzNFACDxhqTuNesDngPwyY,11068
70
70
  upgini/utils/sample_utils.py,sha256=xpfYaZ2cYP7I2JrcooVc13QNBFawB81cJRuh38451Q4,15123
71
71
  upgini/utils/sklearn_ext.py,sha256=Pcy8sWD6f4YcE5Bu0UmXD4j0ICmXtrT8DJlTArM-_a0,49356
72
72
  upgini/utils/sort.py,sha256=8uuHs2nfSMVnz8GgvbOmgMB1PgEIZP1uhmeRFxcwnYw,7039
73
- upgini/utils/target_utils.py,sha256=GCPn4QeJ83JJ_vyBJ3IhY5fyIRkLC9q9BE59S2FRO1I,10882
73
+ upgini/utils/target_utils.py,sha256=CihpV6SC95HwtlMH60rGAUzVDa4Id0Bva8ySprmNHlE,10921
74
74
  upgini/utils/track_info.py,sha256=NDKeQTUlZaYp15UoP-xLKGoDoJQ0drbDMwB0g9R0PUg,6427
75
75
  upgini/utils/ts_utils.py,sha256=26vhC0pN7vLXK6R09EEkMK3Lwb9IVPH7LRdqFIQ3kPs,1383
76
76
  upgini/utils/warning_counter.py,sha256=-GRY8EUggEBKODPSuXAkHn9KnEQwAORC0mmz_tim-PM,254
77
- upgini-1.2.129.dist-info/METADATA,sha256=2aozj0PmbpF6Q0RnOObDK1ompytVW__7ks95a3TGkYQ,51142
78
- upgini-1.2.129.dist-info/WHEEL,sha256=1yFddiXMmvYK7QYTqtRNtX66WJ0Mz8PYEiEUoOUUxRY,87
79
- upgini-1.2.129.dist-info/licenses/LICENSE,sha256=5RRzgvdJUu3BUDfv4bzVU6FqKgwHlIay63pPCSmSgzw,1514
80
- upgini-1.2.129.dist-info/RECORD,,
77
+ upgini-1.2.131.dist-info/METADATA,sha256=qYItgAJjenacNSv7cAtVxbP1m53zLmFbv6qT-ReasgE,51142
78
+ upgini-1.2.131.dist-info/WHEEL,sha256=1yFddiXMmvYK7QYTqtRNtX66WJ0Mz8PYEiEUoOUUxRY,87
79
+ upgini-1.2.131.dist-info/licenses/LICENSE,sha256=5RRzgvdJUu3BUDfv4bzVU6FqKgwHlIay63pPCSmSgzw,1514
80
+ upgini-1.2.131.dist-info/RECORD,,