upgini 1.2.9a3__py3-none-any.whl → 1.2.9a99__py3-none-any.whl

This diff shows the contents of publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.

Potentially problematic release.


This version of upgini might be problematic. Click here for more details.

upgini/__about__.py CHANGED
@@ -1 +1 @@
1
- __version__ = "1.2.9a3"
1
+ __version__ = "1.2.9a99"
upgini/features_enricher.py CHANGED
@@ -2531,7 +2531,7 @@ class FeaturesEnricher(TransformerMixin):
2531
2531
  features_columns = [c for c in df.columns if c not in non_feature_columns]
2532
2532
 
2533
2533
  features_to_drop = FeaturesValidator(self.logger).validate(
2534
- df, features_columns, self.generate_features, columns_renaming, self.warning_counter
2534
+ df, features_columns, self.generate_features, self.warning_counter
2535
2535
  )
2536
2536
  self.fit_dropped_features.update(features_to_drop)
2537
2537
  df = df.drop(columns=features_to_drop)
@@ -2657,7 +2657,7 @@ class FeaturesEnricher(TransformerMixin):
2657
2657
  and len(self._search_task.unused_features_for_generation) > 0
2658
2658
  ):
2659
2659
  unused_features_for_generation = [
2660
- columns_renaming.get(col) or col for col in self._search_task.unused_features_for_generation
2660
+ dataset.columns_renaming.get(col) or col for col in self._search_task.unused_features_for_generation
2661
2661
  ]
2662
2662
  msg = self.bundle.get("features_not_generated").format(unused_features_for_generation)
2663
2663
  self.logger.warning(msg)
upgini/metrics.py CHANGED
@@ -10,6 +10,7 @@ import catboost
10
10
  import numpy as np
11
11
  import pandas as pd
12
12
  from catboost import CatBoostClassifier, CatBoostRegressor
13
+ from lightgbm import LGBMClassifier, LGBMRegressor
13
14
  from numpy import log1p
14
15
  from pandas.api.types import is_numeric_dtype
15
16
  from sklearn.metrics import check_scoring, get_scorer, make_scorer, roc_auc_score
@@ -405,7 +406,6 @@ class EstimatorWrapper:
405
406
  estimator = CatBoostWrapper(**kwargs)
406
407
  else:
407
408
  try:
408
- from lightgbm import LGBMClassifier, LGBMRegressor
409
409
  if isinstance(estimator, (LGBMClassifier, LGBMRegressor)):
410
410
  estimator = LightGBMWrapper(**kwargs)
411
411
  else:
@@ -486,7 +486,7 @@ class CatBoostWrapper(EstimatorWrapper):
486
486
 
487
487
  # Find rest categorical features
488
488
  self.cat_features = _get_cat_features(x, self.text_features, embedding_features)
489
- # x = fill_na_cat_features(x, self.cat_features)
489
+ x = fill_na_cat_features(x, self.cat_features) # Was commented
490
490
  unique_cat_features = []
491
491
  for name in self.cat_features:
492
492
  # Remove constant categorical features
@@ -536,7 +536,7 @@ class CatBoostWrapper(EstimatorWrapper):
536
536
  x, emb_columns = self.group_embeddings(x)
537
537
  params["embedding_features"] = emb_columns
538
538
  if self.cat_features:
539
- # x = fill_na_cat_features(x, self.cat_features)
539
+ x = fill_na_cat_features(x, self.cat_features) # Was commented
540
540
  params["cat_features"] = self.cat_features
541
541
 
542
542
  return x, y, params
upgini/utils/features_validator.py CHANGED
@@ -1,6 +1,6 @@
1
1
  import logging
2
2
  from logging import Logger
3
- from typing import Dict, List, Optional
3
+ from typing import List, Optional
4
4
 
5
5
  import pandas as pd
6
6
  from pandas.api.types import is_integer_dtype, is_object_dtype, is_string_dtype
@@ -22,7 +22,6 @@ class FeaturesValidator:
22
22
  df: pd.DataFrame,
23
23
  features: List[str],
24
24
  features_for_generate: Optional[List[str]],
25
- columns_renaming: Dict[str, str],
26
25
  warning_counter: WarningCounter,
27
26
  ) -> List[str]:
28
27
  # one_hot_encoded_features = []
@@ -64,7 +63,7 @@ class FeaturesValidator:
64
63
 
65
64
  high_cardinality_features = self.find_high_cardinality(df[features])
66
65
  if features_for_generate:
67
- high_cardinality_features = [f for f in high_cardinality_features if columns_renaming[f] not in features_for_generate]
66
+ high_cardinality_features = [f for f in high_cardinality_features if f not in features_for_generate]
68
67
  if high_cardinality_features:
69
68
  msg = bundle.get("high_cardinality_features").format(high_cardinality_features)
70
69
  print(msg)
upgini-1.2.9a99.dist-info/METADATA CHANGED
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.3
2
2
  Name: upgini
3
- Version: 1.2.9a3
3
+ Version: 1.2.9a99
4
4
  Summary: Intelligent data search & enrichment for Machine Learning
5
5
  Project-URL: Bug Reports, https://github.com/upgini/upgini/issues
6
6
  Project-URL: Homepage, https://upgini.com/
@@ -28,6 +28,7 @@ Requires-Dist: fastparquet>=0.8.1
28
28
  Requires-Dist: ipywidgets>=8.1.0
29
29
  Requires-Dist: jarowinkler>=2.0.0
30
30
  Requires-Dist: levenshtein>=0.25.1
31
+ Requires-Dist: lightgbm>=3.3.2
31
32
  Requires-Dist: numpy<=1.26.4,>=1.19.0
32
33
  Requires-Dist: pandas<3.0.0,>=1.1.0
33
34
  Requires-Dist: pydantic<3.0.0,>1.0.0
upgini-1.2.9a99.dist-info/RECORD CHANGED
@@ -1,13 +1,13 @@
1
- upgini/__about__.py,sha256=r3QIbFOSJMAs6ONA-HrOMmqgGlWw7zq9CfF__Tf43EE,24
1
+ upgini/__about__.py,sha256=GPfVcGLNLsPn7GOGxyUAePD4tmtosYALOutsKNehkhs,25
2
2
  upgini/__init__.py,sha256=M64LwQTBa-5Jz24Zm2h8rWwlKQQ1J8nP7gGgIciS0WU,589
3
3
  upgini/ads.py,sha256=nvuRxRx5MHDMgPr9SiU-fsqRdFaBv8p4_v1oqiysKpc,2714
4
4
  upgini/dataset.py,sha256=olZ-OHSfBNoBSCo7R5t7uCLukI2nO7afpx_A-HCiJLk,31067
5
5
  upgini/errors.py,sha256=2b_Wbo0OYhLUbrZqdLIx5jBnAsiD1Mcenh-VjR4HCTw,950
6
- upgini/features_enricher.py,sha256=cnNZ5e_uyU5f3cHumeeVBI1PZFn3DKcuTNBz0XRCEDU,188144
6
+ upgini/features_enricher.py,sha256=J5-bn07iaJSXVN8COeu2RbDqZ4NTPd1L27HePaNh52o,188134
7
7
  upgini/http.py,sha256=21asexflvavydzCOONJDGQBtQanCElrbnqLXakJ9Cu8,42880
8
8
  upgini/lazy_import.py,sha256=74gQ8JuA48BGRLxAo7lNHNKY2D2emMxrUxKGdxVGhuY,1012
9
9
  upgini/metadata.py,sha256=osmzdNESeh7yP3BZday6N9Q3eaIHfzhhRM1d6NSgcf0,11223
10
- upgini/metrics.py,sha256=AYVvcqSqO_UWwFIby0gcqSDNLiIoy6EU3pa8aUBUQ4k,30946
10
+ upgini/metrics.py,sha256=d4r20WhuYxsdSwDXU0M0Ny40K3QBuQuckOOvOlat48Y,30956
11
11
  upgini/search_task.py,sha256=qxUxAD-bed-FpZYmTB_4orW7YJsW_O6a1TcgnZIRFr4,17307
12
12
  upgini/spinner.py,sha256=4iMd-eIe_BnkqFEMIliULTbj6rNI2HkN_VJ4qYe0cUc,1118
13
13
  upgini/version_validator.py,sha256=ddSKUK_-eGJB3NgrqOMoWJU-OxQ253WsNLp8aqJkaIM,1389
@@ -47,7 +47,7 @@ upgini/utils/deduplicate_utils.py,sha256=Zvs7zW4QzaERQmJNPrTVf2ZTVBkBLOycFCzyMwt
47
47
  upgini/utils/display_utils.py,sha256=A2ouB5eiZ-Kyt9ykYxkLQwyoRPrdYeJymwNTiajtFXs,10990
48
48
  upgini/utils/email_utils.py,sha256=j0Ug1R_0AnCg1Y92zIZ4XMwvKo3G5_pcOlBN1OH_gZs,5191
49
49
  upgini/utils/fallback_progress_bar.py,sha256=PDaKb8dYpVZaWMroNcOHsTc3pSjgi9mOm0--cOFTwJ0,1074
50
- upgini/utils/features_validator.py,sha256=Vu-zQ-QoxDG0tQfkqQy_il9dQDkyiZadKBpr6izKAe0,3373
50
+ upgini/utils/features_validator.py,sha256=PgKNt5dyqfErTvjtRNNUS9g7GFqHBtAtnsfA-V5UO1A,3307
51
51
  upgini/utils/format.py,sha256=Yv5cvvSs2bOLUzzNu96Pu33VMDNbabio92QepUj41jU,243
52
52
  upgini/utils/ip_utils.py,sha256=Q6vb7Sr5Khx3Sq3eENjW2qCXKej_S5jZbneH6zEOkzQ,5171
53
53
  upgini/utils/phone_utils.py,sha256=IrbztLuOJBiePqqxllfABWfYlfAjYevPhXKipl95wUI,10432
@@ -57,7 +57,7 @@ upgini/utils/sklearn_ext.py,sha256=13jQS_k7v0aUtudXV6nGUEWjttPQzAW9AFYL5wgEz9k,4
57
57
  upgini/utils/target_utils.py,sha256=BVtDmrmFMKerSUWaNOIEdzsYHIFiODdpnWbE50QDPDc,7864
58
58
  upgini/utils/track_info.py,sha256=G5Lu1xxakg2_TQjKZk4b5SvrHsATTXNVV3NbvWtT8k8,5663
59
59
  upgini/utils/warning_counter.py,sha256=dIWBB4dI5XRRJZudvIlqlIYKEiwLLPcXarsZuYRt338,227
60
- upgini-1.2.9a3.dist-info/METADATA,sha256=bpMUUAhh6v9AbRs2WD7Ns4PGK2kR61jPm8ITvr8-pwE,48578
61
- upgini-1.2.9a3.dist-info/WHEEL,sha256=1yFddiXMmvYK7QYTqtRNtX66WJ0Mz8PYEiEUoOUUxRY,87
62
- upgini-1.2.9a3.dist-info/licenses/LICENSE,sha256=5RRzgvdJUu3BUDfv4bzVU6FqKgwHlIay63pPCSmSgzw,1514
63
- upgini-1.2.9a3.dist-info/RECORD,,
60
+ upgini-1.2.9a99.dist-info/METADATA,sha256=YA-Hrmg8rsT_cDBcvN1hRbHHsfYUXtYtbKaGNc40X5M,48610
61
+ upgini-1.2.9a99.dist-info/WHEEL,sha256=1yFddiXMmvYK7QYTqtRNtX66WJ0Mz8PYEiEUoOUUxRY,87
62
+ upgini-1.2.9a99.dist-info/licenses/LICENSE,sha256=5RRzgvdJUu3BUDfv4bzVU6FqKgwHlIay63pPCSmSgzw,1514
63
+ upgini-1.2.9a99.dist-info/RECORD,,