upgini 1.2.129__tar.gz → 1.2.131__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.


This version of upgini might be problematic. Click here for more details.

Files changed (82)
  1. {upgini-1.2.129 → upgini-1.2.131}/PKG-INFO +1 -1
  2. upgini-1.2.131/src/upgini/__about__.py +1 -0
  3. {upgini-1.2.129 → upgini-1.2.131}/src/upgini/features_enricher.py +1 -2
  4. {upgini-1.2.129 → upgini-1.2.131}/src/upgini/utils/deduplicate_utils.py +6 -3
  5. {upgini-1.2.129 → upgini-1.2.131}/src/upgini/utils/target_utils.py +1 -0
  6. upgini-1.2.129/src/upgini/__about__.py +0 -1
  7. {upgini-1.2.129 → upgini-1.2.131}/.gitignore +0 -0
  8. {upgini-1.2.129 → upgini-1.2.131}/LICENSE +0 -0
  9. {upgini-1.2.129 → upgini-1.2.131}/README.md +0 -0
  10. {upgini-1.2.129 → upgini-1.2.131}/pyproject.toml +0 -0
  11. {upgini-1.2.129 → upgini-1.2.131}/src/upgini/__init__.py +0 -0
  12. {upgini-1.2.129 → upgini-1.2.131}/src/upgini/ads.py +0 -0
  13. {upgini-1.2.129 → upgini-1.2.131}/src/upgini/ads_management/__init__.py +0 -0
  14. {upgini-1.2.129 → upgini-1.2.131}/src/upgini/ads_management/ads_manager.py +0 -0
  15. {upgini-1.2.129 → upgini-1.2.131}/src/upgini/autofe/__init__.py +0 -0
  16. {upgini-1.2.129 → upgini-1.2.131}/src/upgini/autofe/all_operators.py +0 -0
  17. {upgini-1.2.129 → upgini-1.2.131}/src/upgini/autofe/binary.py +0 -0
  18. {upgini-1.2.129 → upgini-1.2.131}/src/upgini/autofe/date.py +0 -0
  19. {upgini-1.2.129 → upgini-1.2.131}/src/upgini/autofe/feature.py +0 -0
  20. {upgini-1.2.129 → upgini-1.2.131}/src/upgini/autofe/groupby.py +0 -0
  21. {upgini-1.2.129 → upgini-1.2.131}/src/upgini/autofe/operator.py +0 -0
  22. {upgini-1.2.129 → upgini-1.2.131}/src/upgini/autofe/timeseries/__init__.py +0 -0
  23. {upgini-1.2.129 → upgini-1.2.131}/src/upgini/autofe/timeseries/base.py +0 -0
  24. {upgini-1.2.129 → upgini-1.2.131}/src/upgini/autofe/timeseries/cross.py +0 -0
  25. {upgini-1.2.129 → upgini-1.2.131}/src/upgini/autofe/timeseries/delta.py +0 -0
  26. {upgini-1.2.129 → upgini-1.2.131}/src/upgini/autofe/timeseries/lag.py +0 -0
  27. {upgini-1.2.129 → upgini-1.2.131}/src/upgini/autofe/timeseries/roll.py +0 -0
  28. {upgini-1.2.129 → upgini-1.2.131}/src/upgini/autofe/timeseries/trend.py +0 -0
  29. {upgini-1.2.129 → upgini-1.2.131}/src/upgini/autofe/timeseries/volatility.py +0 -0
  30. {upgini-1.2.129 → upgini-1.2.131}/src/upgini/autofe/unary.py +0 -0
  31. {upgini-1.2.129 → upgini-1.2.131}/src/upgini/autofe/utils.py +0 -0
  32. {upgini-1.2.129 → upgini-1.2.131}/src/upgini/autofe/vector.py +0 -0
  33. {upgini-1.2.129 → upgini-1.2.131}/src/upgini/data_source/__init__.py +0 -0
  34. {upgini-1.2.129 → upgini-1.2.131}/src/upgini/data_source/data_source_publisher.py +0 -0
  35. {upgini-1.2.129 → upgini-1.2.131}/src/upgini/dataset.py +0 -0
  36. {upgini-1.2.129 → upgini-1.2.131}/src/upgini/errors.py +0 -0
  37. {upgini-1.2.129 → upgini-1.2.131}/src/upgini/http.py +0 -0
  38. {upgini-1.2.129 → upgini-1.2.131}/src/upgini/mdc/__init__.py +0 -0
  39. {upgini-1.2.129 → upgini-1.2.131}/src/upgini/mdc/context.py +0 -0
  40. {upgini-1.2.129 → upgini-1.2.131}/src/upgini/metadata.py +0 -0
  41. {upgini-1.2.129 → upgini-1.2.131}/src/upgini/metrics.py +0 -0
  42. {upgini-1.2.129 → upgini-1.2.131}/src/upgini/normalizer/__init__.py +0 -0
  43. {upgini-1.2.129 → upgini-1.2.131}/src/upgini/normalizer/normalize_utils.py +0 -0
  44. {upgini-1.2.129 → upgini-1.2.131}/src/upgini/resource_bundle/__init__.py +0 -0
  45. {upgini-1.2.129 → upgini-1.2.131}/src/upgini/resource_bundle/exceptions.py +0 -0
  46. {upgini-1.2.129 → upgini-1.2.131}/src/upgini/resource_bundle/strings.properties +0 -0
  47. {upgini-1.2.129 → upgini-1.2.131}/src/upgini/resource_bundle/strings_widget.properties +0 -0
  48. {upgini-1.2.129 → upgini-1.2.131}/src/upgini/sampler/__init__.py +0 -0
  49. {upgini-1.2.129 → upgini-1.2.131}/src/upgini/sampler/base.py +0 -0
  50. {upgini-1.2.129 → upgini-1.2.131}/src/upgini/sampler/random_under_sampler.py +0 -0
  51. {upgini-1.2.129 → upgini-1.2.131}/src/upgini/sampler/utils.py +0 -0
  52. {upgini-1.2.129 → upgini-1.2.131}/src/upgini/search_task.py +0 -0
  53. {upgini-1.2.129 → upgini-1.2.131}/src/upgini/spinner.py +0 -0
  54. {upgini-1.2.129 → upgini-1.2.131}/src/upgini/utils/Roboto-Regular.ttf +0 -0
  55. {upgini-1.2.129 → upgini-1.2.131}/src/upgini/utils/__init__.py +0 -0
  56. {upgini-1.2.129 → upgini-1.2.131}/src/upgini/utils/base_search_key_detector.py +0 -0
  57. {upgini-1.2.129 → upgini-1.2.131}/src/upgini/utils/blocked_time_series.py +0 -0
  58. {upgini-1.2.129 → upgini-1.2.131}/src/upgini/utils/config.py +0 -0
  59. {upgini-1.2.129 → upgini-1.2.131}/src/upgini/utils/country_utils.py +0 -0
  60. {upgini-1.2.129 → upgini-1.2.131}/src/upgini/utils/custom_loss_utils.py +0 -0
  61. {upgini-1.2.129 → upgini-1.2.131}/src/upgini/utils/cv_utils.py +0 -0
  62. {upgini-1.2.129 → upgini-1.2.131}/src/upgini/utils/datetime_utils.py +0 -0
  63. {upgini-1.2.129 → upgini-1.2.131}/src/upgini/utils/display_utils.py +0 -0
  64. {upgini-1.2.129 → upgini-1.2.131}/src/upgini/utils/email_utils.py +0 -0
  65. {upgini-1.2.129 → upgini-1.2.131}/src/upgini/utils/fallback_progress_bar.py +0 -0
  66. {upgini-1.2.129 → upgini-1.2.131}/src/upgini/utils/feature_info.py +0 -0
  67. {upgini-1.2.129 → upgini-1.2.131}/src/upgini/utils/features_validator.py +0 -0
  68. {upgini-1.2.129 → upgini-1.2.131}/src/upgini/utils/format.py +0 -0
  69. {upgini-1.2.129 → upgini-1.2.131}/src/upgini/utils/hash_utils.py +0 -0
  70. {upgini-1.2.129 → upgini-1.2.131}/src/upgini/utils/ip_utils.py +0 -0
  71. {upgini-1.2.129 → upgini-1.2.131}/src/upgini/utils/mstats.py +0 -0
  72. {upgini-1.2.129 → upgini-1.2.131}/src/upgini/utils/phone_utils.py +0 -0
  73. {upgini-1.2.129 → upgini-1.2.131}/src/upgini/utils/postal_code_utils.py +0 -0
  74. {upgini-1.2.129 → upgini-1.2.131}/src/upgini/utils/progress_bar.py +0 -0
  75. {upgini-1.2.129 → upgini-1.2.131}/src/upgini/utils/psi.py +0 -0
  76. {upgini-1.2.129 → upgini-1.2.131}/src/upgini/utils/sample_utils.py +0 -0
  77. {upgini-1.2.129 → upgini-1.2.131}/src/upgini/utils/sklearn_ext.py +0 -0
  78. {upgini-1.2.129 → upgini-1.2.131}/src/upgini/utils/sort.py +0 -0
  79. {upgini-1.2.129 → upgini-1.2.131}/src/upgini/utils/track_info.py +0 -0
  80. {upgini-1.2.129 → upgini-1.2.131}/src/upgini/utils/ts_utils.py +0 -0
  81. {upgini-1.2.129 → upgini-1.2.131}/src/upgini/utils/warning_counter.py +0 -0
  82. {upgini-1.2.129 → upgini-1.2.131}/src/upgini/version_validator.py +0 -0
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.3
2
2
  Name: upgini
3
- Version: 1.2.129
3
+ Version: 1.2.131
4
4
  Summary: Intelligent data search & enrichment for Machine Learning
5
5
  Project-URL: Bug Reports, https://github.com/upgini/upgini/issues
6
6
  Project-URL: Homepage, https://upgini.com/
@@ -0,0 +1 @@
1
+ __version__ = "1.2.131"
@@ -2786,7 +2786,7 @@ if response.status_code == 200:
2786
2786
  df_without_features = df.drop(columns=features_not_to_pass, errors="ignore")
2787
2787
 
2788
2788
  df_without_features, full_duplicates_warning = clean_full_duplicates(
2789
- df_without_features, self.logger, bundle=self.bundle
2789
+ df_without_features, is_transform=True, logger=self.logger, bundle=self.bundle
2790
2790
  )
2791
2791
  if not silent_mode and full_duplicates_warning:
2792
2792
  self.__log_warning(full_duplicates_warning)
@@ -4470,7 +4470,6 @@ if response.status_code == 200:
4470
4470
  is_client_feature = original_name in clients_features_df.columns and not is_generated_feature
4471
4471
 
4472
4472
  if selected_features is not None and feature_meta.name not in selected_features:
4473
- self.logger.info(f"Feature {feature_meta.name} is not selected before and skipped")
4474
4473
  continue
4475
4474
 
4476
4475
  selected_features_meta.append(feature_meta)
@@ -31,7 +31,7 @@ def remove_fintech_duplicates(
31
31
  logger = logging.getLogger()
32
32
  logger.setLevel(logging.FATAL)
33
33
  date_col = _get_column_by_key(search_keys, [SearchKey.DATE, SearchKey.DATETIME])
34
- if define_task(df[TARGET], date_col is not None, silent=True) != ModelTaskType.BINARY:
34
+ if define_task(df[TARGET], date_col is not None, logger=logger, silent=True) != ModelTaskType.BINARY:
35
35
  return df, []
36
36
 
37
37
  if date_col is None:
@@ -160,7 +160,10 @@ def remove_fintech_duplicates(
160
160
 
161
161
 
162
162
  def clean_full_duplicates(
163
- df: pd.DataFrame, logger: Optional[Logger] = None, bundle: Optional[ResourceBundle] = None
163
+ df: pd.DataFrame,
164
+ is_transform: bool = False,
165
+ logger: Optional[Logger] = None,
166
+ bundle: Optional[ResourceBundle] = None,
164
167
  ) -> Tuple[pd.DataFrame, Optional[str]]:
165
168
  if logger is None:
166
169
  logger = logging.getLogger()
@@ -193,7 +196,7 @@ def clean_full_duplicates(
193
196
  logger.warning(bundle.get("dataset_full_duplicates").format(share_full_dedup))
194
197
 
195
198
  msg = None
196
- if TARGET in df.columns:
199
+ if not is_transform and TARGET in df.columns:
197
200
  unique_columns.remove(TARGET)
198
201
 
199
202
  # Separate rows to exclude from deduplication:
@@ -31,6 +31,7 @@ def define_task(
31
31
  ) -> ModelTaskType:
32
32
  if logger is None:
33
33
  logger = logging.getLogger()
34
+ logger.setLevel(logging.FATAL)
34
35
 
35
36
  # Replace inf and -inf with NaN to handle extreme values correctly
36
37
  y = y.replace([np.inf, -np.inf], np.nan, inplace=False)
@@ -1 +0,0 @@
1
- __version__ = "1.2.129"
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes