upgini 1.2.27__py3-none-any.whl → 1.2.28__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.


This version of upgini might be problematic. Click here for more details.

upgini/__about__.py CHANGED
@@ -1 +1 @@
1
- __version__ = "1.2.27"
1
+ __version__ = "1.2.28"
@@ -2026,7 +2026,10 @@ class FeaturesEnricher(TransformerMixin):
2026
2026
  start_time = time.time()
2027
2027
  with MDC(trace_id=trace_id):
2028
2028
  self.logger.info("Start transform")
2029
- self.__log_debug_information(X, exclude_features_sources=exclude_features_sources)
2029
+
2030
+ validated_X = self._validate_X(X, is_transform=True)
2031
+
2032
+ self.__log_debug_information(validated_X, exclude_features_sources=exclude_features_sources)
2030
2033
 
2031
2034
  self.__validate_search_keys(self.search_keys, self.search_id)
2032
2035
 
@@ -2058,8 +2061,6 @@ class FeaturesEnricher(TransformerMixin):
2058
2061
  self.logger.info(msg)
2059
2062
  print(msg)
2060
2063
 
2061
- validated_X = self._validate_X(X, is_transform=True)
2062
-
2063
2064
  is_demo_dataset = hash_input(validated_X) in DEMO_DATASET_HASHES
2064
2065
 
2065
2066
  columns_to_drop = [c for c in validated_X.columns if c in self.feature_names_]
@@ -2476,9 +2477,9 @@ class FeaturesEnricher(TransformerMixin):
2476
2477
  validate_scoring_argument(scoring)
2477
2478
 
2478
2479
  self.__log_debug_information(
2479
- X,
2480
- y,
2481
- eval_set,
2480
+ validated_X,
2481
+ validated_y,
2482
+ validated_eval_set,
2482
2483
  exclude_features_sources=exclude_features_sources,
2483
2484
  calculate_metrics=calculate_metrics,
2484
2485
  scoring=scoring,
@@ -3762,11 +3763,17 @@ class FeaturesEnricher(TransformerMixin):
3762
3763
  if len(passed_unsupported_search_keys) > 0:
3763
3764
  raise ValidationError(self.bundle.get("unsupported_search_key").format(passed_unsupported_search_keys))
3764
3765
 
3766
+ x_columns = [
3767
+ c
3768
+ for c in x.columns
3769
+ if c not in [TARGET, EVAL_SET_INDEX, SYSTEM_RECORD_ID, ENTITY_SYSTEM_RECORD_ID, SEARCH_KEY_UNNEST]
3770
+ ]
3771
+
3765
3772
  for column_id, meaning_type in search_keys.items():
3766
3773
  column_name = None
3767
3774
  if isinstance(column_id, str):
3768
3775
  if column_id not in x.columns:
3769
- raise ValidationError(self.bundle.get("search_key_not_found").format(column_id, list(x.columns)))
3776
+ raise ValidationError(self.bundle.get("search_key_not_found").format(column_id, x_columns))
3770
3777
  column_name = column_id
3771
3778
  valid_search_keys[column_name] = meaning_type
3772
3779
  elif isinstance(column_id, int):
@@ -201,7 +201,7 @@ email_detected=Emails detected in column `{}`. It will be used as a search key\n
201
201
  email_detected_not_registered=Emails detected in column `{}`. It can be used only with api_key from profile.upgini.com\nSee docs to turn off the automatic detection: https://github.com/upgini/upgini/blob/main/README.md#turn-off-autodetection-for-search-key-columns
202
202
  phone_detected=Phone numbers detected in column `{}`. It can be used only with api_key from profile.upgini.com\nSee docs to turn off the automatic detection: https://github.com/upgini/upgini/blob/main/README.md#turn-off-autodetection-for-search-key-columns
203
203
  phone_detected_not_registered=Phone numbers detected in column `{}`. It can be used only with api_key from profile.upgini.com\nSee docs to turn off the automatic detection: https://github.com/upgini/upgini/blob/main/README.md#turn-off-autodetection-for-search-key-columns
204
- target_type_detected=Detected task type: {}. Reason: {}\nYou can set task type manually with argument `model_task_type` of FeaturesEnricher constructor if task type detected incorrectly\n
204
+ target_type_detected=\nDetected task type: {}. Reason: {}\nYou can set task type manually with argument `model_task_type` of FeaturesEnricher constructor if task type detected incorrectly\n
205
205
  binary_target_reason=only two unique label-values observed
206
206
  non_numeric_multiclass_reason=non-numeric label values observed
207
207
  few_unique_label_multiclass_reason=few unique label-values observed and can be considered as categorical
@@ -212,7 +212,7 @@ limited_int_multiclass_reason=integer-like values with limited unique values obs
212
212
  all_ok_community_invite=❓ Support request
213
213
  too_small_for_metrics=Your train dataset or one of eval datasets contains less than 500 rows. For such dataset Upgini will not calculate accuracy metrics. Please increase the number of rows in the training dataset to calculate accuracy metrics
214
214
  imbalance_multiclass=Class {0} is on 25% quantile of classes distribution ({1} records in train dataset). \nDownsample classes with records more than {1}.
215
- imbalanced_target=Target is imbalanced and will be undersampled. Frequency of the rarest class `{}` is {}
215
+ imbalanced_target=\nTarget is imbalanced and will be undersampled. Frequency of the rarest class `{}` is {}
216
216
  loss_selection_info=Using loss `{}` for feature selection
217
217
  loss_calc_metrics_info=Using loss `{}` for metrics calculation with default estimator
218
218
 
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.3
2
2
  Name: upgini
3
- Version: 1.2.27
3
+ Version: 1.2.28
4
4
  Summary: Intelligent data search & enrichment for Machine Learning
5
5
  Project-URL: Bug Reports, https://github.com/upgini/upgini/issues
6
6
  Project-URL: Homepage, https://upgini.com/
@@ -1,9 +1,9 @@
1
- upgini/__about__.py,sha256=JKArgvnX6ljUI_WxYnXTejXGdjsA4KJ3Cy2xBcK4vh4,23
1
+ upgini/__about__.py,sha256=sZoYrdh97RjbwC1rg-3mt6kqvjxTxWL7ejhDDrG6mVM,23
2
2
  upgini/__init__.py,sha256=LXSfTNU0HnlOkE69VCxkgIKDhWP-JFo_eBQ71OxTr5Y,261
3
3
  upgini/ads.py,sha256=nvuRxRx5MHDMgPr9SiU-fsqRdFaBv8p4_v1oqiysKpc,2714
4
4
  upgini/dataset.py,sha256=iPFiMJtk4HF1ytw9wCQr8H9RfoOKj_TIo8XYZKWgcMc,31331
5
5
  upgini/errors.py,sha256=2b_Wbo0OYhLUbrZqdLIx5jBnAsiD1Mcenh-VjR4HCTw,950
6
- upgini/features_enricher.py,sha256=7xYxcLvxQgDX7vE2gWEbBPceAVeEgBVpu9xtBJvXpoQ,194078
6
+ upgini/features_enricher.py,sha256=YYboYw--vCH9VerkTnCF3njztU3fVLrhlhU3NfBVJYQ,194302
7
7
  upgini/http.py,sha256=21asexflvavydzCOONJDGQBtQanCElrbnqLXakJ9Cu8,42880
8
8
  upgini/lazy_import.py,sha256=74gQ8JuA48BGRLxAo7lNHNKY2D2emMxrUxKGdxVGhuY,1012
9
9
  upgini/metadata.py,sha256=osmzdNESeh7yP3BZday6N9Q3eaIHfzhhRM1d6NSgcf0,11223
@@ -30,7 +30,7 @@ upgini/normalizer/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU
30
30
  upgini/normalizer/normalize_utils.py,sha256=Ft2MwSgVoBilXAORAOYAuwPD79GOLfwn4qQE3IUFzzg,7218
31
31
  upgini/resource_bundle/__init__.py,sha256=S5F2G47pnJd2LDpmFsjDqEwiKkP8Hm-hcseDbMka6Ko,8345
32
32
  upgini/resource_bundle/exceptions.py,sha256=5fRvx0_vWdE1-7HcSgF0tckB4A9AKyf5RiinZkInTsI,621
33
- upgini/resource_bundle/strings.properties,sha256=l3yg9H17NwCwvfZQyOYTvXbPP6mwdXH_CGlqyxOQVFY,26669
33
+ upgini/resource_bundle/strings.properties,sha256=wn98wl2DNFPaGTMSdZAVr43P6t97i74PCqqwa762-V0,26673
34
34
  upgini/resource_bundle/strings_widget.properties,sha256=gOdqvZWntP2LCza_tyVk1_yRYcG4c04K9sQOAVhF_gw,1577
35
35
  upgini/sampler/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
36
36
  upgini/sampler/base.py,sha256=7GpjYqjOp58vYcJLiX__1R5wjUlyQbxvHJ2klFnup_M,6389
@@ -58,7 +58,7 @@ upgini/utils/sklearn_ext.py,sha256=13jQS_k7v0aUtudXV6nGUEWjttPQzAW9AFYL5wgEz9k,4
58
58
  upgini/utils/target_utils.py,sha256=PU77nIhTz7IHbC4rpTpxrVxib6cdpRL9F1dhkjIffLY,10225
59
59
  upgini/utils/track_info.py,sha256=G5Lu1xxakg2_TQjKZk4b5SvrHsATTXNVV3NbvWtT8k8,5663
60
60
  upgini/utils/warning_counter.py,sha256=-GRY8EUggEBKODPSuXAkHn9KnEQwAORC0mmz_tim-PM,254
61
- upgini-1.2.27.dist-info/METADATA,sha256=iSB1iB7EwBugIUf8DYOz9mEFqGewDAS49-hgYuhtrtU,48578
62
- upgini-1.2.27.dist-info/WHEEL,sha256=1yFddiXMmvYK7QYTqtRNtX66WJ0Mz8PYEiEUoOUUxRY,87
63
- upgini-1.2.27.dist-info/licenses/LICENSE,sha256=5RRzgvdJUu3BUDfv4bzVU6FqKgwHlIay63pPCSmSgzw,1514
64
- upgini-1.2.27.dist-info/RECORD,,
61
+ upgini-1.2.28.dist-info/METADATA,sha256=qGINKPrh43Q1LFXWRlS1v6CSpME6rOmScAy0ShKxL_0,48578
62
+ upgini-1.2.28.dist-info/WHEEL,sha256=1yFddiXMmvYK7QYTqtRNtX66WJ0Mz8PYEiEUoOUUxRY,87
63
+ upgini-1.2.28.dist-info/licenses/LICENSE,sha256=5RRzgvdJUu3BUDfv4bzVU6FqKgwHlIay63pPCSmSgzw,1514
64
+ upgini-1.2.28.dist-info/RECORD,,