upgini 1.2.9a102__tar.gz → 1.2.9a103__tar.gz

This diff shows the contents of publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.

Potentially problematic release.


This version of upgini might be problematic. Click here for more details.

Files changed (65)
  1. {upgini-1.2.9a102 → upgini-1.2.9a103}/PKG-INFO +1 -1
  2. upgini-1.2.9a103/src/upgini/__about__.py +1 -0
  3. {upgini-1.2.9a102 → upgini-1.2.9a103}/src/upgini/features_enricher.py +10 -20
  4. upgini-1.2.9a102/src/upgini/__about__.py +0 -1
  5. {upgini-1.2.9a102 → upgini-1.2.9a103}/.gitignore +0 -0
  6. {upgini-1.2.9a102 → upgini-1.2.9a103}/LICENSE +0 -0
  7. {upgini-1.2.9a102 → upgini-1.2.9a103}/README.md +0 -0
  8. {upgini-1.2.9a102 → upgini-1.2.9a103}/pyproject.toml +0 -0
  9. {upgini-1.2.9a102 → upgini-1.2.9a103}/src/upgini/__init__.py +0 -0
  10. {upgini-1.2.9a102 → upgini-1.2.9a103}/src/upgini/ads.py +0 -0
  11. {upgini-1.2.9a102 → upgini-1.2.9a103}/src/upgini/ads_management/__init__.py +0 -0
  12. {upgini-1.2.9a102 → upgini-1.2.9a103}/src/upgini/ads_management/ads_manager.py +0 -0
  13. {upgini-1.2.9a102 → upgini-1.2.9a103}/src/upgini/autofe/__init__.py +0 -0
  14. {upgini-1.2.9a102 → upgini-1.2.9a103}/src/upgini/autofe/all_operands.py +0 -0
  15. {upgini-1.2.9a102 → upgini-1.2.9a103}/src/upgini/autofe/binary.py +0 -0
  16. {upgini-1.2.9a102 → upgini-1.2.9a103}/src/upgini/autofe/date.py +0 -0
  17. {upgini-1.2.9a102 → upgini-1.2.9a103}/src/upgini/autofe/feature.py +0 -0
  18. {upgini-1.2.9a102 → upgini-1.2.9a103}/src/upgini/autofe/groupby.py +0 -0
  19. {upgini-1.2.9a102 → upgini-1.2.9a103}/src/upgini/autofe/operand.py +0 -0
  20. {upgini-1.2.9a102 → upgini-1.2.9a103}/src/upgini/autofe/unary.py +0 -0
  21. {upgini-1.2.9a102 → upgini-1.2.9a103}/src/upgini/autofe/vector.py +0 -0
  22. {upgini-1.2.9a102 → upgini-1.2.9a103}/src/upgini/data_source/__init__.py +0 -0
  23. {upgini-1.2.9a102 → upgini-1.2.9a103}/src/upgini/data_source/data_source_publisher.py +0 -0
  24. {upgini-1.2.9a102 → upgini-1.2.9a103}/src/upgini/dataset.py +0 -0
  25. {upgini-1.2.9a102 → upgini-1.2.9a103}/src/upgini/errors.py +0 -0
  26. {upgini-1.2.9a102 → upgini-1.2.9a103}/src/upgini/http.py +0 -0
  27. {upgini-1.2.9a102 → upgini-1.2.9a103}/src/upgini/lazy_import.py +0 -0
  28. {upgini-1.2.9a102 → upgini-1.2.9a103}/src/upgini/mdc/__init__.py +0 -0
  29. {upgini-1.2.9a102 → upgini-1.2.9a103}/src/upgini/mdc/context.py +0 -0
  30. {upgini-1.2.9a102 → upgini-1.2.9a103}/src/upgini/metadata.py +0 -0
  31. {upgini-1.2.9a102 → upgini-1.2.9a103}/src/upgini/metrics.py +0 -0
  32. {upgini-1.2.9a102 → upgini-1.2.9a103}/src/upgini/normalizer/__init__.py +0 -0
  33. {upgini-1.2.9a102 → upgini-1.2.9a103}/src/upgini/normalizer/normalize_utils.py +0 -0
  34. {upgini-1.2.9a102 → upgini-1.2.9a103}/src/upgini/resource_bundle/__init__.py +0 -0
  35. {upgini-1.2.9a102 → upgini-1.2.9a103}/src/upgini/resource_bundle/exceptions.py +0 -0
  36. {upgini-1.2.9a102 → upgini-1.2.9a103}/src/upgini/resource_bundle/strings.properties +0 -0
  37. {upgini-1.2.9a102 → upgini-1.2.9a103}/src/upgini/resource_bundle/strings_widget.properties +0 -0
  38. {upgini-1.2.9a102 → upgini-1.2.9a103}/src/upgini/sampler/__init__.py +0 -0
  39. {upgini-1.2.9a102 → upgini-1.2.9a103}/src/upgini/sampler/base.py +0 -0
  40. {upgini-1.2.9a102 → upgini-1.2.9a103}/src/upgini/sampler/random_under_sampler.py +0 -0
  41. {upgini-1.2.9a102 → upgini-1.2.9a103}/src/upgini/sampler/utils.py +0 -0
  42. {upgini-1.2.9a102 → upgini-1.2.9a103}/src/upgini/search_task.py +0 -0
  43. {upgini-1.2.9a102 → upgini-1.2.9a103}/src/upgini/spinner.py +0 -0
  44. {upgini-1.2.9a102 → upgini-1.2.9a103}/src/upgini/utils/__init__.py +0 -0
  45. {upgini-1.2.9a102 → upgini-1.2.9a103}/src/upgini/utils/base_search_key_detector.py +0 -0
  46. {upgini-1.2.9a102 → upgini-1.2.9a103}/src/upgini/utils/blocked_time_series.py +0 -0
  47. {upgini-1.2.9a102 → upgini-1.2.9a103}/src/upgini/utils/country_utils.py +0 -0
  48. {upgini-1.2.9a102 → upgini-1.2.9a103}/src/upgini/utils/custom_loss_utils.py +0 -0
  49. {upgini-1.2.9a102 → upgini-1.2.9a103}/src/upgini/utils/cv_utils.py +0 -0
  50. {upgini-1.2.9a102 → upgini-1.2.9a103}/src/upgini/utils/datetime_utils.py +0 -0
  51. {upgini-1.2.9a102 → upgini-1.2.9a103}/src/upgini/utils/deduplicate_utils.py +0 -0
  52. {upgini-1.2.9a102 → upgini-1.2.9a103}/src/upgini/utils/display_utils.py +0 -0
  53. {upgini-1.2.9a102 → upgini-1.2.9a103}/src/upgini/utils/email_utils.py +0 -0
  54. {upgini-1.2.9a102 → upgini-1.2.9a103}/src/upgini/utils/fallback_progress_bar.py +0 -0
  55. {upgini-1.2.9a102 → upgini-1.2.9a103}/src/upgini/utils/features_validator.py +0 -0
  56. {upgini-1.2.9a102 → upgini-1.2.9a103}/src/upgini/utils/format.py +0 -0
  57. {upgini-1.2.9a102 → upgini-1.2.9a103}/src/upgini/utils/ip_utils.py +0 -0
  58. {upgini-1.2.9a102 → upgini-1.2.9a103}/src/upgini/utils/phone_utils.py +0 -0
  59. {upgini-1.2.9a102 → upgini-1.2.9a103}/src/upgini/utils/postal_code_utils.py +0 -0
  60. {upgini-1.2.9a102 → upgini-1.2.9a103}/src/upgini/utils/progress_bar.py +0 -0
  61. {upgini-1.2.9a102 → upgini-1.2.9a103}/src/upgini/utils/sklearn_ext.py +0 -0
  62. {upgini-1.2.9a102 → upgini-1.2.9a103}/src/upgini/utils/target_utils.py +0 -0
  63. {upgini-1.2.9a102 → upgini-1.2.9a103}/src/upgini/utils/track_info.py +0 -0
  64. {upgini-1.2.9a102 → upgini-1.2.9a103}/src/upgini/utils/warning_counter.py +0 -0
  65. {upgini-1.2.9a102 → upgini-1.2.9a103}/src/upgini/version_validator.py +0 -0
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.3
2
2
  Name: upgini
3
- Version: 1.2.9a102
3
+ Version: 1.2.9a103
4
4
  Summary: Intelligent data search & enrichment for Machine Learning
5
5
  Project-URL: Bug Reports, https://github.com/upgini/upgini/issues
6
6
  Project-URL: Homepage, https://upgini.com/
@@ -0,0 +1 @@
1
+ __version__ = "1.2.9a103"
@@ -1369,6 +1369,7 @@ class FeaturesEnricher(TransformerMixin):
1369
1369
  + [DateTimeSearchKeyConverter.DATETIME_COL, SYSTEM_RECORD_ID, ENTITY_SYSTEM_RECORD_ID]
1370
1370
  )
1371
1371
  ]
1372
+ self.logger.info(f"Client features column on prepare data for metrics: {client_features}")
1372
1373
 
1373
1374
  filtered_enriched_features = self.__filtered_enriched_features(
1374
1375
  importance_threshold,
@@ -1435,31 +1436,19 @@ class FeaturesEnricher(TransformerMixin):
1435
1436
  )
1436
1437
 
1437
1438
  fitting_eval_set_dict = {}
1439
+ fitting_x_columns = fitting_X.columns.to_list()
1440
+ self.logger.info(f"Final list of fitting X columns: {fitting_x_columns}")
1441
+ fitting_enriched_x_columns = fitting_enriched_X.columns.to_list()
1442
+ self.logger.info(f"Final list of fitting enriched X columns: {fitting_enriched_x_columns}")
1438
1443
  for idx, eval_tuple in eval_set_sampled_dict.items():
1439
1444
  eval_X_sampled, enriched_eval_X, eval_y_sampled = eval_tuple
1440
1445
  eval_X_sorted, eval_y_sorted = self._sort_by_system_record_id(eval_X_sampled, eval_y_sampled, self.cv)
1441
1446
  enriched_eval_X_sorted, enriched_eval_y_sorted = self._sort_by_system_record_id(
1442
1447
  enriched_eval_X, eval_y_sampled, self.cv
1443
1448
  )
1444
- fitting_eval_X = eval_X_sorted[client_features].copy()
1445
- fitting_enriched_eval_X = enriched_eval_X_sorted[
1446
- client_features + existing_filtered_enriched_features
1447
- ].copy()
1448
-
1449
- # # Drop high cardinality features in eval set
1450
- if len(columns_with_high_cardinality) > 0:
1451
- fitting_eval_X = fitting_eval_X.drop(columns=columns_with_high_cardinality, errors="ignore")
1452
- fitting_enriched_eval_X = fitting_enriched_eval_X.drop(
1453
- columns=columns_with_high_cardinality, errors="ignore"
1454
- )
1455
- # Drop constant features in eval_set
1456
- if len(constant_columns) > 0:
1457
- fitting_eval_X = fitting_eval_X.drop(columns=constant_columns, errors="ignore")
1458
- fitting_enriched_eval_X = fitting_enriched_eval_X.drop(columns=constant_columns, errors="ignore")
1459
- # Drop datetime features in eval_set
1460
- if len(datetime_features) > 0:
1461
- fitting_eval_X = fitting_eval_X.drop(columns=datetime_features, errors="ignore")
1462
- fitting_enriched_eval_X = fitting_enriched_eval_X.drop(columns=datetime_features, errors="ignore")
1449
+ fitting_eval_X = eval_X_sorted[fitting_x_columns].copy()
1450
+ fitting_enriched_eval_X = enriched_eval_X_sorted[fitting_enriched_x_columns].copy()
1451
+
1463
1452
  # Convert bool to string in eval_set
1464
1453
  if len(bool_columns) > 0:
1465
1454
  fitting_eval_X[col] = fitting_eval_X[col].astype(str)
@@ -1680,6 +1669,7 @@ class FeaturesEnricher(TransformerMixin):
1680
1669
  X_sampled = enriched_Xy[x_columns].copy()
1681
1670
  y_sampled = enriched_Xy[TARGET].copy()
1682
1671
  enriched_X = enriched_Xy.drop(columns=[TARGET, EVAL_SET_INDEX], errors="ignore")
1672
+ enriched_X_columns = enriched_X.columns.to_list()
1683
1673
 
1684
1674
  self.logger.info(f"Shape of enriched_X: {enriched_X.shape}")
1685
1675
  self.logger.info(f"Shape of X after sampling: {X_sampled.shape}")
@@ -1694,7 +1684,7 @@ class FeaturesEnricher(TransformerMixin):
1694
1684
  for idx in range(len(eval_set)):
1695
1685
  eval_X_sampled = enriched_eval_sets[idx + 1][x_columns].copy()
1696
1686
  eval_y_sampled = enriched_eval_sets[idx + 1][TARGET].copy()
1697
- enriched_eval_X = enriched_eval_sets[idx + 1].drop(columns=[TARGET, EVAL_SET_INDEX])
1687
+ enriched_eval_X = enriched_eval_sets[idx + 1][enriched_X_columns].copy()
1698
1688
  eval_set_sampled_dict[idx] = (eval_X_sampled, enriched_eval_X, eval_y_sampled)
1699
1689
 
1700
1690
  self.__cached_sampled_datasets = (
@@ -1 +0,0 @@
1
- __version__ = "1.2.9a102"
File without changes
File without changes
File without changes
File without changes
File without changes