upgini 1.2.155.dev1__tar.gz → 1.2.155.dev2__tar.gz

This diff shows the differences between publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.
Files changed (83)
  1. {upgini-1.2.155.dev1 → upgini-1.2.155.dev2}/PKG-INFO +1 -1
  2. upgini-1.2.155.dev2/src/upgini/__about__.py +1 -0
  3. {upgini-1.2.155.dev1 → upgini-1.2.155.dev2}/src/upgini/features_enricher.py +19 -3
  4. upgini-1.2.155.dev1/src/upgini/__about__.py +0 -1
  5. {upgini-1.2.155.dev1 → upgini-1.2.155.dev2}/.gitignore +0 -0
  6. {upgini-1.2.155.dev1 → upgini-1.2.155.dev2}/LICENSE +0 -0
  7. {upgini-1.2.155.dev1 → upgini-1.2.155.dev2}/README.md +0 -0
  8. {upgini-1.2.155.dev1 → upgini-1.2.155.dev2}/pyproject.toml +0 -0
  9. {upgini-1.2.155.dev1 → upgini-1.2.155.dev2}/src/upgini/__init__.py +0 -0
  10. {upgini-1.2.155.dev1 → upgini-1.2.155.dev2}/src/upgini/ads.py +0 -0
  11. {upgini-1.2.155.dev1 → upgini-1.2.155.dev2}/src/upgini/ads_management/__init__.py +0 -0
  12. {upgini-1.2.155.dev1 → upgini-1.2.155.dev2}/src/upgini/ads_management/ads_manager.py +0 -0
  13. {upgini-1.2.155.dev1 → upgini-1.2.155.dev2}/src/upgini/autofe/__init__.py +0 -0
  14. {upgini-1.2.155.dev1 → upgini-1.2.155.dev2}/src/upgini/autofe/all_operators.py +0 -0
  15. {upgini-1.2.155.dev1 → upgini-1.2.155.dev2}/src/upgini/autofe/binary.py +0 -0
  16. {upgini-1.2.155.dev1 → upgini-1.2.155.dev2}/src/upgini/autofe/date.py +0 -0
  17. {upgini-1.2.155.dev1 → upgini-1.2.155.dev2}/src/upgini/autofe/feature.py +0 -0
  18. {upgini-1.2.155.dev1 → upgini-1.2.155.dev2}/src/upgini/autofe/groupby.py +0 -0
  19. {upgini-1.2.155.dev1 → upgini-1.2.155.dev2}/src/upgini/autofe/operator.py +0 -0
  20. {upgini-1.2.155.dev1 → upgini-1.2.155.dev2}/src/upgini/autofe/timeseries/__init__.py +0 -0
  21. {upgini-1.2.155.dev1 → upgini-1.2.155.dev2}/src/upgini/autofe/timeseries/base.py +0 -0
  22. {upgini-1.2.155.dev1 → upgini-1.2.155.dev2}/src/upgini/autofe/timeseries/cross.py +0 -0
  23. {upgini-1.2.155.dev1 → upgini-1.2.155.dev2}/src/upgini/autofe/timeseries/delta.py +0 -0
  24. {upgini-1.2.155.dev1 → upgini-1.2.155.dev2}/src/upgini/autofe/timeseries/lag.py +0 -0
  25. {upgini-1.2.155.dev1 → upgini-1.2.155.dev2}/src/upgini/autofe/timeseries/roll.py +0 -0
  26. {upgini-1.2.155.dev1 → upgini-1.2.155.dev2}/src/upgini/autofe/timeseries/trend.py +0 -0
  27. {upgini-1.2.155.dev1 → upgini-1.2.155.dev2}/src/upgini/autofe/timeseries/volatility.py +0 -0
  28. {upgini-1.2.155.dev1 → upgini-1.2.155.dev2}/src/upgini/autofe/unary.py +0 -0
  29. {upgini-1.2.155.dev1 → upgini-1.2.155.dev2}/src/upgini/autofe/utils.py +0 -0
  30. {upgini-1.2.155.dev1 → upgini-1.2.155.dev2}/src/upgini/autofe/vector.py +0 -0
  31. {upgini-1.2.155.dev1 → upgini-1.2.155.dev2}/src/upgini/data_source/__init__.py +0 -0
  32. {upgini-1.2.155.dev1 → upgini-1.2.155.dev2}/src/upgini/data_source/data_source_publisher.py +0 -0
  33. {upgini-1.2.155.dev1 → upgini-1.2.155.dev2}/src/upgini/dataset.py +0 -0
  34. {upgini-1.2.155.dev1 → upgini-1.2.155.dev2}/src/upgini/errors.py +0 -0
  35. {upgini-1.2.155.dev1 → upgini-1.2.155.dev2}/src/upgini/http.py +0 -0
  36. {upgini-1.2.155.dev1 → upgini-1.2.155.dev2}/src/upgini/mdc/__init__.py +0 -0
  37. {upgini-1.2.155.dev1 → upgini-1.2.155.dev2}/src/upgini/mdc/context.py +0 -0
  38. {upgini-1.2.155.dev1 → upgini-1.2.155.dev2}/src/upgini/metadata.py +0 -0
  39. {upgini-1.2.155.dev1 → upgini-1.2.155.dev2}/src/upgini/metrics.py +0 -0
  40. {upgini-1.2.155.dev1 → upgini-1.2.155.dev2}/src/upgini/normalizer/__init__.py +0 -0
  41. {upgini-1.2.155.dev1 → upgini-1.2.155.dev2}/src/upgini/normalizer/normalize_utils.py +0 -0
  42. {upgini-1.2.155.dev1 → upgini-1.2.155.dev2}/src/upgini/resource_bundle/__init__.py +0 -0
  43. {upgini-1.2.155.dev1 → upgini-1.2.155.dev2}/src/upgini/resource_bundle/exceptions.py +0 -0
  44. {upgini-1.2.155.dev1 → upgini-1.2.155.dev2}/src/upgini/resource_bundle/strings.properties +0 -0
  45. {upgini-1.2.155.dev1 → upgini-1.2.155.dev2}/src/upgini/resource_bundle/strings_widget.properties +0 -0
  46. {upgini-1.2.155.dev1 → upgini-1.2.155.dev2}/src/upgini/sampler/__init__.py +0 -0
  47. {upgini-1.2.155.dev1 → upgini-1.2.155.dev2}/src/upgini/sampler/base.py +0 -0
  48. {upgini-1.2.155.dev1 → upgini-1.2.155.dev2}/src/upgini/sampler/random_under_sampler.py +0 -0
  49. {upgini-1.2.155.dev1 → upgini-1.2.155.dev2}/src/upgini/sampler/utils.py +0 -0
  50. {upgini-1.2.155.dev1 → upgini-1.2.155.dev2}/src/upgini/search_task.py +0 -0
  51. {upgini-1.2.155.dev1 → upgini-1.2.155.dev2}/src/upgini/spinner.py +0 -0
  52. {upgini-1.2.155.dev1 → upgini-1.2.155.dev2}/src/upgini/utils/Roboto-Regular.ttf +0 -0
  53. {upgini-1.2.155.dev1 → upgini-1.2.155.dev2}/src/upgini/utils/__init__.py +0 -0
  54. {upgini-1.2.155.dev1 → upgini-1.2.155.dev2}/src/upgini/utils/base_search_key_detector.py +0 -0
  55. {upgini-1.2.155.dev1 → upgini-1.2.155.dev2}/src/upgini/utils/blocked_time_series.py +0 -0
  56. {upgini-1.2.155.dev1 → upgini-1.2.155.dev2}/src/upgini/utils/config.py +0 -0
  57. {upgini-1.2.155.dev1 → upgini-1.2.155.dev2}/src/upgini/utils/country_utils.py +0 -0
  58. {upgini-1.2.155.dev1 → upgini-1.2.155.dev2}/src/upgini/utils/custom_loss_utils.py +0 -0
  59. {upgini-1.2.155.dev1 → upgini-1.2.155.dev2}/src/upgini/utils/cv_utils.py +0 -0
  60. {upgini-1.2.155.dev1 → upgini-1.2.155.dev2}/src/upgini/utils/datetime_utils.py +0 -0
  61. {upgini-1.2.155.dev1 → upgini-1.2.155.dev2}/src/upgini/utils/deduplicate_utils.py +0 -0
  62. {upgini-1.2.155.dev1 → upgini-1.2.155.dev2}/src/upgini/utils/display_utils.py +0 -0
  63. {upgini-1.2.155.dev1 → upgini-1.2.155.dev2}/src/upgini/utils/email_utils.py +0 -0
  64. {upgini-1.2.155.dev1 → upgini-1.2.155.dev2}/src/upgini/utils/fallback_progress_bar.py +0 -0
  65. {upgini-1.2.155.dev1 → upgini-1.2.155.dev2}/src/upgini/utils/feature_info.py +0 -0
  66. {upgini-1.2.155.dev1 → upgini-1.2.155.dev2}/src/upgini/utils/features_validator.py +0 -0
  67. {upgini-1.2.155.dev1 → upgini-1.2.155.dev2}/src/upgini/utils/format.py +0 -0
  68. {upgini-1.2.155.dev1 → upgini-1.2.155.dev2}/src/upgini/utils/hash_utils.py +0 -0
  69. {upgini-1.2.155.dev1 → upgini-1.2.155.dev2}/src/upgini/utils/ip_utils.py +0 -0
  70. {upgini-1.2.155.dev1 → upgini-1.2.155.dev2}/src/upgini/utils/mstats.py +0 -0
  71. {upgini-1.2.155.dev1 → upgini-1.2.155.dev2}/src/upgini/utils/one_hot_encoder.py +0 -0
  72. {upgini-1.2.155.dev1 → upgini-1.2.155.dev2}/src/upgini/utils/phone_utils.py +0 -0
  73. {upgini-1.2.155.dev1 → upgini-1.2.155.dev2}/src/upgini/utils/postal_code_utils.py +0 -0
  74. {upgini-1.2.155.dev1 → upgini-1.2.155.dev2}/src/upgini/utils/progress_bar.py +0 -0
  75. {upgini-1.2.155.dev1 → upgini-1.2.155.dev2}/src/upgini/utils/psi.py +0 -0
  76. {upgini-1.2.155.dev1 → upgini-1.2.155.dev2}/src/upgini/utils/sample_utils.py +0 -0
  77. {upgini-1.2.155.dev1 → upgini-1.2.155.dev2}/src/upgini/utils/sklearn_ext.py +0 -0
  78. {upgini-1.2.155.dev1 → upgini-1.2.155.dev2}/src/upgini/utils/sort.py +0 -0
  79. {upgini-1.2.155.dev1 → upgini-1.2.155.dev2}/src/upgini/utils/target_utils.py +0 -0
  80. {upgini-1.2.155.dev1 → upgini-1.2.155.dev2}/src/upgini/utils/track_info.py +0 -0
  81. {upgini-1.2.155.dev1 → upgini-1.2.155.dev2}/src/upgini/utils/ts_utils.py +0 -0
  82. {upgini-1.2.155.dev1 → upgini-1.2.155.dev2}/src/upgini/utils/warning_counter.py +0 -0
  83. {upgini-1.2.155.dev1 → upgini-1.2.155.dev2}/src/upgini/version_validator.py +0 -0
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.3
2
2
  Name: upgini
3
- Version: 1.2.155.dev1
3
+ Version: 1.2.155.dev2
4
4
  Summary: Intelligent data search & enrichment for Machine Learning
5
5
  Project-URL: Bug Reports, https://github.com/upgini/upgini/issues
6
6
  Project-URL: Homepage, https://upgini.com/
@@ -0,0 +1 @@
1
+ __version__ = "1.2.155.dev2"
@@ -1537,10 +1537,15 @@ class FeaturesEnricher(TransformerMixin):
1537
1537
 
1538
1538
  checking_eval_set_df[date_column] = date_converter.to_date_ms(eval_set_dates[selected_eval_set_idx].to_frame())
1539
1539
 
1540
- cat_features = [c for c in cat_features if c in checking_eval_set_df.columns]
1540
+ baseline_score_column = self._get_renamed_baseline_score_column()
1541
+ psi_df = checking_eval_set_df
1542
+ if baseline_score_column and baseline_score_column in psi_df.columns:
1543
+ psi_df = psi_df.drop(columns=[baseline_score_column])
1544
+
1545
+ cat_features = [c for c in cat_features if c in psi_df.columns]
1541
1546
 
1542
1547
  psi_values_sparse = calculate_sparsity_psi(
1543
- checking_eval_set_df, cat_features, date_column, self.logger, model_task_type
1548
+ psi_df, cat_features, date_column, self.logger, model_task_type
1544
1549
  )
1545
1550
 
1546
1551
  self.logger.info(f"PSI values by sparsity: {psi_values_sparse}")
@@ -1550,7 +1555,7 @@ class FeaturesEnricher(TransformerMixin):
1550
1555
  self.logger.info(f"Unstable by sparsity features ({stability_threshold}): {sorted(unstable_by_sparsity)}")
1551
1556
 
1552
1557
  psi_values = calculate_features_psi(
1553
- checking_eval_set_df, cat_features, date_column, self.logger, model_task_type, stability_agg_func
1558
+ psi_df, cat_features, date_column, self.logger, model_task_type, stability_agg_func
1554
1559
  )
1555
1560
 
1556
1561
  self.logger.info(f"PSI values by value: {psi_values}")
@@ -1564,6 +1569,8 @@ class FeaturesEnricher(TransformerMixin):
1564
1569
  }
1565
1570
 
1566
1571
  total_unstable_features = sorted(set(unstable_by_sparsity + unstable_by_value))
1572
+ if baseline_score_column:
1573
+ total_unstable_features = [f for f in total_unstable_features if f != baseline_score_column]
1567
1574
 
1568
1575
  return total_unstable_features
1569
1576
 
@@ -1753,6 +1760,15 @@ class FeaturesEnricher(TransformerMixin):
1753
1760
  raise ValidationError(self.bundle.get("cat_feature_search_key").format(cat_feature))
1754
1761
  return cat_features, search_keys_for_metrics
1755
1762
 
1763
+ def _get_renamed_baseline_score_column(self, columns_renaming: dict[str, str] | None = None) -> str | None:
1764
+ if self.baseline_score_column is None:
1765
+ return None
1766
+ if columns_renaming:
1767
+ return columns_renaming.get(self.baseline_score_column, self.baseline_score_column)
1768
+ if self.fit_columns_renaming:
1769
+ return self.fit_columns_renaming.get(self.baseline_score_column, self.baseline_score_column)
1770
+ return self.baseline_score_column
1771
+
1756
1772
  def _get_cat_features_for_psi(
1757
1773
  self,
1758
1774
  client_cat_features: list[str] | None,
@@ -1 +0,0 @@
1
- __version__ = "1.2.155.dev1"
File without changes
File without changes
File without changes