upgini 1.1.253a3__tar.gz → 1.1.253a5__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.


This version of upgini might be problematic.

Files changed (83):
  1. {upgini-1.1.253a3/src/upgini.egg-info → upgini-1.1.253a5}/PKG-INFO +1 -1
  2. {upgini-1.1.253a3 → upgini-1.1.253a5}/setup.py +1 -1
  3. {upgini-1.1.253a3 → upgini-1.1.253a5}/src/upgini/features_enricher.py +4 -1
  4. {upgini-1.1.253a3 → upgini-1.1.253a5}/src/upgini/utils/target_utils.py +1 -1
  5. {upgini-1.1.253a3 → upgini-1.1.253a5/src/upgini.egg-info}/PKG-INFO +1 -1
  6. {upgini-1.1.253a3 → upgini-1.1.253a5}/tests/test_features_enricher.py +11 -10
  7. {upgini-1.1.253a3 → upgini-1.1.253a5}/tests/test_metrics.py +3 -3
  8. {upgini-1.1.253a3 → upgini-1.1.253a5}/LICENSE +0 -0
  9. {upgini-1.1.253a3 → upgini-1.1.253a5}/README.md +0 -0
  10. {upgini-1.1.253a3 → upgini-1.1.253a5}/pyproject.toml +0 -0
  11. {upgini-1.1.253a3 → upgini-1.1.253a5}/setup.cfg +0 -0
  12. {upgini-1.1.253a3 → upgini-1.1.253a5}/src/upgini/__init__.py +0 -0
  13. {upgini-1.1.253a3 → upgini-1.1.253a5}/src/upgini/ads.py +0 -0
  14. {upgini-1.1.253a3 → upgini-1.1.253a5}/src/upgini/ads_management/__init__.py +0 -0
  15. {upgini-1.1.253a3 → upgini-1.1.253a5}/src/upgini/ads_management/ads_manager.py +0 -0
  16. {upgini-1.1.253a3 → upgini-1.1.253a5}/src/upgini/autofe/__init__.py +0 -0
  17. {upgini-1.1.253a3 → upgini-1.1.253a5}/src/upgini/autofe/all_operands.py +0 -0
  18. {upgini-1.1.253a3 → upgini-1.1.253a5}/src/upgini/autofe/binary.py +0 -0
  19. {upgini-1.1.253a3 → upgini-1.1.253a5}/src/upgini/autofe/feature.py +0 -0
  20. {upgini-1.1.253a3 → upgini-1.1.253a5}/src/upgini/autofe/groupby.py +0 -0
  21. {upgini-1.1.253a3 → upgini-1.1.253a5}/src/upgini/autofe/operand.py +0 -0
  22. {upgini-1.1.253a3 → upgini-1.1.253a5}/src/upgini/autofe/unary.py +0 -0
  23. {upgini-1.1.253a3 → upgini-1.1.253a5}/src/upgini/autofe/vector.py +0 -0
  24. {upgini-1.1.253a3 → upgini-1.1.253a5}/src/upgini/data_source/__init__.py +0 -0
  25. {upgini-1.1.253a3 → upgini-1.1.253a5}/src/upgini/data_source/data_source_publisher.py +0 -0
  26. {upgini-1.1.253a3 → upgini-1.1.253a5}/src/upgini/dataset.py +0 -0
  27. {upgini-1.1.253a3 → upgini-1.1.253a5}/src/upgini/errors.py +0 -0
  28. {upgini-1.1.253a3 → upgini-1.1.253a5}/src/upgini/fingerprint.js +0 -0
  29. {upgini-1.1.253a3 → upgini-1.1.253a5}/src/upgini/http.py +0 -0
  30. {upgini-1.1.253a3 → upgini-1.1.253a5}/src/upgini/mdc/__init__.py +0 -0
  31. {upgini-1.1.253a3 → upgini-1.1.253a5}/src/upgini/mdc/context.py +0 -0
  32. {upgini-1.1.253a3 → upgini-1.1.253a5}/src/upgini/metadata.py +0 -0
  33. {upgini-1.1.253a3 → upgini-1.1.253a5}/src/upgini/metrics.py +0 -0
  34. {upgini-1.1.253a3 → upgini-1.1.253a5}/src/upgini/normalizer/__init__.py +0 -0
  35. {upgini-1.1.253a3 → upgini-1.1.253a5}/src/upgini/normalizer/phone_normalizer.py +0 -0
  36. {upgini-1.1.253a3 → upgini-1.1.253a5}/src/upgini/resource_bundle/__init__.py +0 -0
  37. {upgini-1.1.253a3 → upgini-1.1.253a5}/src/upgini/resource_bundle/exceptions.py +0 -0
  38. {upgini-1.1.253a3 → upgini-1.1.253a5}/src/upgini/resource_bundle/strings.properties +0 -0
  39. {upgini-1.1.253a3 → upgini-1.1.253a5}/src/upgini/resource_bundle/strings_widget.properties +0 -0
  40. {upgini-1.1.253a3 → upgini-1.1.253a5}/src/upgini/sampler/__init__.py +0 -0
  41. {upgini-1.1.253a3 → upgini-1.1.253a5}/src/upgini/sampler/base.py +0 -0
  42. {upgini-1.1.253a3 → upgini-1.1.253a5}/src/upgini/sampler/random_under_sampler.py +0 -0
  43. {upgini-1.1.253a3 → upgini-1.1.253a5}/src/upgini/sampler/utils.py +0 -0
  44. {upgini-1.1.253a3 → upgini-1.1.253a5}/src/upgini/search_task.py +0 -0
  45. {upgini-1.1.253a3 → upgini-1.1.253a5}/src/upgini/spinner.py +0 -0
  46. {upgini-1.1.253a3 → upgini-1.1.253a5}/src/upgini/utils/__init__.py +0 -0
  47. {upgini-1.1.253a3 → upgini-1.1.253a5}/src/upgini/utils/base_search_key_detector.py +0 -0
  48. {upgini-1.1.253a3 → upgini-1.1.253a5}/src/upgini/utils/blocked_time_series.py +0 -0
  49. {upgini-1.1.253a3 → upgini-1.1.253a5}/src/upgini/utils/country_utils.py +0 -0
  50. {upgini-1.1.253a3 → upgini-1.1.253a5}/src/upgini/utils/custom_loss_utils.py +0 -0
  51. {upgini-1.1.253a3 → upgini-1.1.253a5}/src/upgini/utils/cv_utils.py +0 -0
  52. {upgini-1.1.253a3 → upgini-1.1.253a5}/src/upgini/utils/datetime_utils.py +0 -0
  53. {upgini-1.1.253a3 → upgini-1.1.253a5}/src/upgini/utils/deduplicate_utils.py +0 -0
  54. {upgini-1.1.253a3 → upgini-1.1.253a5}/src/upgini/utils/display_utils.py +0 -0
  55. {upgini-1.1.253a3 → upgini-1.1.253a5}/src/upgini/utils/email_utils.py +0 -0
  56. {upgini-1.1.253a3 → upgini-1.1.253a5}/src/upgini/utils/fallback_progress_bar.py +0 -0
  57. {upgini-1.1.253a3 → upgini-1.1.253a5}/src/upgini/utils/features_validator.py +0 -0
  58. {upgini-1.1.253a3 → upgini-1.1.253a5}/src/upgini/utils/format.py +0 -0
  59. {upgini-1.1.253a3 → upgini-1.1.253a5}/src/upgini/utils/ip_utils.py +0 -0
  60. {upgini-1.1.253a3 → upgini-1.1.253a5}/src/upgini/utils/phone_utils.py +0 -0
  61. {upgini-1.1.253a3 → upgini-1.1.253a5}/src/upgini/utils/postal_code_utils.py +0 -0
  62. {upgini-1.1.253a3 → upgini-1.1.253a5}/src/upgini/utils/progress_bar.py +0 -0
  63. {upgini-1.1.253a3 → upgini-1.1.253a5}/src/upgini/utils/sklearn_ext.py +0 -0
  64. {upgini-1.1.253a3 → upgini-1.1.253a5}/src/upgini/utils/track_info.py +0 -0
  65. {upgini-1.1.253a3 → upgini-1.1.253a5}/src/upgini/utils/warning_counter.py +0 -0
  66. {upgini-1.1.253a3 → upgini-1.1.253a5}/src/upgini/version_validator.py +0 -0
  67. {upgini-1.1.253a3 → upgini-1.1.253a5}/src/upgini.egg-info/SOURCES.txt +0 -0
  68. {upgini-1.1.253a3 → upgini-1.1.253a5}/src/upgini.egg-info/dependency_links.txt +0 -0
  69. {upgini-1.1.253a3 → upgini-1.1.253a5}/src/upgini.egg-info/requires.txt +0 -0
  70. {upgini-1.1.253a3 → upgini-1.1.253a5}/src/upgini.egg-info/top_level.txt +0 -0
  71. {upgini-1.1.253a3 → upgini-1.1.253a5}/tests/test_binary_dataset.py +0 -0
  72. {upgini-1.1.253a3 → upgini-1.1.253a5}/tests/test_blocked_time_series.py +0 -0
  73. {upgini-1.1.253a3 → upgini-1.1.253a5}/tests/test_categorical_dataset.py +0 -0
  74. {upgini-1.1.253a3 → upgini-1.1.253a5}/tests/test_continuous_dataset.py +0 -0
  75. {upgini-1.1.253a3 → upgini-1.1.253a5}/tests/test_country_utils.py +0 -0
  76. {upgini-1.1.253a3 → upgini-1.1.253a5}/tests/test_custom_loss_utils.py +0 -0
  77. {upgini-1.1.253a3 → upgini-1.1.253a5}/tests/test_datetime_utils.py +0 -0
  78. {upgini-1.1.253a3 → upgini-1.1.253a5}/tests/test_email_utils.py +0 -0
  79. {upgini-1.1.253a3 → upgini-1.1.253a5}/tests/test_etalon_validation.py +0 -0
  80. {upgini-1.1.253a3 → upgini-1.1.253a5}/tests/test_phone_utils.py +0 -0
  81. {upgini-1.1.253a3 → upgini-1.1.253a5}/tests/test_postal_code_utils.py +0 -0
  82. {upgini-1.1.253a3 → upgini-1.1.253a5}/tests/test_target_utils.py +0 -0
  83. {upgini-1.1.253a3 → upgini-1.1.253a5}/tests/test_widget.py +0 -0
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.1
2
2
  Name: upgini
3
- Version: 1.1.253a3
3
+ Version: 1.1.253a5
4
4
  Summary: Intelligent data search & enrichment for Machine Learning
5
5
  Home-page: https://upgini.com/
6
6
  Author: Upgini Developers
@@ -40,7 +40,7 @@ def send_log(msg: str):
40
40
 
41
41
 
42
42
  here = Path(__file__).parent.resolve()
43
- version = "1.1.253a3"
43
+ version = "1.1.253a5"
44
44
  try:
45
45
  send_log(f"Start setup PyLib version {version}")
46
46
  setup(
@@ -3022,6 +3022,7 @@ class FeaturesEnricher(TransformerMixin):
3022
3022
  return result_train, result_eval_sets
3023
3023
 
3024
3024
  def __prepare_feature_importances(self, trace_id: str, x_columns: List[str], silent=False):
3025
+ llm_source = "LLM with external data augmentation"
3025
3026
  if self._search_task is None:
3026
3027
  raise NotFittedError(self.bundle.get("transform_unfitted_enricher"))
3027
3028
  features_meta = self._search_task.get_all_features_metadata_v2()
@@ -3076,6 +3077,8 @@ class FeaturesEnricher(TransformerMixin):
3076
3077
  return ""
3077
3078
  elif not link:
3078
3079
  return value
3080
+ elif value == llm_source:
3081
+ return value
3079
3082
  else:
3080
3083
  return f"<a href='{link}' target='_blank' rel='noopener noreferrer'>{value}</a>"
3081
3084
 
@@ -3092,7 +3095,7 @@ class FeaturesEnricher(TransformerMixin):
3092
3095
  provider = to_anchor("https://upgini.com", "Upgini")
3093
3096
 
3094
3097
  internal_source = feature_meta.data_source or (
3095
- "LLM with external data augmentation"
3098
+ llm_source
3096
3099
  if not feature_meta.name.endswith("_country") and not feature_meta.name.endswith("_postal_code")
3097
3100
  else ""
3098
3101
  )
@@ -152,7 +152,7 @@ def balance_undersample(
152
152
  # fill up to min_sample_threshold by majority class
153
153
  minority_class = df[df[target_column] == min_class_value]
154
154
  majority_class = df[df[target_column] != min_class_value]
155
- sample_size = min(len(majority_class, min_sample_threshold - min_class_count))
155
+ sample_size = min(len(majority_class), min_sample_threshold - min_class_count)
156
156
  sampled_majority_class = majority_class.sample(
157
157
  n=sample_size, random_state=random_state
158
158
  )
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.1
2
2
  Name: upgini
3
- Version: 1.1.253a3
3
+ Version: 1.1.253a5
4
4
  Summary: Intelligent data search & enrichment for Machine Learning
5
5
  Home-page: https://upgini.com/
6
6
  Author: Upgini Developers
@@ -2574,9 +2574,9 @@ def test_unsupported_arguments(requests_mock: Mocker):
2574
2574
 
2575
2575
  df = pd.DataFrame(
2576
2576
  {
2577
- "date": ["2021-01-01", "2021-01-02", "2023-01-01", "2023-01-02"],
2578
- "feature": [11, 10, 12, 13],
2579
- "target": [0, 1, 0, 1],
2577
+ "date": ["2021-01-01", "2021-01-02", "2023-01-01", "2023-01-02", "2023-01-03"],
2578
+ "feature": [11, 10, 12, 13, 14],
2579
+ "target": [0, 1, 0, 1, 0],
2580
2580
  }
2581
2581
  )
2582
2582
 
@@ -2603,13 +2603,14 @@ def test_unsupported_arguments(requests_mock: Mocker):
2603
2603
 
2604
2604
  enricher.transform(df.drop(columns="target"), "unsupported_positional_argument", unsupported_key_argument=False)
2605
2605
 
2606
- enricher.calculate_metrics(
2607
- df.drop(columns="target"),
2608
- df["target"],
2609
- [(df.drop(columns="target"), df["target"])],
2610
- "unsupported_positional_argument",
2611
- unsupported_key_argument=False,
2612
- )
2606
+ with pytest.raises(ValueError, match="Only one class present in y_true. ROC AUC score is not defined in that case."):
2607
+ enricher.calculate_metrics(
2608
+ df.drop(columns="target"),
2609
+ df["target"],
2610
+ [(df.drop(columns="target"), df["target"])],
2611
+ "unsupported_positional_argument",
2612
+ unsupported_key_argument=False,
2613
+ )
2613
2614
  finally:
2614
2615
  Dataset.MIN_ROWS_COUNT = original_min_rows
2615
2616
 
@@ -258,9 +258,9 @@ def test_demo_metrics(requests_mock: Mocker):
258
258
  segment_header: [train_segment],
259
259
  rows_header: [464],
260
260
  target_mean_header: [100.7802],
261
- baseline_mae: [21.5089],
262
- enriched_mae: [20.8841],
263
- uplift: [0.624774],
261
+ baseline_mae: [21.18862],
262
+ enriched_mae: [20.862484],
263
+ uplift: [0.326136],
264
264
  }
265
265
  )
266
266
 
File without changes
File without changes
File without changes
File without changes
File without changes