upgini 1.1.244a16__tar.gz → 1.1.244a18__tar.gz

This diff shows the contents of publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.

Potentially problematic release.


This version of upgini might be problematic. Click here for more details.

Files changed (81)
  1. {upgini-1.1.244a16/src/upgini.egg-info → upgini-1.1.244a18}/PKG-INFO +1 -1
  2. {upgini-1.1.244a16 → upgini-1.1.244a18}/setup.py +1 -1
  3. {upgini-1.1.244a16 → upgini-1.1.244a18}/src/upgini/features_enricher.py +3 -1
  4. {upgini-1.1.244a16 → upgini-1.1.244a18}/src/upgini/metrics.py +2 -2
  5. {upgini-1.1.244a16 → upgini-1.1.244a18/src/upgini.egg-info}/PKG-INFO +1 -1
  6. {upgini-1.1.244a16 → upgini-1.1.244a18}/LICENSE +0 -0
  7. {upgini-1.1.244a16 → upgini-1.1.244a18}/README.md +0 -0
  8. {upgini-1.1.244a16 → upgini-1.1.244a18}/pyproject.toml +0 -0
  9. {upgini-1.1.244a16 → upgini-1.1.244a18}/setup.cfg +0 -0
  10. {upgini-1.1.244a16 → upgini-1.1.244a18}/src/upgini/__init__.py +0 -0
  11. {upgini-1.1.244a16 → upgini-1.1.244a18}/src/upgini/ads.py +0 -0
  12. {upgini-1.1.244a16 → upgini-1.1.244a18}/src/upgini/ads_management/__init__.py +0 -0
  13. {upgini-1.1.244a16 → upgini-1.1.244a18}/src/upgini/ads_management/ads_manager.py +0 -0
  14. {upgini-1.1.244a16 → upgini-1.1.244a18}/src/upgini/autofe/__init__.py +0 -0
  15. {upgini-1.1.244a16 → upgini-1.1.244a18}/src/upgini/autofe/all_operands.py +0 -0
  16. {upgini-1.1.244a16 → upgini-1.1.244a18}/src/upgini/autofe/binary.py +0 -0
  17. {upgini-1.1.244a16 → upgini-1.1.244a18}/src/upgini/autofe/feature.py +0 -0
  18. {upgini-1.1.244a16 → upgini-1.1.244a18}/src/upgini/autofe/groupby.py +0 -0
  19. {upgini-1.1.244a16 → upgini-1.1.244a18}/src/upgini/autofe/operand.py +0 -0
  20. {upgini-1.1.244a16 → upgini-1.1.244a18}/src/upgini/autofe/unary.py +0 -0
  21. {upgini-1.1.244a16 → upgini-1.1.244a18}/src/upgini/autofe/vector.py +0 -0
  22. {upgini-1.1.244a16 → upgini-1.1.244a18}/src/upgini/data_source/__init__.py +0 -0
  23. {upgini-1.1.244a16 → upgini-1.1.244a18}/src/upgini/data_source/data_source_publisher.py +0 -0
  24. {upgini-1.1.244a16 → upgini-1.1.244a18}/src/upgini/dataset.py +0 -0
  25. {upgini-1.1.244a16 → upgini-1.1.244a18}/src/upgini/errors.py +0 -0
  26. {upgini-1.1.244a16 → upgini-1.1.244a18}/src/upgini/fingerprint.js +0 -0
  27. {upgini-1.1.244a16 → upgini-1.1.244a18}/src/upgini/http.py +0 -0
  28. {upgini-1.1.244a16 → upgini-1.1.244a18}/src/upgini/mdc/__init__.py +0 -0
  29. {upgini-1.1.244a16 → upgini-1.1.244a18}/src/upgini/mdc/context.py +0 -0
  30. {upgini-1.1.244a16 → upgini-1.1.244a18}/src/upgini/metadata.py +0 -0
  31. {upgini-1.1.244a16 → upgini-1.1.244a18}/src/upgini/normalizer/__init__.py +0 -0
  32. {upgini-1.1.244a16 → upgini-1.1.244a18}/src/upgini/normalizer/phone_normalizer.py +0 -0
  33. {upgini-1.1.244a16 → upgini-1.1.244a18}/src/upgini/resource_bundle/__init__.py +0 -0
  34. {upgini-1.1.244a16 → upgini-1.1.244a18}/src/upgini/resource_bundle/exceptions.py +0 -0
  35. {upgini-1.1.244a16 → upgini-1.1.244a18}/src/upgini/resource_bundle/strings.properties +0 -0
  36. {upgini-1.1.244a16 → upgini-1.1.244a18}/src/upgini/sampler/__init__.py +0 -0
  37. {upgini-1.1.244a16 → upgini-1.1.244a18}/src/upgini/sampler/base.py +0 -0
  38. {upgini-1.1.244a16 → upgini-1.1.244a18}/src/upgini/sampler/random_under_sampler.py +0 -0
  39. {upgini-1.1.244a16 → upgini-1.1.244a18}/src/upgini/sampler/utils.py +0 -0
  40. {upgini-1.1.244a16 → upgini-1.1.244a18}/src/upgini/search_task.py +0 -0
  41. {upgini-1.1.244a16 → upgini-1.1.244a18}/src/upgini/spinner.py +0 -0
  42. {upgini-1.1.244a16 → upgini-1.1.244a18}/src/upgini/utils/__init__.py +0 -0
  43. {upgini-1.1.244a16 → upgini-1.1.244a18}/src/upgini/utils/base_search_key_detector.py +0 -0
  44. {upgini-1.1.244a16 → upgini-1.1.244a18}/src/upgini/utils/blocked_time_series.py +0 -0
  45. {upgini-1.1.244a16 → upgini-1.1.244a18}/src/upgini/utils/country_utils.py +0 -0
  46. {upgini-1.1.244a16 → upgini-1.1.244a18}/src/upgini/utils/custom_loss_utils.py +0 -0
  47. {upgini-1.1.244a16 → upgini-1.1.244a18}/src/upgini/utils/cv_utils.py +0 -0
  48. {upgini-1.1.244a16 → upgini-1.1.244a18}/src/upgini/utils/datetime_utils.py +0 -0
  49. {upgini-1.1.244a16 → upgini-1.1.244a18}/src/upgini/utils/deduplicate_utils.py +0 -0
  50. {upgini-1.1.244a16 → upgini-1.1.244a18}/src/upgini/utils/display_utils.py +0 -0
  51. {upgini-1.1.244a16 → upgini-1.1.244a18}/src/upgini/utils/email_utils.py +0 -0
  52. {upgini-1.1.244a16 → upgini-1.1.244a18}/src/upgini/utils/fallback_progress_bar.py +0 -0
  53. {upgini-1.1.244a16 → upgini-1.1.244a18}/src/upgini/utils/features_validator.py +0 -0
  54. {upgini-1.1.244a16 → upgini-1.1.244a18}/src/upgini/utils/format.py +0 -0
  55. {upgini-1.1.244a16 → upgini-1.1.244a18}/src/upgini/utils/ip_utils.py +0 -0
  56. {upgini-1.1.244a16 → upgini-1.1.244a18}/src/upgini/utils/phone_utils.py +0 -0
  57. {upgini-1.1.244a16 → upgini-1.1.244a18}/src/upgini/utils/postal_code_utils.py +0 -0
  58. {upgini-1.1.244a16 → upgini-1.1.244a18}/src/upgini/utils/progress_bar.py +0 -0
  59. {upgini-1.1.244a16 → upgini-1.1.244a18}/src/upgini/utils/sklearn_ext.py +0 -0
  60. {upgini-1.1.244a16 → upgini-1.1.244a18}/src/upgini/utils/target_utils.py +0 -0
  61. {upgini-1.1.244a16 → upgini-1.1.244a18}/src/upgini/utils/track_info.py +0 -0
  62. {upgini-1.1.244a16 → upgini-1.1.244a18}/src/upgini/utils/warning_counter.py +0 -0
  63. {upgini-1.1.244a16 → upgini-1.1.244a18}/src/upgini/version_validator.py +0 -0
  64. {upgini-1.1.244a16 → upgini-1.1.244a18}/src/upgini.egg-info/SOURCES.txt +0 -0
  65. {upgini-1.1.244a16 → upgini-1.1.244a18}/src/upgini.egg-info/dependency_links.txt +0 -0
  66. {upgini-1.1.244a16 → upgini-1.1.244a18}/src/upgini.egg-info/requires.txt +0 -0
  67. {upgini-1.1.244a16 → upgini-1.1.244a18}/src/upgini.egg-info/top_level.txt +0 -0
  68. {upgini-1.1.244a16 → upgini-1.1.244a18}/tests/test_binary_dataset.py +0 -0
  69. {upgini-1.1.244a16 → upgini-1.1.244a18}/tests/test_blocked_time_series.py +0 -0
  70. {upgini-1.1.244a16 → upgini-1.1.244a18}/tests/test_categorical_dataset.py +0 -0
  71. {upgini-1.1.244a16 → upgini-1.1.244a18}/tests/test_continuous_dataset.py +0 -0
  72. {upgini-1.1.244a16 → upgini-1.1.244a18}/tests/test_country_utils.py +0 -0
  73. {upgini-1.1.244a16 → upgini-1.1.244a18}/tests/test_custom_loss_utils.py +0 -0
  74. {upgini-1.1.244a16 → upgini-1.1.244a18}/tests/test_datetime_utils.py +0 -0
  75. {upgini-1.1.244a16 → upgini-1.1.244a18}/tests/test_email_utils.py +0 -0
  76. {upgini-1.1.244a16 → upgini-1.1.244a18}/tests/test_etalon_validation.py +0 -0
  77. {upgini-1.1.244a16 → upgini-1.1.244a18}/tests/test_features_enricher.py +0 -0
  78. {upgini-1.1.244a16 → upgini-1.1.244a18}/tests/test_metrics.py +0 -0
  79. {upgini-1.1.244a16 → upgini-1.1.244a18}/tests/test_phone_utils.py +0 -0
  80. {upgini-1.1.244a16 → upgini-1.1.244a18}/tests/test_postal_code_utils.py +0 -0
  81. {upgini-1.1.244a16 → upgini-1.1.244a18}/tests/test_widget.py +0 -0
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.1
2
2
  Name: upgini
3
- Version: 1.1.244a16
3
+ Version: 1.1.244a18
4
4
  Summary: Intelligent data search & enrichment for Machine Learning
5
5
  Home-page: https://upgini.com/
6
6
  Author: Upgini Developers
@@ -40,7 +40,7 @@ def send_log(msg: str):
40
40
 
41
41
 
42
42
  here = Path(__file__).parent.resolve()
43
- version = "1.1.244a16"
43
+ version = "1.1.244a18"
44
44
  try:
45
45
  send_log(f"Start setup PyLib version {version}")
46
46
  setup(
@@ -1337,7 +1337,9 @@ class FeaturesEnricher(TransformerMixin):
1337
1337
 
1338
1338
  # Detect and drop high cardinality columns in train
1339
1339
  columns_with_high_cardinality = FeaturesValidator.find_high_cardinality(fitting_X)
1340
- columns_with_high_cardinality = [c for c in columns_with_high_cardinality if c not in self.generate_features]
1340
+ columns_with_high_cardinality = [
1341
+ c for c in columns_with_high_cardinality if c not in (self.generate_features or [])
1342
+ ]
1341
1343
  self.logger.info(
1342
1344
  f"Columns {columns_with_high_cardinality} will be dropped for metrics calculation due to high cardinality"
1343
1345
  )
@@ -416,11 +416,12 @@ class CatBoostWrapper(EstimatorWrapper):
416
416
  if len(self.emb_features) > 3: # There is no reason to reduce embeddings dimension with less than 4
417
417
  X, embedding_features = self.group_embeddings(X)
418
418
  params["embedding_features"] = embedding_features
419
+ else:
420
+ self.emb_features = []
419
421
 
420
422
  # Find text features from passed in generate_features
421
423
  if self.text_features is not None:
422
424
  self.text_features = [f for f in self.text_features if not is_numeric_dtype(X[f])]
423
-
424
425
  params["text_features"] = self.text_features
425
426
 
426
427
  # Find rest categorical features
@@ -464,7 +465,6 @@ class CatBoostWrapper(EstimatorWrapper):
464
465
  df = df.copy()
465
466
  df[self.emb_features] = df[self.emb_features].fillna(0.0)
466
467
  df[emb_name] = df[self.emb_features].values.tolist()
467
- # TODO drop by condition
468
468
  df = df.drop(columns=self.emb_features)
469
469
 
470
470
  return df, [emb_name]
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.1
2
2
  Name: upgini
3
- Version: 1.1.244a16
3
+ Version: 1.1.244a18
4
4
  Summary: Intelligent data search & enrichment for Machine Learning
5
5
  Home-page: https://upgini.com/
6
6
  Author: Upgini Developers
File without changes
File without changes
File without changes
File without changes