upgini 1.1.301__tar.gz → 1.1.303__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (65)
  1. {upgini-1.1.301 → upgini-1.1.303}/PKG-INFO +1 -1
  2. upgini-1.1.303/src/upgini/__about__.py +1 -0
  3. {upgini-1.1.301 → upgini-1.1.303}/src/upgini/data_source/data_source_publisher.py +3 -0
  4. {upgini-1.1.301 → upgini-1.1.303}/src/upgini/features_enricher.py +3 -0
  5. {upgini-1.1.301 → upgini-1.1.303}/src/upgini/metadata.py +1 -1
  6. {upgini-1.1.301 → upgini-1.1.303}/src/upgini/resource_bundle/strings.properties +1 -0
  7. {upgini-1.1.301 → upgini-1.1.303}/src/upgini/utils/datetime_utils.py +5 -2
  8. upgini-1.1.301/src/upgini/__about__.py +0 -1
  9. {upgini-1.1.301 → upgini-1.1.303}/.gitignore +0 -0
  10. {upgini-1.1.301 → upgini-1.1.303}/LICENSE +0 -0
  11. {upgini-1.1.301 → upgini-1.1.303}/README.md +0 -0
  12. {upgini-1.1.301 → upgini-1.1.303}/pyproject.toml +0 -0
  13. {upgini-1.1.301 → upgini-1.1.303}/src/upgini/__init__.py +0 -0
  14. {upgini-1.1.301 → upgini-1.1.303}/src/upgini/ads.py +0 -0
  15. {upgini-1.1.301 → upgini-1.1.303}/src/upgini/ads_management/__init__.py +0 -0
  16. {upgini-1.1.301 → upgini-1.1.303}/src/upgini/ads_management/ads_manager.py +0 -0
  17. {upgini-1.1.301 → upgini-1.1.303}/src/upgini/autofe/__init__.py +0 -0
  18. {upgini-1.1.301 → upgini-1.1.303}/src/upgini/autofe/all_operands.py +0 -0
  19. {upgini-1.1.301 → upgini-1.1.303}/src/upgini/autofe/binary.py +0 -0
  20. {upgini-1.1.301 → upgini-1.1.303}/src/upgini/autofe/date.py +0 -0
  21. {upgini-1.1.301 → upgini-1.1.303}/src/upgini/autofe/feature.py +0 -0
  22. {upgini-1.1.301 → upgini-1.1.303}/src/upgini/autofe/groupby.py +0 -0
  23. {upgini-1.1.301 → upgini-1.1.303}/src/upgini/autofe/operand.py +0 -0
  24. {upgini-1.1.301 → upgini-1.1.303}/src/upgini/autofe/unary.py +0 -0
  25. {upgini-1.1.301 → upgini-1.1.303}/src/upgini/autofe/vector.py +0 -0
  26. {upgini-1.1.301 → upgini-1.1.303}/src/upgini/data_source/__init__.py +0 -0
  27. {upgini-1.1.301 → upgini-1.1.303}/src/upgini/dataset.py +0 -0
  28. {upgini-1.1.301 → upgini-1.1.303}/src/upgini/errors.py +0 -0
  29. {upgini-1.1.301 → upgini-1.1.303}/src/upgini/http.py +0 -0
  30. {upgini-1.1.301 → upgini-1.1.303}/src/upgini/lazy_import.py +0 -0
  31. {upgini-1.1.301 → upgini-1.1.303}/src/upgini/mdc/__init__.py +0 -0
  32. {upgini-1.1.301 → upgini-1.1.303}/src/upgini/mdc/context.py +0 -0
  33. {upgini-1.1.301 → upgini-1.1.303}/src/upgini/metrics.py +0 -0
  34. {upgini-1.1.301 → upgini-1.1.303}/src/upgini/normalizer/__init__.py +0 -0
  35. {upgini-1.1.301 → upgini-1.1.303}/src/upgini/normalizer/phone_normalizer.py +0 -0
  36. {upgini-1.1.301 → upgini-1.1.303}/src/upgini/resource_bundle/__init__.py +0 -0
  37. {upgini-1.1.301 → upgini-1.1.303}/src/upgini/resource_bundle/exceptions.py +0 -0
  38. {upgini-1.1.301 → upgini-1.1.303}/src/upgini/resource_bundle/strings_widget.properties +0 -0
  39. {upgini-1.1.301 → upgini-1.1.303}/src/upgini/sampler/__init__.py +0 -0
  40. {upgini-1.1.301 → upgini-1.1.303}/src/upgini/sampler/base.py +0 -0
  41. {upgini-1.1.301 → upgini-1.1.303}/src/upgini/sampler/random_under_sampler.py +0 -0
  42. {upgini-1.1.301 → upgini-1.1.303}/src/upgini/sampler/utils.py +0 -0
  43. {upgini-1.1.301 → upgini-1.1.303}/src/upgini/search_task.py +0 -0
  44. {upgini-1.1.301 → upgini-1.1.303}/src/upgini/spinner.py +0 -0
  45. {upgini-1.1.301 → upgini-1.1.303}/src/upgini/utils/__init__.py +0 -0
  46. {upgini-1.1.301 → upgini-1.1.303}/src/upgini/utils/base_search_key_detector.py +0 -0
  47. {upgini-1.1.301 → upgini-1.1.303}/src/upgini/utils/blocked_time_series.py +0 -0
  48. {upgini-1.1.301 → upgini-1.1.303}/src/upgini/utils/country_utils.py +0 -0
  49. {upgini-1.1.301 → upgini-1.1.303}/src/upgini/utils/custom_loss_utils.py +0 -0
  50. {upgini-1.1.301 → upgini-1.1.303}/src/upgini/utils/cv_utils.py +0 -0
  51. {upgini-1.1.301 → upgini-1.1.303}/src/upgini/utils/deduplicate_utils.py +0 -0
  52. {upgini-1.1.301 → upgini-1.1.303}/src/upgini/utils/display_utils.py +0 -0
  53. {upgini-1.1.301 → upgini-1.1.303}/src/upgini/utils/email_utils.py +0 -0
  54. {upgini-1.1.301 → upgini-1.1.303}/src/upgini/utils/fallback_progress_bar.py +0 -0
  55. {upgini-1.1.301 → upgini-1.1.303}/src/upgini/utils/features_validator.py +0 -0
  56. {upgini-1.1.301 → upgini-1.1.303}/src/upgini/utils/format.py +0 -0
  57. {upgini-1.1.301 → upgini-1.1.303}/src/upgini/utils/ip_utils.py +0 -0
  58. {upgini-1.1.301 → upgini-1.1.303}/src/upgini/utils/phone_utils.py +0 -0
  59. {upgini-1.1.301 → upgini-1.1.303}/src/upgini/utils/postal_code_utils.py +0 -0
  60. {upgini-1.1.301 → upgini-1.1.303}/src/upgini/utils/progress_bar.py +0 -0
  61. {upgini-1.1.301 → upgini-1.1.303}/src/upgini/utils/sklearn_ext.py +0 -0
  62. {upgini-1.1.301 → upgini-1.1.303}/src/upgini/utils/target_utils.py +0 -0
  63. {upgini-1.1.301 → upgini-1.1.303}/src/upgini/utils/track_info.py +0 -0
  64. {upgini-1.1.301 → upgini-1.1.303}/src/upgini/utils/warning_counter.py +0 -0
  65. {upgini-1.1.301 → upgini-1.1.303}/src/upgini/version_validator.py +0 -0
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.3
2
2
  Name: upgini
3
- Version: 1.1.301
3
+ Version: 1.1.303
4
4
  Summary: Intelligent data search & enrichment for Machine Learning
5
5
  Project-URL: Bug Reports, https://github.com/upgini/upgini/issues
6
6
  Project-URL: Homepage, https://upgini.com/
@@ -0,0 +1 @@
1
+ __version__ = "1.1.303"
@@ -82,6 +82,9 @@ class DataSourcePublisher:
82
82
 
83
83
  date_format - optional str - format of date if it is present in search keys
84
84
 
85
+ features_for_embeddings - optional list of str - list of features that should be used for GPT features
86
+ generation
87
+
85
88
  ...
86
89
 
87
90
  data_table_id_to_replace - optional str - id of registered ADS that should be replaced by new table
@@ -3483,6 +3483,9 @@ class FeaturesEnricher(TransformerMixin):
3483
3483
  is_transform=False,
3484
3484
  silent_mode=False,
3485
3485
  ):
3486
+ for _, key_type in search_keys.items():
3487
+ if not isinstance(key_type, SearchKey):
3488
+ raise ValidationError(self.bundle.get("unsupported_type_of_search_key").format(key_type))
3486
3489
  valid_search_keys = {}
3487
3490
  unsupported_search_keys = {
3488
3491
  SearchKey.IP_RANGE_FROM,
@@ -191,7 +191,7 @@ class FileColumnMetadata(BaseModel):
191
191
  # whether this column contains keys from multiple key columns like msisdn1, msisdn2
192
192
  isUnnest: bool = False
193
193
  # list of original etalon key column names like msisdn1, msisdn2
194
- unnestKeyNames: Optional[list[str]]
194
+ unnestKeyNames: Optional[List[str]]
195
195
 
196
196
 
197
197
  class FileMetadata(BaseModel):
@@ -85,6 +85,7 @@ unregistered_only_personal_keys=Only personal search keys used. Api_key from pro
85
85
  search_key_not_found=Column `{}` from search_keys was not found in X dataframe: {}
86
86
  numeric_search_key_not_found=Index {} in search_keys is out of bounds for {} columns of X dataframe
87
87
  unsupported_search_key_type=Unsupported type of key in search_keys: {}
88
+ unsupported_type_of_search_key=Unsupported type of search key: {}. It should be a member of SearchKey
88
89
  search_key_country_and_country_code=\nWARNING: SearchKey.COUNTRY and country_code parameter were passed simultaneously. Parameter country_code will be ignored
89
90
  empty_search_key=Search key {} is empty. Please fill values or remove this search key
90
91
  single_constant_search_key=\nWARNING: Constant value detected for the {} search key in the X dataframe: {}.\nThat search key will add constant features for different y values.\nPlease add extra search keys with non constant values, like the COUNTRY, POSTAL_CODE, DATE, PHONE NUMBER, EMAIL/HEM or IPv4
@@ -31,7 +31,7 @@ DATE_FORMATS = [
31
31
  "%Y-%m-%dT%H:%M:%S.%f",
32
32
  ]
33
33
 
34
- DATETIME_PATTERN = r"^[\d\s\.\-:T]+$"
34
+ DATETIME_PATTERN = r"^[\d\s\.\-:T/]+$"
35
35
 
36
36
 
37
37
  class DateTimeSearchKeyConverter:
@@ -147,7 +147,10 @@ class DateTimeSearchKeyConverter:
147
147
  return pd.to_datetime(df[self.date_column], format=date_format)
148
148
  except ValueError:
149
149
  pass
150
- raise ValidationError(self.bundle.get("invalid_date_format").format(self.date_column))
150
+ try:
151
+ return pd.to_datetime(df[self.date_column])
152
+ except ValueError:
153
+ raise ValidationError(self.bundle.get("invalid_date_format").format(self.date_column))
151
154
 
152
155
 
153
156
  def is_time_series(df: pd.DataFrame, date_col: str) -> bool:
@@ -1 +0,0 @@
1
- __version__ = "1.1.301"
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes