upgini 1.1.301__py3-none-any.whl → 1.1.303__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.


This version of upgini might be problematic. Click here for more details.

upgini/__about__.py CHANGED
@@ -1 +1 @@
1
- __version__ = "1.1.301"
1
+ __version__ = "1.1.303"
@@ -82,6 +82,9 @@ class DataSourcePublisher:
82
82
 
83
83
  date_format - optional str - format of date if it is present in search keys
84
84
 
85
+ features_for_embeddings - optional list of str - list of features that should be used for GPT features
86
+ generation
87
+
85
88
  ...
86
89
 
87
90
  data_table_id_to_replace - optional str - id of registered ADS that should be replaced by new table
@@ -3483,6 +3483,9 @@ class FeaturesEnricher(TransformerMixin):
3483
3483
  is_transform=False,
3484
3484
  silent_mode=False,
3485
3485
  ):
3486
+ for _, key_type in search_keys.items():
3487
+ if not isinstance(key_type, SearchKey):
3488
+ raise ValidationError(self.bundle.get("unsupported_type_of_search_key").format(key_type))
3486
3489
  valid_search_keys = {}
3487
3490
  unsupported_search_keys = {
3488
3491
  SearchKey.IP_RANGE_FROM,
upgini/metadata.py CHANGED
@@ -191,7 +191,7 @@ class FileColumnMetadata(BaseModel):
191
191
  # whether this column contains keys from multiple key columns like msisdn1, msisdn2
192
192
  isUnnest: bool = False
193
193
  # list of original etalon key column names like msisdn1, msisdn2
194
- unnestKeyNames: Optional[list[str]]
194
+ unnestKeyNames: Optional[List[str]]
195
195
 
196
196
 
197
197
  class FileMetadata(BaseModel):
@@ -85,6 +85,7 @@ unregistered_only_personal_keys=Only personal search keys used. Api_key from pro
85
85
  search_key_not_found=Column `{}` from search_keys was not found in X dataframe: {}
86
86
  numeric_search_key_not_found=Index {} in search_keys is out of bounds for {} columns of X dataframe
87
87
  unsupported_search_key_type=Unsupported type of key in search_keys: {}
88
+ unsupported_type_of_search_key=Unsupported type of search key: {}. It should be a member of SearchKey
88
89
  search_key_country_and_country_code=\nWARNING: SearchKey.COUNTRY and country_code parameter were passed simultaneously. Parameter country_code will be ignored
89
90
  empty_search_key=Search key {} is empty. Please fill values or remove this search key
90
91
  single_constant_search_key=\nWARNING: Constant value detected for the {} search key in the X dataframe: {}.\nThat search key will add constant features for different y values.\nPlease add extra search keys with non constant values, like the COUNTRY, POSTAL_CODE, DATE, PHONE NUMBER, EMAIL/HEM or IPv4
@@ -31,7 +31,7 @@ DATE_FORMATS = [
31
31
  "%Y-%m-%dT%H:%M:%S.%f",
32
32
  ]
33
33
 
34
- DATETIME_PATTERN = r"^[\d\s\.\-:T]+$"
34
+ DATETIME_PATTERN = r"^[\d\s\.\-:T/]+$"
35
35
 
36
36
 
37
37
  class DateTimeSearchKeyConverter:
@@ -147,7 +147,10 @@ class DateTimeSearchKeyConverter:
147
147
  return pd.to_datetime(df[self.date_column], format=date_format)
148
148
  except ValueError:
149
149
  pass
150
- raise ValidationError(self.bundle.get("invalid_date_format").format(self.date_column))
150
+ try:
151
+ return pd.to_datetime(df[self.date_column])
152
+ except ValueError:
153
+ raise ValidationError(self.bundle.get("invalid_date_format").format(self.date_column))
151
154
 
152
155
 
153
156
  def is_time_series(df: pd.DataFrame, date_col: str) -> bool:
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.3
2
2
  Name: upgini
3
- Version: 1.1.301
3
+ Version: 1.1.303
4
4
  Summary: Intelligent data search & enrichment for Machine Learning
5
5
  Project-URL: Bug Reports, https://github.com/upgini/upgini/issues
6
6
  Project-URL: Homepage, https://upgini.com/
@@ -1,12 +1,12 @@
1
- upgini/__about__.py,sha256=L11AcDL4xom7Zln7UryeDX6XjWGUw7VdTIlPlnfMwTc,24
1
+ upgini/__about__.py,sha256=DZ-j6x_TqRaD5W2xKCfhOLDmhOQuGblZWwKIzlYBLkg,24
2
2
  upgini/__init__.py,sha256=ObEtjFkIssl83qeKNMLpIQygfwK8TzztwiI43YTsAP0,353
3
3
  upgini/ads.py,sha256=nvuRxRx5MHDMgPr9SiU-fsqRdFaBv8p4_v1oqiysKpc,2714
4
4
  upgini/dataset.py,sha256=MOzBVsvzlHLxNfPWtMaXC_jIPeW7_gUvbSGeXnsPgNI,46158
5
5
  upgini/errors.py,sha256=2b_Wbo0OYhLUbrZqdLIx5jBnAsiD1Mcenh-VjR4HCTw,950
6
- upgini/features_enricher.py,sha256=OW3aQ0vyaKMrxWBhptdvb_SAxNqf7H6jssOFdfW20mc,183136
6
+ upgini/features_enricher.py,sha256=PRiQGAmnm9jPXN4Uqus5l8RQIPAWPxsIBnIoEMnh6g8,183342
7
7
  upgini/http.py,sha256=bp6jWl422Icy3AhHMdCcJv5NjExE45gSMmzMTPJjPuk,42600
8
8
  upgini/lazy_import.py,sha256=EwoM0msNGbSmWBhGbrLDny1DSnOlvTxCjmMKPxYlDms,610
9
- upgini/metadata.py,sha256=wOFCJruDBhC4Hiiiqf8GeHZnnm6rhJy8t6fg5B0Z4TQ,10209
9
+ upgini/metadata.py,sha256=E5WWZ_MkjGyYNQh_LnwMIBHyqPx1fxk-qhEfQIJnzq8,10209
10
10
  upgini/metrics.py,sha256=Tu5cN8RlhOSSMWUTXRSkdl8SWBqR1N_2eJpBum9pZxc,30926
11
11
  upgini/search_task.py,sha256=LtRJ9bCPjMo1gJ-sUDKERhDwGcWKImrzwVFHjkMSQHQ,17071
12
12
  upgini/spinner.py,sha256=4iMd-eIe_BnkqFEMIliULTbj6rNI2HkN_VJ4qYe0cUc,1118
@@ -23,14 +23,14 @@ upgini/autofe/operand.py,sha256=MKEsl3zxpWzRDpTkE0sNJxTu62U20sWOvEKhPjUWS6s,2915
23
23
  upgini/autofe/unary.py,sha256=ZWjLd-CUkNt_PpM8YuWLLipW1v_RdBlsl4JxXIVo9aM,3652
24
24
  upgini/autofe/vector.py,sha256=dLxfAstJs-gw_OQ1xxoxcM6pVzORlV0HVzdzt7cLXVQ,606
25
25
  upgini/data_source/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
26
- upgini/data_source/data_source_publisher.py,sha256=1cQZrK630VztwGGDp41ec9gqIeUtkefaqSSQEitVWiM,19581
26
+ upgini/data_source/data_source_publisher.py,sha256=aCVpZ3RGlYToRYYNHjC2BxIxnnKUyrrF29MncCXhVlE,19716
27
27
  upgini/mdc/__init__.py,sha256=aM08nIWFc2gWdWUa3_IuEnNND0cQPkBGnYpRMnfFN8k,1019
28
28
  upgini/mdc/context.py,sha256=3u1B-jXt7tXEvNcV3qmR9SDCseudnY7KYsLclBdwVLk,1405
29
29
  upgini/normalizer/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
30
30
  upgini/normalizer/phone_normalizer.py,sha256=EzTaahk6myRv6ZXgbyVFGY4kpo_2VlQgOrm5_lfbmNI,9996
31
31
  upgini/resource_bundle/__init__.py,sha256=S5F2G47pnJd2LDpmFsjDqEwiKkP8Hm-hcseDbMka6Ko,8345
32
32
  upgini/resource_bundle/exceptions.py,sha256=5fRvx0_vWdE1-7HcSgF0tckB4A9AKyf5RiinZkInTsI,621
33
- upgini/resource_bundle/strings.properties,sha256=6jYqcxj06ZopXwr5YYMGXX1QiNNJNFo2SuwAR0qleRk,26358
33
+ upgini/resource_bundle/strings.properties,sha256=WZAuYPX2Dpn6BHoA3RX8uvMNMr-yJE2fF7Gz0i24x2s,26459
34
34
  upgini/resource_bundle/strings_widget.properties,sha256=gOdqvZWntP2LCza_tyVk1_yRYcG4c04K9sQOAVhF_gw,1577
35
35
  upgini/sampler/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
36
36
  upgini/sampler/base.py,sha256=7GpjYqjOp58vYcJLiX__1R5wjUlyQbxvHJ2klFnup_M,6389
@@ -42,7 +42,7 @@ upgini/utils/blocked_time_series.py,sha256=Uqr3vp4YqNclj2-PzEYqVy763GSXHn86sbpIl
42
42
  upgini/utils/country_utils.py,sha256=yE8oRgMpXuJxPfQm4fioY6dg6700HgVnHSk4Cv9sUyM,6511
43
43
  upgini/utils/custom_loss_utils.py,sha256=kieNZYBYZm5ZGBltF1F_jOSF4ea6C29rYuCyiDcqVNY,3857
44
44
  upgini/utils/cv_utils.py,sha256=w6FQb9nO8BWDx88EF83NpjPLarK4eR4ia0Wg0kLBJC4,3525
45
- upgini/utils/datetime_utils.py,sha256=Ujmu1ouwSFtG5SywQXJlmtDnGigAnIWPdE5Vx5NvgUM,10951
45
+ upgini/utils/datetime_utils.py,sha256=uJ3wJNr4KQvDJ-gSOLcmP85hLtASK271o6mob4aZT90,11064
46
46
  upgini/utils/deduplicate_utils.py,sha256=Zvs7zW4QzaERQmJNPrTVf2ZTVBkBLOycFCzyMwtXuV8,8770
47
47
  upgini/utils/display_utils.py,sha256=A2ouB5eiZ-Kyt9ykYxkLQwyoRPrdYeJymwNTiajtFXs,10990
48
48
  upgini/utils/email_utils.py,sha256=aKHa4xVBSsEsiZtFCPj_DrUaFupceYfvJeP_e8w_D5E,3813
@@ -57,7 +57,7 @@ upgini/utils/sklearn_ext.py,sha256=13jQS_k7v0aUtudXV6nGUEWjttPQzAW9AFYL5wgEz9k,4
57
57
  upgini/utils/target_utils.py,sha256=Y96_PJ5cC-WsEbeqg20v9uqywDQobLoTb-xoP7S3o4E,7807
58
58
  upgini/utils/track_info.py,sha256=G5Lu1xxakg2_TQjKZk4b5SvrHsATTXNVV3NbvWtT8k8,5663
59
59
  upgini/utils/warning_counter.py,sha256=dIWBB4dI5XRRJZudvIlqlIYKEiwLLPcXarsZuYRt338,227
60
- upgini-1.1.301.dist-info/METADATA,sha256=DzWKpZGrQ1cMxlEFVzE0GFg3Zl64sJvjYydjx4u6xhA,48153
61
- upgini-1.1.301.dist-info/WHEEL,sha256=1yFddiXMmvYK7QYTqtRNtX66WJ0Mz8PYEiEUoOUUxRY,87
62
- upgini-1.1.301.dist-info/licenses/LICENSE,sha256=5RRzgvdJUu3BUDfv4bzVU6FqKgwHlIay63pPCSmSgzw,1514
63
- upgini-1.1.301.dist-info/RECORD,,
60
+ upgini-1.1.303.dist-info/METADATA,sha256=4RboHCgNVmHfmPnjut5UyMzn9qd7AMlCsBWnfk8QD0s,48153
61
+ upgini-1.1.303.dist-info/WHEEL,sha256=1yFddiXMmvYK7QYTqtRNtX66WJ0Mz8PYEiEUoOUUxRY,87
62
+ upgini-1.1.303.dist-info/licenses/LICENSE,sha256=5RRzgvdJUu3BUDfv4bzVU6FqKgwHlIay63pPCSmSgzw,1514
63
+ upgini-1.1.303.dist-info/RECORD,,