upgini 1.1.301__py3-none-any.whl → 1.1.303__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Potentially problematic release.
This version of upgini might be problematic. Click here for more details.
- upgini/__about__.py +1 -1
- upgini/data_source/data_source_publisher.py +3 -0
- upgini/features_enricher.py +3 -0
- upgini/metadata.py +1 -1
- upgini/resource_bundle/strings.properties +1 -0
- upgini/utils/datetime_utils.py +5 -2
- {upgini-1.1.301.dist-info → upgini-1.1.303.dist-info}/METADATA +1 -1
- {upgini-1.1.301.dist-info → upgini-1.1.303.dist-info}/RECORD +10 -10
- {upgini-1.1.301.dist-info → upgini-1.1.303.dist-info}/WHEEL +0 -0
- {upgini-1.1.301.dist-info → upgini-1.1.303.dist-info}/licenses/LICENSE +0 -0
upgini/__about__.py
CHANGED
|
@@ -1 +1 @@
|
|
|
1
|
-
__version__ = "1.1.301"
|
|
1
|
+
__version__ = "1.1.303"
|
|
@@ -82,6 +82,9 @@ class DataSourcePublisher:
|
|
|
82
82
|
|
|
83
83
|
date_format - optional str - format of date if it is present in search keys
|
|
84
84
|
|
|
85
|
+
features_for_embeddings - optional list of str - list of features that should be used for GPT features
|
|
86
|
+
generation
|
|
87
|
+
|
|
85
88
|
...
|
|
86
89
|
|
|
87
90
|
data_table_id_to_replace - optional str - id of registered ADS that should be replaced by new table
|
upgini/features_enricher.py
CHANGED
|
@@ -3483,6 +3483,9 @@ class FeaturesEnricher(TransformerMixin):
|
|
|
3483
3483
|
is_transform=False,
|
|
3484
3484
|
silent_mode=False,
|
|
3485
3485
|
):
|
|
3486
|
+
for _, key_type in search_keys.items():
|
|
3487
|
+
if not isinstance(key_type, SearchKey):
|
|
3488
|
+
raise ValidationError(self.bundle.get("unsupported_type_of_search_key").format(key_type))
|
|
3486
3489
|
valid_search_keys = {}
|
|
3487
3490
|
unsupported_search_keys = {
|
|
3488
3491
|
SearchKey.IP_RANGE_FROM,
|
upgini/metadata.py
CHANGED
|
@@ -191,7 +191,7 @@ class FileColumnMetadata(BaseModel):
|
|
|
191
191
|
# is this column contains keys from multiple key columns like msisdn1, msisdn2
|
|
192
192
|
isUnnest: bool = False
|
|
193
193
|
# list of original etalon key column names like msisdn1, msisdn2
|
|
194
|
-
unnestKeyNames: Optional[
|
|
194
|
+
unnestKeyNames: Optional[List[str]]
|
|
195
195
|
|
|
196
196
|
|
|
197
197
|
class FileMetadata(BaseModel):
|
|
@@ -85,6 +85,7 @@ unregistered_only_personal_keys=Only personal search keys used. Api_key from pro
|
|
|
85
85
|
search_key_not_found=Column `{}` from search_keys was not found in X dataframe: {}
|
|
86
86
|
numeric_search_key_not_found=Index {} in search_keys is out of bounds for {} columns of X dataframe
|
|
87
87
|
unsupported_search_key_type=Unsupported type of key in search_keys: {}
|
|
88
|
+
unsupported_type_of_search_key=Unsupported type of search key: {}. It should be a member of SearcKey
|
|
88
89
|
search_key_country_and_country_code=\nWARNING: SearchKey.COUNTRY and country_code parameter were passed simultaniously. Parameter country_code will be ignored
|
|
89
90
|
empty_search_key=Search key {} is empty. Please fill values or remove this search key
|
|
90
91
|
single_constant_search_key=\nWARNING: Constant value detected for the {} search key in the X dataframe: {}.\nThat search key will add constant features for different y values.\nPlease add extra search keys with non constant values, like the COUNTRY, POSTAL_CODE, DATE, PHONE NUMBER, EMAIL/HEM or IPv4
|
upgini/utils/datetime_utils.py
CHANGED
|
@@ -31,7 +31,7 @@ DATE_FORMATS = [
|
|
|
31
31
|
"%Y-%m-%dT%H:%M:%S.%f",
|
|
32
32
|
]
|
|
33
33
|
|
|
34
|
-
DATETIME_PATTERN = r"^[\d\s\.\-:T]+$"
|
|
34
|
+
DATETIME_PATTERN = r"^[\d\s\.\-:T/]+$"
|
|
35
35
|
|
|
36
36
|
|
|
37
37
|
class DateTimeSearchKeyConverter:
|
|
@@ -147,7 +147,10 @@ class DateTimeSearchKeyConverter:
|
|
|
147
147
|
return pd.to_datetime(df[self.date_column], format=date_format)
|
|
148
148
|
except ValueError:
|
|
149
149
|
pass
|
|
150
|
-
|
|
150
|
+
try:
|
|
151
|
+
return pd.to_datetime(df[self.date_column])
|
|
152
|
+
except ValueError:
|
|
153
|
+
raise ValidationError(self.bundle.get("invalid_date_format").format(self.date_column))
|
|
151
154
|
|
|
152
155
|
|
|
153
156
|
def is_time_series(df: pd.DataFrame, date_col: str) -> bool:
|
|
@@ -1,12 +1,12 @@
|
|
|
1
|
-
upgini/__about__.py,sha256=
|
|
1
|
+
upgini/__about__.py,sha256=DZ-j6x_TqRaD5W2xKCfhOLDmhOQuGblZWwKIzlYBLkg,24
|
|
2
2
|
upgini/__init__.py,sha256=ObEtjFkIssl83qeKNMLpIQygfwK8TzztwiI43YTsAP0,353
|
|
3
3
|
upgini/ads.py,sha256=nvuRxRx5MHDMgPr9SiU-fsqRdFaBv8p4_v1oqiysKpc,2714
|
|
4
4
|
upgini/dataset.py,sha256=MOzBVsvzlHLxNfPWtMaXC_jIPeW7_gUvbSGeXnsPgNI,46158
|
|
5
5
|
upgini/errors.py,sha256=2b_Wbo0OYhLUbrZqdLIx5jBnAsiD1Mcenh-VjR4HCTw,950
|
|
6
|
-
upgini/features_enricher.py,sha256=
|
|
6
|
+
upgini/features_enricher.py,sha256=PRiQGAmnm9jPXN4Uqus5l8RQIPAWPxsIBnIoEMnh6g8,183342
|
|
7
7
|
upgini/http.py,sha256=bp6jWl422Icy3AhHMdCcJv5NjExE45gSMmzMTPJjPuk,42600
|
|
8
8
|
upgini/lazy_import.py,sha256=EwoM0msNGbSmWBhGbrLDny1DSnOlvTxCjmMKPxYlDms,610
|
|
9
|
-
upgini/metadata.py,sha256=
|
|
9
|
+
upgini/metadata.py,sha256=E5WWZ_MkjGyYNQh_LnwMIBHyqPx1fxk-qhEfQIJnzq8,10209
|
|
10
10
|
upgini/metrics.py,sha256=Tu5cN8RlhOSSMWUTXRSkdl8SWBqR1N_2eJpBum9pZxc,30926
|
|
11
11
|
upgini/search_task.py,sha256=LtRJ9bCPjMo1gJ-sUDKERhDwGcWKImrzwVFHjkMSQHQ,17071
|
|
12
12
|
upgini/spinner.py,sha256=4iMd-eIe_BnkqFEMIliULTbj6rNI2HkN_VJ4qYe0cUc,1118
|
|
@@ -23,14 +23,14 @@ upgini/autofe/operand.py,sha256=MKEsl3zxpWzRDpTkE0sNJxTu62U20sWOvEKhPjUWS6s,2915
|
|
|
23
23
|
upgini/autofe/unary.py,sha256=ZWjLd-CUkNt_PpM8YuWLLipW1v_RdBlsl4JxXIVo9aM,3652
|
|
24
24
|
upgini/autofe/vector.py,sha256=dLxfAstJs-gw_OQ1xxoxcM6pVzORlV0HVzdzt7cLXVQ,606
|
|
25
25
|
upgini/data_source/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
|
26
|
-
upgini/data_source/data_source_publisher.py,sha256=
|
|
26
|
+
upgini/data_source/data_source_publisher.py,sha256=aCVpZ3RGlYToRYYNHjC2BxIxnnKUyrrF29MncCXhVlE,19716
|
|
27
27
|
upgini/mdc/__init__.py,sha256=aM08nIWFc2gWdWUa3_IuEnNND0cQPkBGnYpRMnfFN8k,1019
|
|
28
28
|
upgini/mdc/context.py,sha256=3u1B-jXt7tXEvNcV3qmR9SDCseudnY7KYsLclBdwVLk,1405
|
|
29
29
|
upgini/normalizer/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
|
30
30
|
upgini/normalizer/phone_normalizer.py,sha256=EzTaahk6myRv6ZXgbyVFGY4kpo_2VlQgOrm5_lfbmNI,9996
|
|
31
31
|
upgini/resource_bundle/__init__.py,sha256=S5F2G47pnJd2LDpmFsjDqEwiKkP8Hm-hcseDbMka6Ko,8345
|
|
32
32
|
upgini/resource_bundle/exceptions.py,sha256=5fRvx0_vWdE1-7HcSgF0tckB4A9AKyf5RiinZkInTsI,621
|
|
33
|
-
upgini/resource_bundle/strings.properties,sha256=
|
|
33
|
+
upgini/resource_bundle/strings.properties,sha256=WZAuYPX2Dpn6BHoA3RX8uvMNMr-yJE2fF7Gz0i24x2s,26459
|
|
34
34
|
upgini/resource_bundle/strings_widget.properties,sha256=gOdqvZWntP2LCza_tyVk1_yRYcG4c04K9sQOAVhF_gw,1577
|
|
35
35
|
upgini/sampler/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
|
36
36
|
upgini/sampler/base.py,sha256=7GpjYqjOp58vYcJLiX__1R5wjUlyQbxvHJ2klFnup_M,6389
|
|
@@ -42,7 +42,7 @@ upgini/utils/blocked_time_series.py,sha256=Uqr3vp4YqNclj2-PzEYqVy763GSXHn86sbpIl
|
|
|
42
42
|
upgini/utils/country_utils.py,sha256=yE8oRgMpXuJxPfQm4fioY6dg6700HgVnHSk4Cv9sUyM,6511
|
|
43
43
|
upgini/utils/custom_loss_utils.py,sha256=kieNZYBYZm5ZGBltF1F_jOSF4ea6C29rYuCyiDcqVNY,3857
|
|
44
44
|
upgini/utils/cv_utils.py,sha256=w6FQb9nO8BWDx88EF83NpjPLarK4eR4ia0Wg0kLBJC4,3525
|
|
45
|
-
upgini/utils/datetime_utils.py,sha256=
|
|
45
|
+
upgini/utils/datetime_utils.py,sha256=uJ3wJNr4KQvDJ-gSOLcmP85hLtASK271o6mob4aZT90,11064
|
|
46
46
|
upgini/utils/deduplicate_utils.py,sha256=Zvs7zW4QzaERQmJNPrTVf2ZTVBkBLOycFCzyMwtXuV8,8770
|
|
47
47
|
upgini/utils/display_utils.py,sha256=A2ouB5eiZ-Kyt9ykYxkLQwyoRPrdYeJymwNTiajtFXs,10990
|
|
48
48
|
upgini/utils/email_utils.py,sha256=aKHa4xVBSsEsiZtFCPj_DrUaFupceYfvJeP_e8w_D5E,3813
|
|
@@ -57,7 +57,7 @@ upgini/utils/sklearn_ext.py,sha256=13jQS_k7v0aUtudXV6nGUEWjttPQzAW9AFYL5wgEz9k,4
|
|
|
57
57
|
upgini/utils/target_utils.py,sha256=Y96_PJ5cC-WsEbeqg20v9uqywDQobLoTb-xoP7S3o4E,7807
|
|
58
58
|
upgini/utils/track_info.py,sha256=G5Lu1xxakg2_TQjKZk4b5SvrHsATTXNVV3NbvWtT8k8,5663
|
|
59
59
|
upgini/utils/warning_counter.py,sha256=dIWBB4dI5XRRJZudvIlqlIYKEiwLLPcXarsZuYRt338,227
|
|
60
|
-
upgini-1.1.
|
|
61
|
-
upgini-1.1.
|
|
62
|
-
upgini-1.1.
|
|
63
|
-
upgini-1.1.
|
|
60
|
+
upgini-1.1.303.dist-info/METADATA,sha256=4RboHCgNVmHfmPnjut5UyMzn9qd7AMlCsBWnfk8QD0s,48153
|
|
61
|
+
upgini-1.1.303.dist-info/WHEEL,sha256=1yFddiXMmvYK7QYTqtRNtX66WJ0Mz8PYEiEUoOUUxRY,87
|
|
62
|
+
upgini-1.1.303.dist-info/licenses/LICENSE,sha256=5RRzgvdJUu3BUDfv4bzVU6FqKgwHlIay63pPCSmSgzw,1514
|
|
63
|
+
upgini-1.1.303.dist-info/RECORD,,
|
|
File without changes
|
|
File without changes
|