upgini 1.2.52a2__py3-none-any.whl → 1.2.54__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Potentially problematic release.
This version of upgini might be problematic. Click here for more details.
- upgini/__about__.py +1 -1
- upgini/features_enricher.py +1 -1
- upgini/http.py +4 -1
- upgini/metadata.py +24 -22
- {upgini-1.2.52a2.dist-info → upgini-1.2.54.dist-info}/METADATA +1 -1
- {upgini-1.2.52a2.dist-info → upgini-1.2.54.dist-info}/RECORD +8 -8
- {upgini-1.2.52a2.dist-info → upgini-1.2.54.dist-info}/WHEEL +0 -0
- {upgini-1.2.52a2.dist-info → upgini-1.2.54.dist-info}/licenses/LICENSE +0 -0
upgini/__about__.py
CHANGED
|
@@ -1 +1 @@
|
|
|
1
|
-
__version__ = "1.2.52a2"
|
|
1
|
+
__version__ = "1.2.54"
|
upgini/features_enricher.py
CHANGED
|
@@ -268,7 +268,7 @@ class FeaturesEnricher(TransformerMixin):
|
|
|
268
268
|
self.eval_set: Optional[List[Tuple]] = None
|
|
269
269
|
self.autodetected_search_keys: Dict[str, SearchKey] = {}
|
|
270
270
|
self.imbalanced = False
|
|
271
|
-
self.fit_select_features =
|
|
271
|
+
self.fit_select_features = True
|
|
272
272
|
self.__cached_sampled_datasets: Dict[str, Tuple[pd.DataFrame, pd.DataFrame, pd.Series, Dict, Dict, Dict]] = (
|
|
273
273
|
dict()
|
|
274
274
|
)
|
upgini/http.py
CHANGED
|
@@ -358,7 +358,10 @@ class _RestClient:
|
|
|
358
358
|
self._syncronized_refresh_access_token()
|
|
359
359
|
return request()
|
|
360
360
|
except HttpError as e:
|
|
361
|
-
if
|
|
361
|
+
if e.status_code == 429:
|
|
362
|
+
time.sleep(random.randint(1, 10))
|
|
363
|
+
return self._with_unauth_retry(request, try_number)
|
|
364
|
+
if e.status_code >= 500 and try_number < 3:
|
|
362
365
|
time.sleep(random.randint(1, 10))
|
|
363
366
|
return self._with_unauth_retry(request, try_number + 1)
|
|
364
367
|
elif e.status_code == 400 and "MD5Exception".lower() in e.message.lower() and try_number < 3:
|
upgini/metadata.py
CHANGED
|
@@ -89,7 +89,7 @@ class SearchKey(Enum):
|
|
|
89
89
|
if meaning_type == FileColumnMeaningType.EMAIL:
|
|
90
90
|
return SearchKey.EMAIL
|
|
91
91
|
if meaning_type == FileColumnMeaningType.HEM:
|
|
92
|
-
return SearchKey.HEM
|
|
92
|
+
return SearchKey.HEM # TODO check that it wasn't EMAIL
|
|
93
93
|
if meaning_type == FileColumnMeaningType.IP_ADDRESS:
|
|
94
94
|
return SearchKey.IP
|
|
95
95
|
if meaning_type == FileColumnMeaningType.MSISDN:
|
|
@@ -105,27 +105,27 @@ class SearchKey(Enum):
|
|
|
105
105
|
if meaning_type == FileColumnMeaningType.POSTAL_CODE:
|
|
106
106
|
return SearchKey.POSTAL_CODE
|
|
107
107
|
if meaning_type == FileColumnMeaningType.IPV6_ADDRESS:
|
|
108
|
-
return SearchKey.
|
|
109
|
-
if meaning_type == FileColumnMeaningType.IPV6_RANGE_FROM:
|
|
110
|
-
|
|
111
|
-
if meaning_type == FileColumnMeaningType.IPV6_RANGE_TO:
|
|
112
|
-
|
|
113
|
-
if meaning_type == FileColumnMeaningType.EMAIL_ONE_DOMAIN:
|
|
114
|
-
|
|
115
|
-
if meaning_type == FileColumnMeaningType.IP_RANGE_FROM:
|
|
116
|
-
|
|
117
|
-
if meaning_type == FileColumnMeaningType.IP_RANGE_TO:
|
|
118
|
-
|
|
119
|
-
if meaning_type == FileColumnMeaningType.MSISDN_RANGE_FROM:
|
|
120
|
-
|
|
121
|
-
if meaning_type == FileColumnMeaningType.MSISDN_RANGE_TO:
|
|
122
|
-
|
|
108
|
+
return SearchKey.IP
|
|
109
|
+
# if meaning_type == FileColumnMeaningType.IPV6_RANGE_FROM:
|
|
110
|
+
# return SearchKey.IPV6_RANGE_FROM
|
|
111
|
+
# if meaning_type == FileColumnMeaningType.IPV6_RANGE_TO:
|
|
112
|
+
# return SearchKey.IPV6_RANGE_TO
|
|
113
|
+
# if meaning_type == FileColumnMeaningType.EMAIL_ONE_DOMAIN:
|
|
114
|
+
# return SearchKey.EMAIL_ONE_DOMAIN
|
|
115
|
+
# if meaning_type == FileColumnMeaningType.IP_RANGE_FROM:
|
|
116
|
+
# return SearchKey.IP_RANGE_FROM
|
|
117
|
+
# if meaning_type == FileColumnMeaningType.IP_RANGE_TO:
|
|
118
|
+
# return SearchKey.IP_RANGE_TO
|
|
119
|
+
# if meaning_type == FileColumnMeaningType.MSISDN_RANGE_FROM:
|
|
120
|
+
# return SearchKey.MSISDN_RANGE_FROM
|
|
121
|
+
# if meaning_type == FileColumnMeaningType.MSISDN_RANGE_TO:
|
|
122
|
+
# return SearchKey.MSISDN_RANGE_TO
|
|
123
123
|
if meaning_type == FileColumnMeaningType.IP_BINARY:
|
|
124
|
-
return SearchKey.
|
|
125
|
-
if meaning_type == FileColumnMeaningType.IP_RANGE_FROM_BINARY:
|
|
126
|
-
|
|
127
|
-
if meaning_type == FileColumnMeaningType.IP_RANGE_TO_BINARY:
|
|
128
|
-
|
|
124
|
+
return SearchKey.IP
|
|
125
|
+
# if meaning_type == FileColumnMeaningType.IP_RANGE_FROM_BINARY:
|
|
126
|
+
# return SearchKey.IP_RANGE_FROM_BINARY
|
|
127
|
+
# if meaning_type == FileColumnMeaningType.IP_RANGE_TO_BINARY:
|
|
128
|
+
# return SearchKey.IP_RANGE_TO_BINARY
|
|
129
129
|
|
|
130
130
|
@staticmethod
|
|
131
131
|
def find_key(search_keys: Dict[str, SearchKey], keys: Union[SearchKey, List[SearchKey]]) -> Optional[SearchKey]:
|
|
@@ -249,7 +249,9 @@ class FileMetadata(BaseModel):
|
|
|
249
249
|
for key in keys_group:
|
|
250
250
|
column = self.column_by_name(key)
|
|
251
251
|
if column:
|
|
252
|
-
|
|
252
|
+
search_key = SearchKey.from_meaning_type(column.meaningType)
|
|
253
|
+
if search_key is not None:
|
|
254
|
+
search_keys[search_key] = column.name
|
|
253
255
|
return search_keys
|
|
254
256
|
|
|
255
257
|
|
|
@@ -1,12 +1,12 @@
|
|
|
1
|
-
upgini/__about__.py,sha256=
|
|
1
|
+
upgini/__about__.py,sha256=odKPoW2Uo_GtuB_RtRePNSus8XWCbeAFRoczr8nT784,23
|
|
2
2
|
upgini/__init__.py,sha256=LXSfTNU0HnlOkE69VCxkgIKDhWP-JFo_eBQ71OxTr5Y,261
|
|
3
3
|
upgini/ads.py,sha256=nvuRxRx5MHDMgPr9SiU-fsqRdFaBv8p4_v1oqiysKpc,2714
|
|
4
4
|
upgini/dataset.py,sha256=vT4JyHmafLNbj54SySXr93f5hNS6-t94aFslbBy-7No,33535
|
|
5
5
|
upgini/errors.py,sha256=2b_Wbo0OYhLUbrZqdLIx5jBnAsiD1Mcenh-VjR4HCTw,950
|
|
6
|
-
upgini/features_enricher.py,sha256=
|
|
7
|
-
upgini/http.py,sha256=
|
|
6
|
+
upgini/features_enricher.py,sha256=RDdzFJKBOg9ZT1fbOFMFOMn7O_gbG_8bvbUeNywHOl4,200627
|
|
7
|
+
upgini/http.py,sha256=ud0Cp7h0jNeHuuZGpU_1dAAEiabGoJjGxc1X5oeBQr4,43496
|
|
8
8
|
upgini/lazy_import.py,sha256=74gQ8JuA48BGRLxAo7lNHNKY2D2emMxrUxKGdxVGhuY,1012
|
|
9
|
-
upgini/metadata.py,sha256
|
|
9
|
+
upgini/metadata.py,sha256=Jh6YTaS00m_nbaOY_owvlSyn9zgkErkqu8iTr9ZjKI8,12279
|
|
10
10
|
upgini/metrics.py,sha256=hr7UwLphbZ_FEglLuO2lzr_pFgxOJ4c3WBeg7H-fNqY,35521
|
|
11
11
|
upgini/search_task.py,sha256=qxUxAD-bed-FpZYmTB_4orW7YJsW_O6a1TcgnZIRFr4,17307
|
|
12
12
|
upgini/spinner.py,sha256=4iMd-eIe_BnkqFEMIliULTbj6rNI2HkN_VJ4qYe0cUc,1118
|
|
@@ -59,7 +59,7 @@ upgini/utils/sklearn_ext.py,sha256=13jQS_k7v0aUtudXV6nGUEWjttPQzAW9AFYL5wgEz9k,4
|
|
|
59
59
|
upgini/utils/target_utils.py,sha256=RlpKGss9kMibVSlA8iZuO_qxmyeplqzn7X8g6hiGGGs,14341
|
|
60
60
|
upgini/utils/track_info.py,sha256=G5Lu1xxakg2_TQjKZk4b5SvrHsATTXNVV3NbvWtT8k8,5663
|
|
61
61
|
upgini/utils/warning_counter.py,sha256=-GRY8EUggEBKODPSuXAkHn9KnEQwAORC0mmz_tim-PM,254
|
|
62
|
-
upgini-1.2.
|
|
63
|
-
upgini-1.2.
|
|
64
|
-
upgini-1.2.
|
|
65
|
-
upgini-1.2.
|
|
62
|
+
upgini-1.2.54.dist-info/METADATA,sha256=UsKRAySU92ST26c9W_bfCOMEYHBNOQTweVVeL4mfA9I,49055
|
|
63
|
+
upgini-1.2.54.dist-info/WHEEL,sha256=1yFddiXMmvYK7QYTqtRNtX66WJ0Mz8PYEiEUoOUUxRY,87
|
|
64
|
+
upgini-1.2.54.dist-info/licenses/LICENSE,sha256=5RRzgvdJUu3BUDfv4bzVU6FqKgwHlIay63pPCSmSgzw,1514
|
|
65
|
+
upgini-1.2.54.dist-info/RECORD,,
|
|
File without changes
|
|
File without changes
|