upgini 1.2.52a2__py3-none-any.whl → 1.2.54__py3-none-any.whl

This diff shows the contents of publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.

Potentially problematic release.


This version of upgini might be problematic. Click here for more details.

upgini/__about__.py CHANGED
@@ -1 +1 @@
1
- __version__ = "1.2.52a2"
1
+ __version__ = "1.2.54"
@@ -268,7 +268,7 @@ class FeaturesEnricher(TransformerMixin):
268
268
  self.eval_set: Optional[List[Tuple]] = None
269
269
  self.autodetected_search_keys: Dict[str, SearchKey] = {}
270
270
  self.imbalanced = False
271
- self.fit_select_features = False
271
+ self.fit_select_features = True
272
272
  self.__cached_sampled_datasets: Dict[str, Tuple[pd.DataFrame, pd.DataFrame, pd.Series, Dict, Dict, Dict]] = (
273
273
  dict()
274
274
  )
upgini/http.py CHANGED
@@ -358,7 +358,10 @@ class _RestClient:
358
358
  self._syncronized_refresh_access_token()
359
359
  return request()
360
360
  except HttpError as e:
361
- if (e.status_code == 429 or e.status_code >= 500) and try_number < 3:
361
+ if e.status_code == 429:
362
+ time.sleep(random.randint(1, 10))
363
+ return self._with_unauth_retry(request, try_number)
364
+ if e.status_code >= 500 and try_number < 3:
362
365
  time.sleep(random.randint(1, 10))
363
366
  return self._with_unauth_retry(request, try_number + 1)
364
367
  elif e.status_code == 400 and "MD5Exception".lower() in e.message.lower() and try_number < 3:
upgini/metadata.py CHANGED
@@ -89,7 +89,7 @@ class SearchKey(Enum):
89
89
  if meaning_type == FileColumnMeaningType.EMAIL:
90
90
  return SearchKey.EMAIL
91
91
  if meaning_type == FileColumnMeaningType.HEM:
92
- return SearchKey.HEM
92
+ return SearchKey.HEM # TODO check that it wasn't EMAIL
93
93
  if meaning_type == FileColumnMeaningType.IP_ADDRESS:
94
94
  return SearchKey.IP
95
95
  if meaning_type == FileColumnMeaningType.MSISDN:
@@ -105,27 +105,27 @@ class SearchKey(Enum):
105
105
  if meaning_type == FileColumnMeaningType.POSTAL_CODE:
106
106
  return SearchKey.POSTAL_CODE
107
107
  if meaning_type == FileColumnMeaningType.IPV6_ADDRESS:
108
- return SearchKey.IPV6_ADDRESS
109
- if meaning_type == FileColumnMeaningType.IPV6_RANGE_FROM:
110
- return SearchKey.IPV6_RANGE_FROM
111
- if meaning_type == FileColumnMeaningType.IPV6_RANGE_TO:
112
- return SearchKey.IPV6_RANGE_TO
113
- if meaning_type == FileColumnMeaningType.EMAIL_ONE_DOMAIN:
114
- return SearchKey.EMAIL_ONE_DOMAIN
115
- if meaning_type == FileColumnMeaningType.IP_RANGE_FROM:
116
- return SearchKey.IP_RANGE_FROM
117
- if meaning_type == FileColumnMeaningType.IP_RANGE_TO:
118
- return SearchKey.IP_RANGE_TO
119
- if meaning_type == FileColumnMeaningType.MSISDN_RANGE_FROM:
120
- return SearchKey.MSISDN_RANGE_FROM
121
- if meaning_type == FileColumnMeaningType.MSISDN_RANGE_TO:
122
- return SearchKey.MSISDN_RANGE_TO
108
+ return SearchKey.IP
109
+ # if meaning_type == FileColumnMeaningType.IPV6_RANGE_FROM:
110
+ # return SearchKey.IPV6_RANGE_FROM
111
+ # if meaning_type == FileColumnMeaningType.IPV6_RANGE_TO:
112
+ # return SearchKey.IPV6_RANGE_TO
113
+ # if meaning_type == FileColumnMeaningType.EMAIL_ONE_DOMAIN:
114
+ # return SearchKey.EMAIL_ONE_DOMAIN
115
+ # if meaning_type == FileColumnMeaningType.IP_RANGE_FROM:
116
+ # return SearchKey.IP_RANGE_FROM
117
+ # if meaning_type == FileColumnMeaningType.IP_RANGE_TO:
118
+ # return SearchKey.IP_RANGE_TO
119
+ # if meaning_type == FileColumnMeaningType.MSISDN_RANGE_FROM:
120
+ # return SearchKey.MSISDN_RANGE_FROM
121
+ # if meaning_type == FileColumnMeaningType.MSISDN_RANGE_TO:
122
+ # return SearchKey.MSISDN_RANGE_TO
123
123
  if meaning_type == FileColumnMeaningType.IP_BINARY:
124
- return SearchKey.IP_BINARY
125
- if meaning_type == FileColumnMeaningType.IP_RANGE_FROM_BINARY:
126
- return SearchKey.IP_RANGE_FROM_BINARY
127
- if meaning_type == FileColumnMeaningType.IP_RANGE_TO_BINARY:
128
- return SearchKey.IP_RANGE_TO_BINARY
124
+ return SearchKey.IP
125
+ # if meaning_type == FileColumnMeaningType.IP_RANGE_FROM_BINARY:
126
+ # return SearchKey.IP_RANGE_FROM_BINARY
127
+ # if meaning_type == FileColumnMeaningType.IP_RANGE_TO_BINARY:
128
+ # return SearchKey.IP_RANGE_TO_BINARY
129
129
 
130
130
  @staticmethod
131
131
  def find_key(search_keys: Dict[str, SearchKey], keys: Union[SearchKey, List[SearchKey]]) -> Optional[SearchKey]:
@@ -249,7 +249,9 @@ class FileMetadata(BaseModel):
249
249
  for key in keys_group:
250
250
  column = self.column_by_name(key)
251
251
  if column:
252
- search_keys[SearchKey.from_meaning_type(column.meaningType)] = column.name
252
+ search_key = SearchKey.from_meaning_type(column.meaningType)
253
+ if search_key is not None:
254
+ search_keys[search_key] = column.name
253
255
  return search_keys
254
256
 
255
257
 
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.3
2
2
  Name: upgini
3
- Version: 1.2.52a2
3
+ Version: 1.2.54
4
4
  Summary: Intelligent data search & enrichment for Machine Learning
5
5
  Project-URL: Bug Reports, https://github.com/upgini/upgini/issues
6
6
  Project-URL: Homepage, https://upgini.com/
@@ -1,12 +1,12 @@
1
- upgini/__about__.py,sha256=975QRO3wSYiniBo2LVNW4q4A5uoxrBhfbb6AFwD83g0,25
1
+ upgini/__about__.py,sha256=odKPoW2Uo_GtuB_RtRePNSus8XWCbeAFRoczr8nT784,23
2
2
  upgini/__init__.py,sha256=LXSfTNU0HnlOkE69VCxkgIKDhWP-JFo_eBQ71OxTr5Y,261
3
3
  upgini/ads.py,sha256=nvuRxRx5MHDMgPr9SiU-fsqRdFaBv8p4_v1oqiysKpc,2714
4
4
  upgini/dataset.py,sha256=vT4JyHmafLNbj54SySXr93f5hNS6-t94aFslbBy-7No,33535
5
5
  upgini/errors.py,sha256=2b_Wbo0OYhLUbrZqdLIx5jBnAsiD1Mcenh-VjR4HCTw,950
6
- upgini/features_enricher.py,sha256=mDpz2NcNBItvfdE2EllEetnv7-ApODXg0FQleYrGIfg,200628
7
- upgini/http.py,sha256=danPeX7nTMa_70S-pk-4UUm5yOvXYlR84jgyjoHYBkU,43367
6
+ upgini/features_enricher.py,sha256=RDdzFJKBOg9ZT1fbOFMFOMn7O_gbG_8bvbUeNywHOl4,200627
7
+ upgini/http.py,sha256=ud0Cp7h0jNeHuuZGpU_1dAAEiabGoJjGxc1X5oeBQr4,43496
8
8
  upgini/lazy_import.py,sha256=74gQ8JuA48BGRLxAo7lNHNKY2D2emMxrUxKGdxVGhuY,1012
9
- upgini/metadata.py,sha256=-bulW4ay0qxOxR4_5oDvENtgKiZgZI-QnU2stGHrKhg,12130
9
+ upgini/metadata.py,sha256=Jh6YTaS00m_nbaOY_owvlSyn9zgkErkqu8iTr9ZjKI8,12279
10
10
  upgini/metrics.py,sha256=hr7UwLphbZ_FEglLuO2lzr_pFgxOJ4c3WBeg7H-fNqY,35521
11
11
  upgini/search_task.py,sha256=qxUxAD-bed-FpZYmTB_4orW7YJsW_O6a1TcgnZIRFr4,17307
12
12
  upgini/spinner.py,sha256=4iMd-eIe_BnkqFEMIliULTbj6rNI2HkN_VJ4qYe0cUc,1118
@@ -59,7 +59,7 @@ upgini/utils/sklearn_ext.py,sha256=13jQS_k7v0aUtudXV6nGUEWjttPQzAW9AFYL5wgEz9k,4
59
59
  upgini/utils/target_utils.py,sha256=RlpKGss9kMibVSlA8iZuO_qxmyeplqzn7X8g6hiGGGs,14341
60
60
  upgini/utils/track_info.py,sha256=G5Lu1xxakg2_TQjKZk4b5SvrHsATTXNVV3NbvWtT8k8,5663
61
61
  upgini/utils/warning_counter.py,sha256=-GRY8EUggEBKODPSuXAkHn9KnEQwAORC0mmz_tim-PM,254
62
- upgini-1.2.52a2.dist-info/METADATA,sha256=uP3OiyWH3nLIqCeEsbr1b6-2T3WR5X_uhjn7wyyDH4M,49057
63
- upgini-1.2.52a2.dist-info/WHEEL,sha256=1yFddiXMmvYK7QYTqtRNtX66WJ0Mz8PYEiEUoOUUxRY,87
64
- upgini-1.2.52a2.dist-info/licenses/LICENSE,sha256=5RRzgvdJUu3BUDfv4bzVU6FqKgwHlIay63pPCSmSgzw,1514
65
- upgini-1.2.52a2.dist-info/RECORD,,
62
+ upgini-1.2.54.dist-info/METADATA,sha256=UsKRAySU92ST26c9W_bfCOMEYHBNOQTweVVeL4mfA9I,49055
63
+ upgini-1.2.54.dist-info/WHEEL,sha256=1yFddiXMmvYK7QYTqtRNtX66WJ0Mz8PYEiEUoOUUxRY,87
64
+ upgini-1.2.54.dist-info/licenses/LICENSE,sha256=5RRzgvdJUu3BUDfv4bzVU6FqKgwHlIay63pPCSmSgzw,1514
65
+ upgini-1.2.54.dist-info/RECORD,,