upgini 1.2.51__py3-none-any.whl → 1.2.52a1__py3-none-any.whl

This diff compares the contents of two publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between those package versions as they appear in their respective public registries.

Potentially problematic release.


This version of upgini might be problematic. Click here for more details.

upgini/__about__.py CHANGED
@@ -1 +1 @@
1
- __version__ = "1.2.51"
1
+ __version__ = "1.2.52a1"
upgini/features_enricher.py CHANGED
@@ -2270,7 +2270,6 @@ if response.status_code == 200:
2270
2270
  df = converter.convert(df)
2271
2271
 
2272
2272
  ip_column = self._get_ip_column(search_keys)
2273
- ip_prefix_column = None
2274
2273
  if ip_column:
2275
2274
  converter = IpSearchKeyConverter(
2276
2275
  ip_column,
@@ -2281,7 +2280,6 @@ if response.status_code == 200:
2281
2280
  self.logger,
2282
2281
  )
2283
2282
  df = converter.convert(df)
2284
- ip_prefix_column = converter.ip_prefix_column
2285
2283
 
2286
2284
  phone_column = self._get_phone_column(search_keys)
2287
2285
  country_column = self._get_country_column(search_keys)
@@ -2301,15 +2299,12 @@ if response.status_code == 200:
2301
2299
  # generated_features = [f for f in generated_features if f in self.fit_generated_features]
2302
2300
 
2303
2301
  meaning_types = {col: key.value for col, key in search_keys.items()}
2304
- if ip_prefix_column:
2305
- meaning_types[ip_prefix_column] = FileColumnMeaningType.IP_PREFIX
2306
2302
  for col in features_for_transform:
2307
2303
  meaning_types[col] = FileColumnMeaningType.FEATURE
2308
2304
  features_not_to_pass = [
2309
2305
  c
2310
2306
  for c in df.columns
2311
2307
  if c not in search_keys.keys()
2312
- and c != ip_prefix_column
2313
2308
  and c not in features_for_transform
2314
2309
  and c not in [ENTITY_SYSTEM_RECORD_ID, SEARCH_KEY_UNNEST]
2315
2310
  ]
@@ -2771,7 +2766,6 @@ if response.status_code == 200:
2771
2766
  df = converter.convert(df)
2772
2767
 
2773
2768
  ip_column = self._get_ip_column(self.fit_search_keys)
2774
- ip_prefix_column = None
2775
2769
  if ip_column:
2776
2770
  converter = IpSearchKeyConverter(
2777
2771
  ip_column,
@@ -2782,7 +2776,6 @@ if response.status_code == 200:
2782
2776
  self.logger,
2783
2777
  )
2784
2778
  df = converter.convert(df)
2785
- ip_prefix_column = converter.ip_prefix_column
2786
2779
  phone_column = self._get_phone_column(self.fit_search_keys)
2787
2780
  country_column = self._get_country_column(self.fit_search_keys)
2788
2781
  if phone_column:
@@ -2803,7 +2796,6 @@ if response.status_code == 200:
2803
2796
  EVAL_SET_INDEX,
2804
2797
  ENTITY_SYSTEM_RECORD_ID,
2805
2798
  SEARCH_KEY_UNNEST,
2806
- ip_prefix_column,
2807
2799
  ] + list(self.fit_search_keys.keys())
2808
2800
  if DateTimeSearchKeyConverter.DATETIME_COL in df.columns:
2809
2801
  non_feature_columns.append(DateTimeSearchKeyConverter.DATETIME_COL)
@@ -2825,8 +2817,6 @@ if response.status_code == 200:
2825
2817
  **{col: key.value for col, key in self.fit_search_keys.items()},
2826
2818
  **{str(c): FileColumnMeaningType.FEATURE for c in df.columns if c not in non_feature_columns},
2827
2819
  }
2828
- if ip_prefix_column:
2829
- meaning_types[ip_prefix_column] = FileColumnMeaningType.IP_PREFIX
2830
2820
  meaning_types[self.TARGET_NAME] = FileColumnMeaningType.TARGET
2831
2821
  meaning_types[ENTITY_SYSTEM_RECORD_ID] = FileColumnMeaningType.ENTITY_SYSTEM_RECORD_ID
2832
2822
  if SEARCH_KEY_UNNEST in df.columns:
upgini/utils/ip_utils.py CHANGED
@@ -33,7 +33,6 @@ class IpSearchKeyConverter:
33
33
  else:
34
34
  self.logger = logging.getLogger()
35
35
  self.logger.setLevel("FATAL")
36
- self.ip_prefix_column = None
37
36
 
38
37
  @staticmethod
39
38
  def _ip_to_int(ip: Optional[_BaseAddress]) -> Optional[int]:
@@ -131,16 +130,18 @@ class IpSearchKeyConverter:
131
130
  # )
132
131
  ip_binary = self.ip_column + "_binary"
133
132
  df[ip_binary] = df[self.ip_column].apply(self._ip_to_binary)
134
- self.ip_prefix_column = self.ip_column + "_prefix"
135
- df[self.ip_prefix_column] = df[self.ip_column].apply(self._ip_to_prefix)
133
+ ip_prefix_column = self.ip_column + "_prefix"
134
+ df[ip_prefix_column] = df[self.ip_column].apply(self._ip_to_prefix)
136
135
 
137
136
  df = df.drop(columns=self.ip_column)
138
137
  del self.search_keys[self.ip_column]
139
138
  del self.columns_renaming[self.ip_column]
140
139
  # self.search_keys[ipv6] = SearchKey.IPV6_ADDRESS
141
140
  self.search_keys[ip_binary] = SearchKey.IP_BINARY
141
+ self.search_keys[ip_prefix_column] = SearchKey.IP_PREFIX
142
142
  # self.columns_renaming[ipv6] = original_ip
143
143
  self.columns_renaming[ip_binary] = original_ip
144
+ self.columns_renaming[ip_prefix_column] = original_ip
144
145
 
145
146
  return df
146
147
 
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.3
2
2
  Name: upgini
3
- Version: 1.2.51
3
+ Version: 1.2.52a1
4
4
  Summary: Intelligent data search & enrichment for Machine Learning
5
5
  Project-URL: Bug Reports, https://github.com/upgini/upgini/issues
6
6
  Project-URL: Homepage, https://upgini.com/
@@ -1,9 +1,9 @@
1
- upgini/__about__.py,sha256=kgsz9u_lLDc3N0akch6v9PpMXz_PW7_aEHXRb1pWgHg,23
1
+ upgini/__about__.py,sha256=wXtlppy0_s1dq-G-GaZi3gwzfakXg3YvHVznKZGFQDU,25
2
2
  upgini/__init__.py,sha256=LXSfTNU0HnlOkE69VCxkgIKDhWP-JFo_eBQ71OxTr5Y,261
3
3
  upgini/ads.py,sha256=nvuRxRx5MHDMgPr9SiU-fsqRdFaBv8p4_v1oqiysKpc,2714
4
4
  upgini/dataset.py,sha256=vT4JyHmafLNbj54SySXr93f5hNS6-t94aFslbBy-7No,33535
5
5
  upgini/errors.py,sha256=2b_Wbo0OYhLUbrZqdLIx5jBnAsiD1Mcenh-VjR4HCTw,950
6
- upgini/features_enricher.py,sha256=80h-1a-UxhuknvuEk1tQk5q5dckqlD_DHzNfufNuaPI,201110
6
+ upgini/features_enricher.py,sha256=mDpz2NcNBItvfdE2EllEetnv7-ApODXg0FQleYrGIfg,200628
7
7
  upgini/http.py,sha256=danPeX7nTMa_70S-pk-4UUm5yOvXYlR84jgyjoHYBkU,43367
8
8
  upgini/lazy_import.py,sha256=74gQ8JuA48BGRLxAo7lNHNKY2D2emMxrUxKGdxVGhuY,1012
9
9
  upgini/metadata.py,sha256=zuLdt5XyO_ZH4VsUNshzRHgv6VfYiXy0M8jeohloFBw,12082
@@ -51,7 +51,7 @@ upgini/utils/fallback_progress_bar.py,sha256=PDaKb8dYpVZaWMroNcOHsTc3pSjgi9mOm0-
51
51
  upgini/utils/feature_info.py,sha256=0rOXSyCj-sw-8migWP0ge8qrOzGU50dQvH0JUJUrDfQ,6766
52
52
  upgini/utils/features_validator.py,sha256=lEfmk4DoxZ4ooOE1HC0ZXtUb_lFKRFHIrnFULZ4_rL8,3746
53
53
  upgini/utils/format.py,sha256=Yv5cvvSs2bOLUzzNu96Pu33VMDNbabio92QepUj41jU,243
54
- upgini/utils/ip_utils.py,sha256=GZqBaV-nky-_Yb9KclmTrYovCG4kawYcbdjEpw1e5Mo,6500
54
+ upgini/utils/ip_utils.py,sha256=TSQ_qDsLlVnm09X1HacpabEf_HNqSWpxBF4Sdc2xs08,6580
55
55
  upgini/utils/phone_utils.py,sha256=IrbztLuOJBiePqqxllfABWfYlfAjYevPhXKipl95wUI,10432
56
56
  upgini/utils/postal_code_utils.py,sha256=5M0sUqH2DAr33kARWCTXR-ACyzWbjDq_-0mmEml6ZcU,1716
57
57
  upgini/utils/progress_bar.py,sha256=N-Sfdah2Hg8lXP_fV9EfUTXz_PyRt4lo9fAHoUDOoLc,1550
@@ -59,7 +59,7 @@ upgini/utils/sklearn_ext.py,sha256=13jQS_k7v0aUtudXV6nGUEWjttPQzAW9AFYL5wgEz9k,4
59
59
  upgini/utils/target_utils.py,sha256=RlpKGss9kMibVSlA8iZuO_qxmyeplqzn7X8g6hiGGGs,14341
60
60
  upgini/utils/track_info.py,sha256=G5Lu1xxakg2_TQjKZk4b5SvrHsATTXNVV3NbvWtT8k8,5663
61
61
  upgini/utils/warning_counter.py,sha256=-GRY8EUggEBKODPSuXAkHn9KnEQwAORC0mmz_tim-PM,254
62
- upgini-1.2.51.dist-info/METADATA,sha256=WXti81Fx4H5NawX2D7XvQ5cPEUVi4mlMkykbn94gXKI,49055
63
- upgini-1.2.51.dist-info/WHEEL,sha256=1yFddiXMmvYK7QYTqtRNtX66WJ0Mz8PYEiEUoOUUxRY,87
64
- upgini-1.2.51.dist-info/licenses/LICENSE,sha256=5RRzgvdJUu3BUDfv4bzVU6FqKgwHlIay63pPCSmSgzw,1514
65
- upgini-1.2.51.dist-info/RECORD,,
62
+ upgini-1.2.52a1.dist-info/METADATA,sha256=ULQbMINkgtgLFKJr0CmuC24XCQhLGb6ovLA-8pHSGjE,49057
63
+ upgini-1.2.52a1.dist-info/WHEEL,sha256=1yFddiXMmvYK7QYTqtRNtX66WJ0Mz8PYEiEUoOUUxRY,87
64
+ upgini-1.2.52a1.dist-info/licenses/LICENSE,sha256=5RRzgvdJUu3BUDfv4bzVU6FqKgwHlIay63pPCSmSgzw,1514
65
+ upgini-1.2.52a1.dist-info/RECORD,,