upgini 1.2.145a4065.dev1__py3-none-any.whl → 1.2.146a2__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.


This version of upgini might be problematic. Click here for more details.

upgini/__about__.py CHANGED
@@ -1 +1 @@
1
- __version__ = "1.2.145a4065.dev1"
1
+ __version__ = "1.2.146a2"
upgini/dataset.py CHANGED
@@ -370,7 +370,10 @@ class Dataset:
370
370
  self.data["valid_keys"] = self.data["valid_keys"] + self.data[f"{col}_is_valid"]
371
371
  self.data.drop(columns=f"{col}_is_valid", inplace=True)
372
372
 
373
- self.data["is_valid"] = self.data["valid_keys"] > 0
373
+ if len(keys_to_validate) > 0:
374
+ self.data["is_valid"] = self.data["valid_keys"] > 0
375
+ else:
376
+ self.data["is_valid"] = True
374
377
  self.data["is_valid"] = self.data["is_valid"] & self.data["valid_mandatory"]
375
378
  self.data.drop(columns=["valid_keys", "valid_mandatory"], inplace=True)
376
379
 
@@ -3000,15 +3000,18 @@ if response.status_code == 200:
3000
3000
 
3001
3001
  return selected_input_columns + selected_generated_features
3002
3002
 
3003
- def __validate_search_keys(self, search_keys: dict[str, SearchKey], search_id: str | None = None):
3003
+ def _validate_empty_search_keys(
3004
+ self, search_keys: dict[str, SearchKey], is_transform: bool = False
3005
+ ):
3004
3006
  if (search_keys is None or len(search_keys) == 0) and self.country_code is None:
3005
- if search_id:
3006
- self.logger.debug(f"search_id {search_id} provided without search_keys")
3007
- return
3008
- # else:
3009
- # self.logger.warning("search_keys not provided")
3010
- # raise ValidationError(self.bundle.get("empty_search_keys"))
3007
+ if is_transform:
3008
+ self.logger.debug("Transform started without search_keys")
3009
+ # return
3010
+ else:
3011
+ self.logger.warning("search_keys not provided")
3012
+ # raise ValidationError(self.bundle.get("empty_search_keys"))
3011
3013
 
3014
+ def __validate_search_keys(self, search_keys: dict[str, SearchKey], search_id: str | None = None):
3012
3015
  key_types = search_keys.values()
3013
3016
 
3014
3017
  # Multiple search keys allowed only for PHONE, IP, POSTAL_CODE, EMAIL, HEM
@@ -4801,6 +4804,8 @@ if response.status_code == 200:
4801
4804
 
4802
4805
  self.logger.info(f"Prepared search keys: {valid_search_keys}")
4803
4806
 
4807
+ # x = self._validate_empty_search_keys(x, valid_search_keys, is_transform=is_transform)
4808
+
4804
4809
  return valid_search_keys
4805
4810
 
4806
4811
  def __show_metrics(
@@ -4941,10 +4946,6 @@ if response.status_code == 200:
4941
4946
  )
4942
4947
  self.__log_warning(self.bundle.get("phone_detected_not_registered"))
4943
4948
 
4944
- if (search_keys is None or len(search_keys) == 0) and self.country_code is None:
4945
- self.logger.warning("search_keys not provided")
4946
- raise ValidationError(self.bundle.get("empty_search_keys"))
4947
-
4948
4949
  return search_keys
4949
4950
 
4950
4951
  def _validate_binary_observations(self, y, task_type: ModelTaskType):
@@ -220,7 +220,7 @@ email_detected=Emails detected in column `{}`. It will be used as a search key\n
220
220
  email_detected_not_registered=Emails detected in column `{}`. It can be used only with api_key from profile.upgini.com\nSee docs to turn off the automatic detection: https://github.com/upgini/upgini/blob/main/README.md#turn-off-autodetection-for-search-key-columns\n
221
221
  phone_detected=Phone numbers detected in column `{}`. It can be used only with api_key from profile.upgini.com\nSee docs to turn off the automatic detection: https://github.com/upgini/upgini/blob/main/README.md#turn-off-autodetection-for-search-key-columns\n
222
222
  phone_detected_not_registered=Phone numbers detected in column `{}`. It can be used only with api_key from profile.upgini.com\nSee docs to turn off the automatic detection: https://github.com/upgini/upgini/blob/main/README.md#turn-off-autodetection-for-search-key-columns\n
223
- target_type_detected=\nDetected task type: {}. Reason: {}\nYou can set task type manually with argument `model_task_type` of FeaturesEnricher constructor if task type detected incorrectly\n
223
+ target_type_detected=Detected task type: {}. Reason: {}\nYou can set task type manually with argument `model_task_type` of FeaturesEnricher constructor if task type detected incorrectly\n
224
224
  binary_target_reason=only two unique label-values observed
225
225
  non_numeric_multiclass_reason=non-numeric label values observed
226
226
  few_unique_label_multiclass_reason=few unique label-values observed and can be considered as categorical
@@ -1,6 +1,6 @@
1
- Metadata-Version: 2.3
1
+ Metadata-Version: 2.4
2
2
  Name: upgini
3
- Version: 1.2.145a4065.dev1
3
+ Version: 1.2.146a2
4
4
  Summary: Intelligent data search & enrichment for Machine Learning
5
5
  Project-URL: Bug Reports, https://github.com/upgini/upgini/issues
6
6
  Project-URL: Homepage, https://upgini.com/
@@ -1,9 +1,9 @@
1
- upgini/__about__.py,sha256=sGQj0neZ3Mr1HBsK38W-XFcr90YUqacEs101Tu9lFNI,34
1
+ upgini/__about__.py,sha256=CaqiZnz1z_roBKPQB2MiuGutl1Z1t1GG-7gzLCzKPL0,26
2
2
  upgini/__init__.py,sha256=LXSfTNU0HnlOkE69VCxkgIKDhWP-JFo_eBQ71OxTr5Y,261
3
3
  upgini/ads.py,sha256=nvuRxRx5MHDMgPr9SiU-fsqRdFaBv8p4_v1oqiysKpc,2714
4
- upgini/dataset.py,sha256=bkUpUC1sdhCQcLPysB7BC8WiFDPfjiJj1SztExpv0nA,33735
4
+ upgini/dataset.py,sha256=JAxrKtzUvkqL2DGz6JbRLvGnvMnmH--Dc7YYIhJmwac,33832
5
5
  upgini/errors.py,sha256=2b_Wbo0OYhLUbrZqdLIx5jBnAsiD1Mcenh-VjR4HCTw,950
6
- upgini/features_enricher.py,sha256=1ErzgUYVS-oUmqC85o4IJTS4j_k9QryHqDIzw0YMdyU,235262
6
+ upgini/features_enricher.py,sha256=rwK0pXjnrSNjyCfg09aWgUJsnRi22uh9EaDekf-6hew,235244
7
7
  upgini/http.py,sha256=y26x4TQVYuEM3jz8JdASxSyBtvBemUkFf-FmX25sx-s,44356
8
8
  upgini/metadata.py,sha256=iYlL91g2PMHjiPIySIZb4IzIIUsPaAMIiV2It95GAjA,12866
9
9
  upgini/metrics.py,sha256=KCPE_apPN-9BIdv6GqASbJVaB_gBcy8wzNApAcyaGo4,46020
@@ -38,7 +38,7 @@ upgini/normalizer/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU
38
38
  upgini/normalizer/normalize_utils.py,sha256=mnOFU39oOsv_UhJVArl8BSocZlNP0xzgeAbSYI14Zjs,8492
39
39
  upgini/resource_bundle/__init__.py,sha256=S5F2G47pnJd2LDpmFsjDqEwiKkP8Hm-hcseDbMka6Ko,8345
40
40
  upgini/resource_bundle/exceptions.py,sha256=5fRvx0_vWdE1-7HcSgF0tckB4A9AKyf5RiinZkInTsI,621
41
- upgini/resource_bundle/strings.properties,sha256=GvOX9GZJaWxlL9X3FqtF3LyvPGVKyJniCzb5LVNiXwo,29710
41
+ upgini/resource_bundle/strings.properties,sha256=yuX7wZ8OV0_zqz8l-a--Sc6CqBtZSNQNY5cVRasRRSs,29708
42
42
  upgini/resource_bundle/strings_widget.properties,sha256=gOdqvZWntP2LCza_tyVk1_yRYcG4c04K9sQOAVhF_gw,1577
43
43
  upgini/sampler/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
44
44
  upgini/sampler/base.py,sha256=Fva2FEhLiNRPZ9Q6uOtJRtRzwsayjv7aphalAZO_4lc,6452
@@ -74,7 +74,7 @@ upgini/utils/target_utils.py,sha256=CihpV6SC95HwtlMH60rGAUzVDa4Id0Bva8ySprmNHlE,
74
74
  upgini/utils/track_info.py,sha256=NDKeQTUlZaYp15UoP-xLKGoDoJQ0drbDMwB0g9R0PUg,6427
75
75
  upgini/utils/ts_utils.py,sha256=26vhC0pN7vLXK6R09EEkMK3Lwb9IVPH7LRdqFIQ3kPs,1383
76
76
  upgini/utils/warning_counter.py,sha256=-GRY8EUggEBKODPSuXAkHn9KnEQwAORC0mmz_tim-PM,254
77
- upgini-1.2.145a4065.dev1.dist-info/METADATA,sha256=rs3PwyYF-R5YZvcfcaUwReFhownzxvNNlfpsSLiOiN8,51174
78
- upgini-1.2.145a4065.dev1.dist-info/WHEEL,sha256=zEMcRr9Kr03x1ozGwg5v9NQBKn3kndp6LSoSlVg-jhU,87
79
- upgini-1.2.145a4065.dev1.dist-info/licenses/LICENSE,sha256=5RRzgvdJUu3BUDfv4bzVU6FqKgwHlIay63pPCSmSgzw,1514
80
- upgini-1.2.145a4065.dev1.dist-info/RECORD,,
77
+ upgini-1.2.146a2.dist-info/METADATA,sha256=v5SEsK8mKw0EFiebVeHjngcjLPk5QbCU5iw6qsBVgQc,51166
78
+ upgini-1.2.146a2.dist-info/WHEEL,sha256=qtCwoSJWgHk21S1Kb4ihdzI2rlJ1ZKaIurTj_ngOhyQ,87
79
+ upgini-1.2.146a2.dist-info/licenses/LICENSE,sha256=5RRzgvdJUu3BUDfv4bzVU6FqKgwHlIay63pPCSmSgzw,1514
80
+ upgini-1.2.146a2.dist-info/RECORD,,
@@ -1,4 +1,4 @@
1
1
  Wheel-Version: 1.0
2
- Generator: hatchling 1.24.2
2
+ Generator: hatchling 1.27.0
3
3
  Root-Is-Purelib: true
4
4
  Tag: py3-none-any