upgini 1.2.27__py3-none-any.whl → 1.2.28__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Potentially problematic release.
This version of upgini might be problematic. Click here for more details.
- upgini/__about__.py +1 -1
- upgini/features_enricher.py +14 -7
- upgini/resource_bundle/strings.properties +2 -2
- {upgini-1.2.27.dist-info → upgini-1.2.28.dist-info}/METADATA +1 -1
- {upgini-1.2.27.dist-info → upgini-1.2.28.dist-info}/RECORD +7 -7
- {upgini-1.2.27.dist-info → upgini-1.2.28.dist-info}/WHEEL +0 -0
- {upgini-1.2.27.dist-info → upgini-1.2.28.dist-info}/licenses/LICENSE +0 -0
upgini/__about__.py
CHANGED
|
@@ -1 +1 @@
|
|
|
1
|
-
__version__ = "1.2.27"
|
|
1
|
+
__version__ = "1.2.28"
|
upgini/features_enricher.py
CHANGED
|
@@ -2026,7 +2026,10 @@ class FeaturesEnricher(TransformerMixin):
|
|
|
2026
2026
|
start_time = time.time()
|
|
2027
2027
|
with MDC(trace_id=trace_id):
|
|
2028
2028
|
self.logger.info("Start transform")
|
|
2029
|
-
|
|
2029
|
+
|
|
2030
|
+
validated_X = self._validate_X(X, is_transform=True)
|
|
2031
|
+
|
|
2032
|
+
self.__log_debug_information(validated_X, exclude_features_sources=exclude_features_sources)
|
|
2030
2033
|
|
|
2031
2034
|
self.__validate_search_keys(self.search_keys, self.search_id)
|
|
2032
2035
|
|
|
@@ -2058,8 +2061,6 @@ class FeaturesEnricher(TransformerMixin):
|
|
|
2058
2061
|
self.logger.info(msg)
|
|
2059
2062
|
print(msg)
|
|
2060
2063
|
|
|
2061
|
-
validated_X = self._validate_X(X, is_transform=True)
|
|
2062
|
-
|
|
2063
2064
|
is_demo_dataset = hash_input(validated_X) in DEMO_DATASET_HASHES
|
|
2064
2065
|
|
|
2065
2066
|
columns_to_drop = [c for c in validated_X.columns if c in self.feature_names_]
|
|
@@ -2476,9 +2477,9 @@ class FeaturesEnricher(TransformerMixin):
|
|
|
2476
2477
|
validate_scoring_argument(scoring)
|
|
2477
2478
|
|
|
2478
2479
|
self.__log_debug_information(
|
|
2479
|
-
|
|
2480
|
-
|
|
2481
|
-
|
|
2480
|
+
validated_X,
|
|
2481
|
+
validated_y,
|
|
2482
|
+
validated_eval_set,
|
|
2482
2483
|
exclude_features_sources=exclude_features_sources,
|
|
2483
2484
|
calculate_metrics=calculate_metrics,
|
|
2484
2485
|
scoring=scoring,
|
|
@@ -3762,11 +3763,17 @@ class FeaturesEnricher(TransformerMixin):
|
|
|
3762
3763
|
if len(passed_unsupported_search_keys) > 0:
|
|
3763
3764
|
raise ValidationError(self.bundle.get("unsupported_search_key").format(passed_unsupported_search_keys))
|
|
3764
3765
|
|
|
3766
|
+
x_columns = [
|
|
3767
|
+
c
|
|
3768
|
+
for c in x.columns
|
|
3769
|
+
if c not in [TARGET, EVAL_SET_INDEX, SYSTEM_RECORD_ID, ENTITY_SYSTEM_RECORD_ID, SEARCH_KEY_UNNEST]
|
|
3770
|
+
]
|
|
3771
|
+
|
|
3765
3772
|
for column_id, meaning_type in search_keys.items():
|
|
3766
3773
|
column_name = None
|
|
3767
3774
|
if isinstance(column_id, str):
|
|
3768
3775
|
if column_id not in x.columns:
|
|
3769
|
-
raise ValidationError(self.bundle.get("search_key_not_found").format(column_id,
|
|
3776
|
+
raise ValidationError(self.bundle.get("search_key_not_found").format(column_id, x_columns))
|
|
3770
3777
|
column_name = column_id
|
|
3771
3778
|
valid_search_keys[column_name] = meaning_type
|
|
3772
3779
|
elif isinstance(column_id, int):
|
|
@@ -201,7 +201,7 @@ email_detected=Emails detected in column `{}`. It will be used as a search key\n
|
|
|
201
201
|
email_detected_not_registered=Emails detected in column `{}`. It can be used only with api_key from profile.upgini.com\nSee docs to turn off the automatic detection: https://github.com/upgini/upgini/blob/main/README.md#turn-off-autodetection-for-search-key-columns
|
|
202
202
|
phone_detected=Phone numbers detected in column `{}`. It can be used only with api_key from profile.upgini.com\nSee docs to turn off the automatic detection: https://github.com/upgini/upgini/blob/main/README.md#turn-off-autodetection-for-search-key-columns
|
|
203
203
|
phone_detected_not_registered=Phone numbers detected in column `{}`. It can be used only with api_key from profile.upgini.com\nSee docs to turn off the automatic detection: https://github.com/upgini/upgini/blob/main/README.md#turn-off-autodetection-for-search-key-columns
|
|
204
|
-
target_type_detected
|
|
204
|
+
target_type_detected=\nDetected task type: {}. Reason: {}\nYou can set task type manually with argument `model_task_type` of FeaturesEnricher constructor if task type detected incorrectly\n
|
|
205
205
|
binary_target_reason=only two unique label-values observed
|
|
206
206
|
non_numeric_multiclass_reason=non-numeric label values observed
|
|
207
207
|
few_unique_label_multiclass_reason=few unique label-values observed and can be considered as categorical
|
|
@@ -212,7 +212,7 @@ limited_int_multiclass_reason=integer-like values with limited unique values obs
|
|
|
212
212
|
all_ok_community_invite=❓ Support request
|
|
213
213
|
too_small_for_metrics=Your train dataset or one of eval datasets contains less than 500 rows. For such dataset Upgini will not calculate accuracy metrics. Please increase the number of rows in the training dataset to calculate accuracy metrics
|
|
214
214
|
imbalance_multiclass=Class {0} is on 25% quantile of classes distribution ({1} records in train dataset). \nDownsample classes with records more than {1}.
|
|
215
|
-
imbalanced_target
|
|
215
|
+
imbalanced_target=\nTarget is imbalanced and will be undersampled. Frequency of the rarest class `{}` is {}
|
|
216
216
|
loss_selection_info=Using loss `{}` for feature selection
|
|
217
217
|
loss_calc_metrics_info=Using loss `{}` for metrics calculation with default estimator
|
|
218
218
|
|
|
@@ -1,9 +1,9 @@
|
|
|
1
|
-
upgini/__about__.py,sha256=
|
|
1
|
+
upgini/__about__.py,sha256=sZoYrdh97RjbwC1rg-3mt6kqvjxTxWL7ejhDDrG6mVM,23
|
|
2
2
|
upgini/__init__.py,sha256=LXSfTNU0HnlOkE69VCxkgIKDhWP-JFo_eBQ71OxTr5Y,261
|
|
3
3
|
upgini/ads.py,sha256=nvuRxRx5MHDMgPr9SiU-fsqRdFaBv8p4_v1oqiysKpc,2714
|
|
4
4
|
upgini/dataset.py,sha256=iPFiMJtk4HF1ytw9wCQr8H9RfoOKj_TIo8XYZKWgcMc,31331
|
|
5
5
|
upgini/errors.py,sha256=2b_Wbo0OYhLUbrZqdLIx5jBnAsiD1Mcenh-VjR4HCTw,950
|
|
6
|
-
upgini/features_enricher.py,sha256=
|
|
6
|
+
upgini/features_enricher.py,sha256=YYboYw--vCH9VerkTnCF3njztU3fVLrhlhU3NfBVJYQ,194302
|
|
7
7
|
upgini/http.py,sha256=21asexflvavydzCOONJDGQBtQanCElrbnqLXakJ9Cu8,42880
|
|
8
8
|
upgini/lazy_import.py,sha256=74gQ8JuA48BGRLxAo7lNHNKY2D2emMxrUxKGdxVGhuY,1012
|
|
9
9
|
upgini/metadata.py,sha256=osmzdNESeh7yP3BZday6N9Q3eaIHfzhhRM1d6NSgcf0,11223
|
|
@@ -30,7 +30,7 @@ upgini/normalizer/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU
|
|
|
30
30
|
upgini/normalizer/normalize_utils.py,sha256=Ft2MwSgVoBilXAORAOYAuwPD79GOLfwn4qQE3IUFzzg,7218
|
|
31
31
|
upgini/resource_bundle/__init__.py,sha256=S5F2G47pnJd2LDpmFsjDqEwiKkP8Hm-hcseDbMka6Ko,8345
|
|
32
32
|
upgini/resource_bundle/exceptions.py,sha256=5fRvx0_vWdE1-7HcSgF0tckB4A9AKyf5RiinZkInTsI,621
|
|
33
|
-
upgini/resource_bundle/strings.properties,sha256=
|
|
33
|
+
upgini/resource_bundle/strings.properties,sha256=wn98wl2DNFPaGTMSdZAVr43P6t97i74PCqqwa762-V0,26673
|
|
34
34
|
upgini/resource_bundle/strings_widget.properties,sha256=gOdqvZWntP2LCza_tyVk1_yRYcG4c04K9sQOAVhF_gw,1577
|
|
35
35
|
upgini/sampler/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
|
36
36
|
upgini/sampler/base.py,sha256=7GpjYqjOp58vYcJLiX__1R5wjUlyQbxvHJ2klFnup_M,6389
|
|
@@ -58,7 +58,7 @@ upgini/utils/sklearn_ext.py,sha256=13jQS_k7v0aUtudXV6nGUEWjttPQzAW9AFYL5wgEz9k,4
|
|
|
58
58
|
upgini/utils/target_utils.py,sha256=PU77nIhTz7IHbC4rpTpxrVxib6cdpRL9F1dhkjIffLY,10225
|
|
59
59
|
upgini/utils/track_info.py,sha256=G5Lu1xxakg2_TQjKZk4b5SvrHsATTXNVV3NbvWtT8k8,5663
|
|
60
60
|
upgini/utils/warning_counter.py,sha256=-GRY8EUggEBKODPSuXAkHn9KnEQwAORC0mmz_tim-PM,254
|
|
61
|
-
upgini-1.2.
|
|
62
|
-
upgini-1.2.27.dist-info/WHEEL,sha256=1yFddiXMmvYK7QYTqtRNtX66WJ0Mz8PYEiEUoOUUxRY,87
|
|
63
|
-
upgini-1.2.27.dist-info/licenses/LICENSE,sha256=5RRzgvdJUu3BUDfv4bzVU6FqKgwHlIay63pPCSmSgzw,1514
|
|
64
|
-
upgini-1.2.27.dist-info/RECORD,,
|
|
61
|
+
upgini-1.2.28.dist-info/METADATA,sha256=qGINKPrh43Q1LFXWRlS1v6CSpME6rOmScAy0ShKxL_0,48578
|
|
62
|
+
upgini-1.2.28.dist-info/WHEEL,sha256=1yFddiXMmvYK7QYTqtRNtX66WJ0Mz8PYEiEUoOUUxRY,87
|
|
63
|
+
upgini-1.2.28.dist-info/licenses/LICENSE,sha256=5RRzgvdJUu3BUDfv4bzVU6FqKgwHlIay63pPCSmSgzw,1514
|
|
64
|
+
upgini-1.2.28.dist-info/RECORD,,
|
|
File without changes
|
|
File without changes
|