upgini 1.2.135a1__py3-none-any.whl → 1.2.135a3__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Potentially problematic release.
This version of upgini might be problematic. Click here for more details.
- upgini/__about__.py +1 -1
- upgini/dataset.py +1 -0
- upgini/features_enricher.py +13 -7
- upgini/utils/features_validator.py +5 -3
- {upgini-1.2.135a1.dist-info → upgini-1.2.135a3.dist-info}/METADATA +1 -1
- {upgini-1.2.135a1.dist-info → upgini-1.2.135a3.dist-info}/RECORD +8 -8
- {upgini-1.2.135a1.dist-info → upgini-1.2.135a3.dist-info}/WHEEL +0 -0
- {upgini-1.2.135a1.dist-info → upgini-1.2.135a3.dist-info}/licenses/LICENSE +0 -0
upgini/__about__.py
CHANGED
|
@@ -1 +1 @@
|
|
|
1
|
-
__version__ = "1.2.135a1"
|
|
1
|
+
__version__ = "1.2.135a3"
|
upgini/dataset.py
CHANGED
|
@@ -285,6 +285,7 @@ class Dataset:
|
|
|
285
285
|
for key in search_group
|
|
286
286
|
if key in self.columns_renaming
|
|
287
287
|
and not self.columns_renaming.get(key).endswith(EmailSearchKeyConverter.ONE_DOMAIN_SUFFIX)
|
|
288
|
+
and not self.columns_renaming.get(key) == "current_date"
|
|
288
289
|
}
|
|
289
290
|
ipv4_column = self.etalon_def_checked.get(FileColumnMeaningType.IP_ADDRESS.value)
|
|
290
291
|
if (
|
upgini/features_enricher.py
CHANGED
|
@@ -814,7 +814,7 @@ class FeaturesEnricher(TransformerMixin):
|
|
|
814
814
|
keep_input=keep_input,
|
|
815
815
|
)
|
|
816
816
|
if TARGET in result.columns:
|
|
817
|
-
result.drop(columns=TARGET
|
|
817
|
+
result = result.drop(columns=TARGET)
|
|
818
818
|
self.logger.info("Transform finished successfully")
|
|
819
819
|
search_progress = SearchProgress(100.0, ProgressStage.FINISHED)
|
|
820
820
|
if progress_bar is not None:
|
|
@@ -1047,7 +1047,8 @@ class FeaturesEnricher(TransformerMixin):
|
|
|
1047
1047
|
with Spinner():
|
|
1048
1048
|
self._check_train_and_eval_target_distribution(y_sorted, fitting_eval_set_dict)
|
|
1049
1049
|
|
|
1050
|
-
|
|
1050
|
+
date_col = self._get_date_column(search_keys)
|
|
1051
|
+
has_date = date_col is not None and date_col in validated_X.columns
|
|
1051
1052
|
model_task_type = self.model_task_type or define_task(y_sorted, has_date, self.logger, silent=True)
|
|
1052
1053
|
cat_features = list(set(client_cat_features + cat_features_from_backend))
|
|
1053
1054
|
has_time = has_date and isinstance(_cv, TimeSeriesSplit) or isinstance(_cv, BlockedTimeSeriesSplit)
|
|
@@ -1323,7 +1324,7 @@ class FeaturesEnricher(TransformerMixin):
|
|
|
1323
1324
|
search_keys = {str(k): v for k, v in search_keys.items()}
|
|
1324
1325
|
|
|
1325
1326
|
date_column = self._get_date_column(search_keys)
|
|
1326
|
-
has_date = date_column is not None
|
|
1327
|
+
has_date = date_column is not None and date_column in validated_X.columns
|
|
1327
1328
|
if not has_date:
|
|
1328
1329
|
self.logger.info("No date column for OOT PSI calculation")
|
|
1329
1330
|
return
|
|
@@ -2087,7 +2088,8 @@ class FeaturesEnricher(TransformerMixin):
|
|
|
2087
2088
|
search_keys = self.fit_search_keys.copy()
|
|
2088
2089
|
|
|
2089
2090
|
rows_to_drop = None
|
|
2090
|
-
|
|
2091
|
+
date_column = self._get_date_column(search_keys)
|
|
2092
|
+
has_date = date_column is not None and date_column in validated_X.columns
|
|
2091
2093
|
self.model_task_type = self.model_task_type or define_task(
|
|
2092
2094
|
self.df_with_original_index[TARGET], has_date, self.logger, silent=True
|
|
2093
2095
|
)
|
|
@@ -2954,7 +2956,10 @@ if response.status_code == 200:
|
|
|
2954
2956
|
is_transform: bool = False,
|
|
2955
2957
|
):
|
|
2956
2958
|
fit_input_columns = [c.originalName for c in self._search_task.get_file_metadata(trace_id).columns]
|
|
2957
|
-
|
|
2959
|
+
original_dropped_features = [self.fit_columns_renaming.get(c, c) for c in self.fit_dropped_features]
|
|
2960
|
+
new_columns_on_transform = [
|
|
2961
|
+
c for c in validated_Xy.columns if c not in fit_input_columns and c not in original_dropped_features
|
|
2962
|
+
]
|
|
2958
2963
|
|
|
2959
2964
|
selected_generated_features = [c for c in generated_features if c in self.feature_names_]
|
|
2960
2965
|
if keep_input is True:
|
|
@@ -3129,7 +3134,7 @@ if response.status_code == 200:
|
|
|
3129
3134
|
self.fit_search_keys = self.__prepare_search_keys(df, self.fit_search_keys, is_demo_dataset)
|
|
3130
3135
|
|
|
3131
3136
|
maybe_date_column = SearchKey.find_key(self.fit_search_keys, [SearchKey.DATE, SearchKey.DATETIME])
|
|
3132
|
-
has_date = maybe_date_column is not None
|
|
3137
|
+
has_date = maybe_date_column is not None and maybe_date_column in validated_X.columns
|
|
3133
3138
|
|
|
3134
3139
|
self.model_task_type = self.model_task_type or define_task(validated_y, has_date, self.logger)
|
|
3135
3140
|
|
|
@@ -3763,7 +3768,8 @@ if response.status_code == 200:
|
|
|
3763
3768
|
if eval_set is None:
|
|
3764
3769
|
return None
|
|
3765
3770
|
validated_eval_set = []
|
|
3766
|
-
|
|
3771
|
+
date_col = self._get_date_column(self.search_keys)
|
|
3772
|
+
has_date = date_col is not None and date_col in X.columns
|
|
3767
3773
|
for idx, eval_pair in enumerate(eval_set):
|
|
3768
3774
|
validated_pair = self._validate_eval_set_pair(X, eval_pair)
|
|
3769
3775
|
if validated_pair[1].isna().all():
|
|
upgini/utils/features_validator.py
CHANGED
|
@@ -44,12 +44,14 @@ class FeaturesValidator:
|
|
|
44
44
|
else:
|
|
45
45
|
empty_or_constant_features.append(f)
|
|
46
46
|
|
|
47
|
+
columns_renaming = columns_renaming or {}
|
|
48
|
+
|
|
47
49
|
if one_hot_encoded_features:
|
|
48
|
-
msg = bundle.get("one_hot_encoded_features").format(
|
|
50
|
+
msg = bundle.get("one_hot_encoded_features").format(
|
|
51
|
+
[columns_renaming.get(f, f) for f in one_hot_encoded_features]
|
|
52
|
+
)
|
|
49
53
|
warnings.append(msg)
|
|
50
54
|
|
|
51
|
-
columns_renaming = columns_renaming or {}
|
|
52
|
-
|
|
53
55
|
if empty_or_constant_features:
|
|
54
56
|
msg = bundle.get("empty_or_contant_features").format(
|
|
55
57
|
[columns_renaming.get(f, f) for f in empty_or_constant_features]
|
|
{upgini-1.2.135a1.dist-info → upgini-1.2.135a3.dist-info}/RECORD
CHANGED
|
@@ -1,9 +1,9 @@
|
|
|
1
|
-
upgini/__about__.py,sha256=
|
|
1
|
+
upgini/__about__.py,sha256=zKar2BSHx-M-ruW4V1DQDr70UfG-vBoiDPsQB4duA-c,26
|
|
2
2
|
upgini/__init__.py,sha256=LXSfTNU0HnlOkE69VCxkgIKDhWP-JFo_eBQ71OxTr5Y,261
|
|
3
3
|
upgini/ads.py,sha256=nvuRxRx5MHDMgPr9SiU-fsqRdFaBv8p4_v1oqiysKpc,2714
|
|
4
|
-
upgini/dataset.py,sha256=
|
|
4
|
+
upgini/dataset.py,sha256=qXo1eAUM21jmNMYGa6IeGuRJmjU3jtCieS4sAVVIfXs,31721
|
|
5
5
|
upgini/errors.py,sha256=2b_Wbo0OYhLUbrZqdLIx5jBnAsiD1Mcenh-VjR4HCTw,950
|
|
6
|
-
upgini/features_enricher.py,sha256=
|
|
6
|
+
upgini/features_enricher.py,sha256=dC71_-18cqymS26EhEnfYnZFGDvRtvW6Pga4ZtJN-BI,235485
|
|
7
7
|
upgini/http.py,sha256=-J_wOpnwVnT0ebPC6sOs6fN3AWtCD0LJLu6nlYmxaqk,44348
|
|
8
8
|
upgini/metadata.py,sha256=H3wiN37k-yqWZgbPD0tJzx8DzaCIkgmX5cybhByQWLg,12619
|
|
9
9
|
upgini/metrics.py,sha256=KCPE_apPN-9BIdv6GqASbJVaB_gBcy8wzNApAcyaGo4,46020
|
|
@@ -58,7 +58,7 @@ upgini/utils/display_utils.py,sha256=MoTqXZJvC6pAqgOaI3V0FG-IU_LnMfrn4TDcNvUqsdg
|
|
|
58
58
|
upgini/utils/email_utils.py,sha256=pZ2vCfNxLIPUhxr0-OlABNXm12jjU44isBk8kGmqQzA,5277
|
|
59
59
|
upgini/utils/fallback_progress_bar.py,sha256=PDaKb8dYpVZaWMroNcOHsTc3pSjgi9mOm0--cOFTwJ0,1074
|
|
60
60
|
upgini/utils/feature_info.py,sha256=SQTRbSxJDkh2G2c0KGBmOv8f69gVzWbTtcXn0_2Qb-8,7945
|
|
61
|
-
upgini/utils/features_validator.py,sha256=
|
|
61
|
+
upgini/utils/features_validator.py,sha256=RdRMisZYeJ8HVCKiKxqSyWjoLf_MsZNXxHIuWf6H2g4,4939
|
|
62
62
|
upgini/utils/format.py,sha256=Yv5cvvSs2bOLUzzNu96Pu33VMDNbabio92QepUj41jU,243
|
|
63
63
|
upgini/utils/hash_utils.py,sha256=mP2yHyzvDNdpa5g3B4MHzulxBeEz_ZSoGl1YF_VnAyE,5538
|
|
64
64
|
upgini/utils/ip_utils.py,sha256=wmnnwVQdjX9o1cNQw6VQMk6maHhvsq6hNsZBYf9knrw,6585
|
|
@@ -74,7 +74,7 @@ upgini/utils/target_utils.py,sha256=CihpV6SC95HwtlMH60rGAUzVDa4Id0Bva8ySprmNHlE,
|
|
|
74
74
|
upgini/utils/track_info.py,sha256=NDKeQTUlZaYp15UoP-xLKGoDoJQ0drbDMwB0g9R0PUg,6427
|
|
75
75
|
upgini/utils/ts_utils.py,sha256=26vhC0pN7vLXK6R09EEkMK3Lwb9IVPH7LRdqFIQ3kPs,1383
|
|
76
76
|
upgini/utils/warning_counter.py,sha256=-GRY8EUggEBKODPSuXAkHn9KnEQwAORC0mmz_tim-PM,254
|
|
77
|
-
upgini-1.2.
|
|
78
|
-
upgini-1.2.
|
|
79
|
-
upgini-1.2.
|
|
80
|
-
upgini-1.2.
|
|
77
|
+
upgini-1.2.135a3.dist-info/METADATA,sha256=p6JAaluvHU1B6Al8fHzq5KsgyNQvznWkEDwE1fhHuZI,51135
|
|
78
|
+
upgini-1.2.135a3.dist-info/WHEEL,sha256=qtCwoSJWgHk21S1Kb4ihdzI2rlJ1ZKaIurTj_ngOhyQ,87
|
|
79
|
+
upgini-1.2.135a3.dist-info/licenses/LICENSE,sha256=5RRzgvdJUu3BUDfv4bzVU6FqKgwHlIay63pPCSmSgzw,1514
|
|
80
|
+
upgini-1.2.135a3.dist-info/RECORD,,
|
|
File without changes
|
|
File without changes
|