upgini 1.2.81a3853.dev2__py3-none-any.whl → 1.2.82__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- upgini/__about__.py +1 -1
- upgini/autofe/feature.py +2 -2
- upgini/dataset.py +1 -1
- upgini/features_enricher.py +4 -1
- {upgini-1.2.81a3853.dev2.dist-info → upgini-1.2.82.dist-info}/METADATA +1 -1
- {upgini-1.2.81a3853.dev2.dist-info → upgini-1.2.82.dist-info}/RECORD +8 -8
- {upgini-1.2.81a3853.dev2.dist-info → upgini-1.2.82.dist-info}/WHEEL +1 -1
- {upgini-1.2.81a3853.dev2.dist-info → upgini-1.2.82.dist-info}/licenses/LICENSE +0 -0
upgini/__about__.py
CHANGED
@@ -1 +1 @@
|
|
1
|
-
__version__ = "1.2.81a3853.dev2"
|
1
|
+
__version__ = "1.2.82"
|
upgini/autofe/feature.py
CHANGED
@@ -161,7 +161,7 @@ class Feature:
|
|
161
161
|
if self.cached_display_name is not None and cache:
|
162
162
|
return self.cached_display_name
|
163
163
|
|
164
|
-
should_stack_op = not isinstance(self.children[
|
164
|
+
should_stack_op = not isinstance(self.children[0], Column) if self.op.is_unary else False
|
165
165
|
components = []
|
166
166
|
|
167
167
|
if self.alias:
|
@@ -169,7 +169,7 @@ class Feature:
|
|
169
169
|
elif should_stack_op:
|
170
170
|
components.extend(
|
171
171
|
[
|
172
|
-
self.children[
|
172
|
+
self.children[0].get_display_name(
|
173
173
|
cache=cache, shorten=shorten, use_op_alias=use_op_alias, **kwargs
|
174
174
|
),
|
175
175
|
self.get_op_display_name(use_alias=use_op_alias),
|
upgini/dataset.py
CHANGED
@@ -394,7 +394,7 @@ class Dataset: # (pd.DataFrame):
|
|
394
394
|
if col in mandatory_columns:
|
395
395
|
self.data["valid_mandatory"] = self.data["valid_mandatory"] & self.data[f"{col}_is_valid"]
|
396
396
|
|
397
|
-
invalid_values = list(self.data.loc[self.data[f"{col}_is_valid"] == 0, col].head().values)
|
397
|
+
invalid_values = list(set(self.data.loc[self.data[f"{col}_is_valid"] == 0, col].head().values))
|
398
398
|
valid_share = self.data[f"{col}_is_valid"].sum() / nrows
|
399
399
|
original_col_name = self.columns_renaming[col]
|
400
400
|
validation_stats[original_col_name] = {}
|
upgini/features_enricher.py
CHANGED
@@ -1559,9 +1559,12 @@ class FeaturesEnricher(TransformerMixin):
|
|
1559
1559
|
fitting_X = X_sorted[client_features].copy()
|
1560
1560
|
fitting_enriched_X = enriched_X_sorted[client_features + existing_filtered_enriched_features].copy()
|
1561
1561
|
|
1562
|
+
renamed_generate_features = [columns_renaming.get(c, c) for c in (self.generate_features or [])]
|
1563
|
+
renamed_client_cat_features = [columns_renaming.get(c, c) for c in (client_cat_features or [])]
|
1564
|
+
|
1562
1565
|
# Detect and drop high cardinality columns in train
|
1563
1566
|
columns_with_high_cardinality = FeaturesValidator.find_high_cardinality(fitting_X)
|
1564
|
-
non_excluding_columns =
|
1567
|
+
non_excluding_columns = renamed_generate_features + renamed_client_cat_features
|
1565
1568
|
columns_with_high_cardinality = [c for c in columns_with_high_cardinality if c not in non_excluding_columns]
|
1566
1569
|
if len(columns_with_high_cardinality) > 0:
|
1567
1570
|
self.logger.warning(
|
@@ -1,9 +1,9 @@
|
|
1
|
-
upgini/__about__.py,sha256=
|
1
|
+
upgini/__about__.py,sha256=wIfaTYNNq8gXQfG6X1cQaeNbsFlmRpelLJv8NMITZE0,23
|
2
2
|
upgini/__init__.py,sha256=LXSfTNU0HnlOkE69VCxkgIKDhWP-JFo_eBQ71OxTr5Y,261
|
3
3
|
upgini/ads.py,sha256=nvuRxRx5MHDMgPr9SiU-fsqRdFaBv8p4_v1oqiysKpc,2714
|
4
|
-
upgini/dataset.py,sha256=
|
4
|
+
upgini/dataset.py,sha256=fRtqSkXNONLnPe6cCL967GMt349FTIpXzy_u8LUKncw,35354
|
5
5
|
upgini/errors.py,sha256=2b_Wbo0OYhLUbrZqdLIx5jBnAsiD1Mcenh-VjR4HCTw,950
|
6
|
-
upgini/features_enricher.py,sha256=
|
6
|
+
upgini/features_enricher.py,sha256=jq7y3KNAMd3oVi6whIY5PU3ikfrZs7mg4U_ILfuinm4,213024
|
7
7
|
upgini/http.py,sha256=AfaJ3c8z_tK2hZFEehNybDKE0mp1tYcyAP_l0_p8bLQ,43933
|
8
8
|
upgini/metadata.py,sha256=zt_9k0iQbWXuiRZcel4ORNPdQKt6Ou69ucZD_E1Q46o,12341
|
9
9
|
upgini/metrics.py,sha256=3cip0_L6-OFew74KsRwzxJDU6UFq05h2v7IsyHLcMRc,43164
|
@@ -16,7 +16,7 @@ upgini/autofe/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
|
16
16
|
upgini/autofe/all_operators.py,sha256=rdjF5eaE4bC6Q4eu_el5Z7ekYt8DjOFermz2bePPbUc,333
|
17
17
|
upgini/autofe/binary.py,sha256=oOEECc4nRzZN2tYaiqx8F2XHnfWpk1bVvb7ZkZJ0lO8,7709
|
18
18
|
upgini/autofe/date.py,sha256=MM1S-6imNSzCDOhbNnmsc_bwSqUWBcS8vWAdHF8j1kY,11134
|
19
|
-
upgini/autofe/feature.py,sha256=
|
19
|
+
upgini/autofe/feature.py,sha256=G_YgnsauIoaMgByx9JXDPiKc4nqs0pwWZUfvoIGMKxY,15305
|
20
20
|
upgini/autofe/groupby.py,sha256=IYmQV9uoCdRcpkeWZj_kI3ObzoNCNx3ff3h8sTL01tk,3603
|
21
21
|
upgini/autofe/operator.py,sha256=EOffJw6vKXpEh5yymqb1RFNJPxGxmnHdFRo9dB5SCFo,4969
|
22
22
|
upgini/autofe/unary.py,sha256=Sx11IoHRh5nwyALzjgG9GQOrVNIs8NZ1JzunAJuN66A,5731
|
@@ -70,7 +70,7 @@ upgini/utils/target_utils.py,sha256=LRN840dzx78-wg7ftdxAkp2c1eu8-JDvkACiRThm4HE,
|
|
70
70
|
upgini/utils/track_info.py,sha256=G5Lu1xxakg2_TQjKZk4b5SvrHsATTXNVV3NbvWtT8k8,5663
|
71
71
|
upgini/utils/ts_utils.py,sha256=26vhC0pN7vLXK6R09EEkMK3Lwb9IVPH7LRdqFIQ3kPs,1383
|
72
72
|
upgini/utils/warning_counter.py,sha256=-GRY8EUggEBKODPSuXAkHn9KnEQwAORC0mmz_tim-PM,254
|
73
|
-
upgini-1.2.
|
74
|
-
upgini-1.2.
|
75
|
-
upgini-1.2.
|
76
|
-
upgini-1.2.
|
73
|
+
upgini-1.2.82.dist-info/METADATA,sha256=cambuYE-iqUo5mvnJN1CI1Qn8QgqdM5e54-h2giPj50,49162
|
74
|
+
upgini-1.2.82.dist-info/WHEEL,sha256=1yFddiXMmvYK7QYTqtRNtX66WJ0Mz8PYEiEUoOUUxRY,87
|
75
|
+
upgini-1.2.82.dist-info/licenses/LICENSE,sha256=5RRzgvdJUu3BUDfv4bzVU6FqKgwHlIay63pPCSmSgzw,1514
|
76
|
+
upgini-1.2.82.dist-info/RECORD,,
|
File without changes
|