upgini 1.2.71a3832.dev10__py3-none-any.whl → 1.2.71a3832.dev12__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- upgini/__about__.py +1 -1
- upgini/features_enricher.py +11 -9
- {upgini-1.2.71a3832.dev10.dist-info → upgini-1.2.71a3832.dev12.dist-info}/METADATA +1 -1
- {upgini-1.2.71a3832.dev10.dist-info → upgini-1.2.71a3832.dev12.dist-info}/RECORD +6 -6
- {upgini-1.2.71a3832.dev10.dist-info → upgini-1.2.71a3832.dev12.dist-info}/WHEEL +0 -0
- {upgini-1.2.71a3832.dev10.dist-info → upgini-1.2.71a3832.dev12.dist-info}/licenses/LICENSE +0 -0
upgini/__about__.py
CHANGED
@@ -1 +1 @@
|
|
1
|
-
__version__ = "1.2.71a3832.dev10"
|
1
|
+
__version__ = "1.2.71a3832.dev12"
|
upgini/features_enricher.py
CHANGED
@@ -12,6 +12,7 @@ import tempfile
|
|
12
12
|
import time
|
13
13
|
import uuid
|
14
14
|
from collections import Counter
|
15
|
+
from copy import deepcopy
|
15
16
|
from dataclasses import dataclass
|
16
17
|
from threading import Thread
|
17
18
|
from typing import Any, Callable, Dict, List, Optional, Set, Tuple, Union
|
@@ -1512,10 +1513,7 @@ class FeaturesEnricher(TransformerMixin):
|
|
1512
1513
|
self.logger.info(f"Client features column on prepare data for metrics: {client_features}")
|
1513
1514
|
|
1514
1515
|
filtered_enriched_features = self.__filtered_enriched_features(
|
1515
|
-
importance_threshold,
|
1516
|
-
max_features,
|
1517
|
-
trace_id,
|
1518
|
-
validated_X
|
1516
|
+
importance_threshold, max_features, trace_id, validated_X
|
1519
1517
|
)
|
1520
1518
|
filtered_enriched_features = [c for c in filtered_enriched_features if c not in client_features]
|
1521
1519
|
|
@@ -2543,7 +2541,9 @@ if response.status_code == 200:
|
|
2543
2541
|
for c in itertools.chain(validated_Xy.columns.tolist(), generated_features)
|
2544
2542
|
if c not in self.dropped_client_feature_names_
|
2545
2543
|
]
|
2546
|
-
filtered_columns = self.__filtered_enriched_features(
|
2544
|
+
filtered_columns = self.__filtered_enriched_features(
|
2545
|
+
importance_threshold, max_features, trace_id, validated_X
|
2546
|
+
)
|
2547
2547
|
selecting_columns.extend(
|
2548
2548
|
c for c in filtered_columns if c in result.columns and c not in validated_X.columns
|
2549
2549
|
)
|
@@ -3813,6 +3813,7 @@ if response.status_code == 200:
|
|
3813
3813
|
features_meta = self._search_task.get_all_features_metadata_v2()
|
3814
3814
|
if features_meta is None:
|
3815
3815
|
raise Exception(self.bundle.get("missing_features_meta"))
|
3816
|
+
features_meta = deepcopy(features_meta)
|
3816
3817
|
|
3817
3818
|
original_names_dict = {c.name: c.originalName for c in self._search_task.get_file_metadata(trace_id).columns}
|
3818
3819
|
df = df.rename(columns=original_names_dict)
|
@@ -3839,7 +3840,7 @@ if response.status_code == 200:
|
|
3839
3840
|
continue
|
3840
3841
|
|
3841
3842
|
# Temporary workaround for duplicate features metadata
|
3842
|
-
if feature_meta.name in
|
3843
|
+
if feature_meta.name in importances:
|
3843
3844
|
self.logger.warning(f"WARNING: Duplicate feature metadata: {feature_meta}")
|
3844
3845
|
continue
|
3845
3846
|
|
@@ -3855,6 +3856,7 @@ if response.status_code == 200:
|
|
3855
3856
|
features_meta = self._search_task.get_all_features_metadata_v2()
|
3856
3857
|
if features_meta is None:
|
3857
3858
|
raise Exception(self.bundle.get("missing_features_meta"))
|
3859
|
+
features_meta = deepcopy(features_meta)
|
3858
3860
|
|
3859
3861
|
original_names_dict = {c.name: c.originalName for c in self._search_task.get_file_metadata(trace_id).columns}
|
3860
3862
|
features_df = self._search_task.get_all_initial_raw_features(trace_id, metrics_calculation=True)
|
@@ -4040,11 +4042,11 @@ if response.status_code == 200:
|
|
4040
4042
|
if len(filtered_importances) == 0:
|
4041
4043
|
return []
|
4042
4044
|
|
4043
|
-
filtered_importances = list(zip(self.feature_names_, self.feature_importances_))
|
4044
|
-
|
4045
4045
|
if importance_threshold is not None:
|
4046
4046
|
filtered_importances = [
|
4047
|
-
(name, importance)
|
4047
|
+
(name, importance)
|
4048
|
+
for name, importance in filtered_importances.items()
|
4049
|
+
if importance > importance_threshold
|
4048
4050
|
]
|
4049
4051
|
if max_features is not None:
|
4050
4052
|
filtered_importances = list(filtered_importances)[:max_features]
|
@@ -1,6 +1,6 @@
|
|
1
1
|
Metadata-Version: 2.3
|
2
2
|
Name: upgini
|
3
|
-
Version: 1.2.71a3832.dev10
|
3
|
+
Version: 1.2.71a3832.dev12
|
4
4
|
Summary: Intelligent data search & enrichment for Machine Learning
|
5
5
|
Project-URL: Bug Reports, https://github.com/upgini/upgini/issues
|
6
6
|
Project-URL: Homepage, https://upgini.com/
|
@@ -1,9 +1,9 @@
|
|
1
|
-
upgini/__about__.py,sha256=
|
1
|
+
upgini/__about__.py,sha256=okx02f-XOrtKlpdtJnV-aHreGFvFkxZ5NQhd5zxvhMk,34
|
2
2
|
upgini/__init__.py,sha256=LXSfTNU0HnlOkE69VCxkgIKDhWP-JFo_eBQ71OxTr5Y,261
|
3
3
|
upgini/ads.py,sha256=nvuRxRx5MHDMgPr9SiU-fsqRdFaBv8p4_v1oqiysKpc,2714
|
4
4
|
upgini/dataset.py,sha256=aspri7ZAgwkNNUiIgQ1GRXvw8XQii3F4RfNXSrF4wrw,35365
|
5
5
|
upgini/errors.py,sha256=2b_Wbo0OYhLUbrZqdLIx5jBnAsiD1Mcenh-VjR4HCTw,950
|
6
|
-
upgini/features_enricher.py,sha256=
|
6
|
+
upgini/features_enricher.py,sha256=DgWboHEhr5BQT87MaAo2iUtrhapP3iqczLeZtWLRkDs,206664
|
7
7
|
upgini/http.py,sha256=RvzcShpDXssLs6ycGN8xilkKi8ZV9XGUrrk8bwdUzbw,43607
|
8
8
|
upgini/metadata.py,sha256=Yd6iW2f7Wz6vUkg5uvR4xylN16ANnCKVKqAsAkap7p8,12354
|
9
9
|
upgini/metrics.py,sha256=9AaQi7Yb22ZNnycUOAUpcP7TWF5Pfy_NGACcDj10aMs,38820
|
@@ -70,7 +70,7 @@ upgini/utils/target_utils.py,sha256=b1GzO8_gMcwXSZ2v98CY50MJJBzKbWHId_BJGybXfkM,
|
|
70
70
|
upgini/utils/track_info.py,sha256=G5Lu1xxakg2_TQjKZk4b5SvrHsATTXNVV3NbvWtT8k8,5663
|
71
71
|
upgini/utils/ts_utils.py,sha256=26vhC0pN7vLXK6R09EEkMK3Lwb9IVPH7LRdqFIQ3kPs,1383
|
72
72
|
upgini/utils/warning_counter.py,sha256=-GRY8EUggEBKODPSuXAkHn9KnEQwAORC0mmz_tim-PM,254
|
73
|
-
upgini-1.2.71a3832.
|
74
|
-
upgini-1.2.71a3832.
|
75
|
-
upgini-1.2.71a3832.
|
76
|
-
upgini-1.2.71a3832.
|
73
|
+
upgini-1.2.71a3832.dev12.dist-info/METADATA,sha256=8jmuNEDPwjc-Wa6Bds0FjYqYgqf3LFMYyRGUDy5DME8,49102
|
74
|
+
upgini-1.2.71a3832.dev12.dist-info/WHEEL,sha256=1yFddiXMmvYK7QYTqtRNtX66WJ0Mz8PYEiEUoOUUxRY,87
|
75
|
+
upgini-1.2.71a3832.dev12.dist-info/licenses/LICENSE,sha256=5RRzgvdJUu3BUDfv4bzVU6FqKgwHlIay63pPCSmSgzw,1514
|
76
|
+
upgini-1.2.71a3832.dev12.dist-info/RECORD,,
|
File without changes
|
File without changes
|