upgini 1.2.71a3832.dev10__py3-none-any.whl → 1.2.71a3832.dev12__py3-none-any.whl

This diff compares the contents of publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.
upgini/__about__.py CHANGED
@@ -1 +1 @@
1
- __version__ = "1.2.71a3832.dev10"
1
+ __version__ = "1.2.71a3832.dev12"
@@ -12,6 +12,7 @@ import tempfile
12
12
  import time
13
13
  import uuid
14
14
  from collections import Counter
15
+ from copy import deepcopy
15
16
  from dataclasses import dataclass
16
17
  from threading import Thread
17
18
  from typing import Any, Callable, Dict, List, Optional, Set, Tuple, Union
@@ -1512,10 +1513,7 @@ class FeaturesEnricher(TransformerMixin):
1512
1513
  self.logger.info(f"Client features column on prepare data for metrics: {client_features}")
1513
1514
 
1514
1515
  filtered_enriched_features = self.__filtered_enriched_features(
1515
- importance_threshold,
1516
- max_features,
1517
- trace_id,
1518
- validated_X
1516
+ importance_threshold, max_features, trace_id, validated_X
1519
1517
  )
1520
1518
  filtered_enriched_features = [c for c in filtered_enriched_features if c not in client_features]
1521
1519
 
@@ -2543,7 +2541,9 @@ if response.status_code == 200:
2543
2541
  for c in itertools.chain(validated_Xy.columns.tolist(), generated_features)
2544
2542
  if c not in self.dropped_client_feature_names_
2545
2543
  ]
2546
- filtered_columns = self.__filtered_enriched_features(importance_threshold, max_features)
2544
+ filtered_columns = self.__filtered_enriched_features(
2545
+ importance_threshold, max_features, trace_id, validated_X
2546
+ )
2547
2547
  selecting_columns.extend(
2548
2548
  c for c in filtered_columns if c in result.columns and c not in validated_X.columns
2549
2549
  )
@@ -3813,6 +3813,7 @@ if response.status_code == 200:
3813
3813
  features_meta = self._search_task.get_all_features_metadata_v2()
3814
3814
  if features_meta is None:
3815
3815
  raise Exception(self.bundle.get("missing_features_meta"))
3816
+ features_meta = deepcopy(features_meta)
3816
3817
 
3817
3818
  original_names_dict = {c.name: c.originalName for c in self._search_task.get_file_metadata(trace_id).columns}
3818
3819
  df = df.rename(columns=original_names_dict)
@@ -3839,7 +3840,7 @@ if response.status_code == 200:
3839
3840
  continue
3840
3841
 
3841
3842
  # Temporary workaround for duplicate features metadata
3842
- if feature_meta.name in self.feature_names_:
3843
+ if feature_meta.name in importances:
3843
3844
  self.logger.warning(f"WARNING: Duplicate feature metadata: {feature_meta}")
3844
3845
  continue
3845
3846
 
@@ -3855,6 +3856,7 @@ if response.status_code == 200:
3855
3856
  features_meta = self._search_task.get_all_features_metadata_v2()
3856
3857
  if features_meta is None:
3857
3858
  raise Exception(self.bundle.get("missing_features_meta"))
3859
+ features_meta = deepcopy(features_meta)
3858
3860
 
3859
3861
  original_names_dict = {c.name: c.originalName for c in self._search_task.get_file_metadata(trace_id).columns}
3860
3862
  features_df = self._search_task.get_all_initial_raw_features(trace_id, metrics_calculation=True)
@@ -4040,11 +4042,11 @@ if response.status_code == 200:
4040
4042
  if len(filtered_importances) == 0:
4041
4043
  return []
4042
4044
 
4043
- filtered_importances = list(zip(self.feature_names_, self.feature_importances_))
4044
-
4045
4045
  if importance_threshold is not None:
4046
4046
  filtered_importances = [
4047
- (name, importance) for name, importance in filtered_importances if importance > importance_threshold
4047
+ (name, importance)
4048
+ for name, importance in filtered_importances.items()
4049
+ if importance > importance_threshold
4048
4050
  ]
4049
4051
  if max_features is not None:
4050
4052
  filtered_importances = list(filtered_importances)[:max_features]
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.3
2
2
  Name: upgini
3
- Version: 1.2.71a3832.dev10
3
+ Version: 1.2.71a3832.dev12
4
4
  Summary: Intelligent data search & enrichment for Machine Learning
5
5
  Project-URL: Bug Reports, https://github.com/upgini/upgini/issues
6
6
  Project-URL: Homepage, https://upgini.com/
@@ -1,9 +1,9 @@
1
- upgini/__about__.py,sha256=qj1UGtuyHfmmi9dqRId3RcPPnrUHFNsbiq_hv1BBucY,34
1
+ upgini/__about__.py,sha256=okx02f-XOrtKlpdtJnV-aHreGFvFkxZ5NQhd5zxvhMk,34
2
2
  upgini/__init__.py,sha256=LXSfTNU0HnlOkE69VCxkgIKDhWP-JFo_eBQ71OxTr5Y,261
3
3
  upgini/ads.py,sha256=nvuRxRx5MHDMgPr9SiU-fsqRdFaBv8p4_v1oqiysKpc,2714
4
4
  upgini/dataset.py,sha256=aspri7ZAgwkNNUiIgQ1GRXvw8XQii3F4RfNXSrF4wrw,35365
5
5
  upgini/errors.py,sha256=2b_Wbo0OYhLUbrZqdLIx5jBnAsiD1Mcenh-VjR4HCTw,950
6
- upgini/features_enricher.py,sha256=SMtpkDZqCaTR1u_-TlN_FaqhmbrTwgzjfOi---sFMTs,206583
6
+ upgini/features_enricher.py,sha256=DgWboHEhr5BQT87MaAo2iUtrhapP3iqczLeZtWLRkDs,206664
7
7
  upgini/http.py,sha256=RvzcShpDXssLs6ycGN8xilkKi8ZV9XGUrrk8bwdUzbw,43607
8
8
  upgini/metadata.py,sha256=Yd6iW2f7Wz6vUkg5uvR4xylN16ANnCKVKqAsAkap7p8,12354
9
9
  upgini/metrics.py,sha256=9AaQi7Yb22ZNnycUOAUpcP7TWF5Pfy_NGACcDj10aMs,38820
@@ -70,7 +70,7 @@ upgini/utils/target_utils.py,sha256=b1GzO8_gMcwXSZ2v98CY50MJJBzKbWHId_BJGybXfkM,
70
70
  upgini/utils/track_info.py,sha256=G5Lu1xxakg2_TQjKZk4b5SvrHsATTXNVV3NbvWtT8k8,5663
71
71
  upgini/utils/ts_utils.py,sha256=26vhC0pN7vLXK6R09EEkMK3Lwb9IVPH7LRdqFIQ3kPs,1383
72
72
  upgini/utils/warning_counter.py,sha256=-GRY8EUggEBKODPSuXAkHn9KnEQwAORC0mmz_tim-PM,254
73
- upgini-1.2.71a3832.dev10.dist-info/METADATA,sha256=heO2jdHm4uOBshQhD8CjQuLYR_FNYq7gtzYstHWrDVk,49102
74
- upgini-1.2.71a3832.dev10.dist-info/WHEEL,sha256=1yFddiXMmvYK7QYTqtRNtX66WJ0Mz8PYEiEUoOUUxRY,87
75
- upgini-1.2.71a3832.dev10.dist-info/licenses/LICENSE,sha256=5RRzgvdJUu3BUDfv4bzVU6FqKgwHlIay63pPCSmSgzw,1514
76
- upgini-1.2.71a3832.dev10.dist-info/RECORD,,
73
+ upgini-1.2.71a3832.dev12.dist-info/METADATA,sha256=8jmuNEDPwjc-Wa6Bds0FjYqYgqf3LFMYyRGUDy5DME8,49102
74
+ upgini-1.2.71a3832.dev12.dist-info/WHEEL,sha256=1yFddiXMmvYK7QYTqtRNtX66WJ0Mz8PYEiEUoOUUxRY,87
75
+ upgini-1.2.71a3832.dev12.dist-info/licenses/LICENSE,sha256=5RRzgvdJUu3BUDfv4bzVU6FqKgwHlIay63pPCSmSgzw,1514
76
+ upgini-1.2.71a3832.dev12.dist-info/RECORD,,