upgini 1.1.197__py3-none-any.whl → 1.1.199__py3-none-any.whl

This diff shows the changes between two publicly available versions of a package that have been released to one of the supported registries. It is provided for informational purposes only and reflects the package contents as they appear in their respective public registries.

Potentially problematic release.


This version of upgini might be problematic. Click here for more details.

@@ -13,7 +13,7 @@ from typing import Any, Callable, Dict, List, Optional, Set, Tuple, Union
13
13
 
14
14
  import numpy as np
15
15
  import pandas as pd
16
- from pandas.api.types import is_string_dtype
16
+ from pandas.api.types import is_numeric_dtype, is_string_dtype
17
17
  from scipy.stats import ks_2samp
18
18
  from sklearn.base import TransformerMixin
19
19
  from sklearn.exceptions import NotFittedError
@@ -946,7 +946,9 @@ class FeaturesEnricher(TransformerMixin):
946
946
  bundle.get("quality_metrics_rows_header"): _num_samples(fitting_X),
947
947
  # bundle.get("quality_metrics_match_rate_header"): self._search_task.initial_max_hit_rate_v2(),
948
948
  }
949
- if model_task_type in [ModelTaskType.BINARY, ModelTaskType.REGRESSION]:
949
+ if model_task_type in [ModelTaskType.BINARY, ModelTaskType.REGRESSION] and is_numeric_dtype(
950
+ y_sorted
951
+ ):
950
952
  train_metrics[bundle.get("quality_metrics_mean_target_header")] = round(y_sorted.mean(), 4)
951
953
  if etalon_metric is not None:
952
954
  train_metrics[bundle.get("quality_metrics_baseline_header").format(metric)] = etalon_metric
@@ -1008,7 +1010,9 @@ class FeaturesEnricher(TransformerMixin):
1008
1010
  bundle.get("quality_metrics_rows_header"): _num_samples(eval_X_sorted),
1009
1011
  # bundle.get("quality_metrics_match_rate_header"): eval_hit_rate,
1010
1012
  }
1011
- if model_task_type in [ModelTaskType.BINARY, ModelTaskType.REGRESSION]:
1013
+ if model_task_type in [ModelTaskType.BINARY, ModelTaskType.REGRESSION] and is_numeric_dtype(
1014
+ eval_y_sorted
1015
+ ):
1012
1016
  eval_metrics[bundle.get("quality_metrics_mean_target_header")] = round(
1013
1017
  eval_y_sorted.mean(), 4
1014
1018
  )
@@ -1204,7 +1208,7 @@ class FeaturesEnricher(TransformerMixin):
1204
1208
  self.logger.info("No external features selected. So use only input datasets for metrics calculation")
1205
1209
  X_sampled, search_keys = self._extend_x(validated_X, is_demo_dataset)
1206
1210
  y_sampled = validated_y
1207
- enriched_X = validated_X
1211
+ enriched_X = X_sampled
1208
1212
  if eval_set is not None:
1209
1213
  for idx in range(len(eval_set)):
1210
1214
  eval_X_sampled, _ = self._extend_x(eval_set[idx][0], is_demo_dataset)
@@ -2315,7 +2319,7 @@ class FeaturesEnricher(TransformerMixin):
2315
2319
  do_without_pandas_limits(print_datasets_sample)
2316
2320
 
2317
2321
  maybe_date_col = self._get_date_column(self.search_keys)
2318
- if X is not None and maybe_date_col is not None:
2322
+ if X is not None and maybe_date_col is not None and maybe_date_col in X.columns:
2319
2323
  min_date = X[maybe_date_col].min()
2320
2324
  max_date = X[maybe_date_col].max()
2321
2325
  self.logger.info(f"Dates interval is ({min_date}, {max_date})")
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.1
2
2
  Name: upgini
3
- Version: 1.1.197
3
+ Version: 1.1.199
4
4
  Summary: Intelligent data search & enrichment for Machine Learning
5
5
  Home-page: https://upgini.com/
6
6
  Author: Upgini Developers
@@ -109,7 +109,12 @@ Requires-Dist: ipywidgets (>=8.1.0)
109
109
  <td><a href="https://en.wikipedia.org/wiki/Regression_analysis">☑️ regression</a></td>
110
110
  <td><a href="https://en.wikipedia.org/wiki/Time_series#Prediction_and_forecasting">☑️ time series prediction</a></td>
111
111
  </tr>
112
- </table>
112
+ </table>
113
+
114
+ ⭐️ [Simple Drag & Drop Search UI](https://appwidget-uragwvgykrk4sbmropphpy.streamlit.app/~/+/):
115
+ <a href="https://appwidget-uragwvgykrk4sbmropphpy.streamlit.app/~/+/">
116
+ <img width="710" alt="Drag & Drop Search UI" src="https://github.com/upgini/upgini/assets/95645411/36b6460c-51f3-400e-9f04-445b938bf45e">
117
+ </a>
113
118
 
114
119
 
115
120
  ## 🌎 Connected data sources and coverage
@@ -2,7 +2,7 @@ upgini/__init__.py,sha256=asENHgEVHQBIkV-e_0IhE_ZWqkCG6398U3ZLrNzAH6k,407
2
2
  upgini/ads.py,sha256=mre6xn44wcC_fg63iLT_kTh4mViZqR9AKRJZAtpQz8Y,2592
3
3
  upgini/dataset.py,sha256=hqinFMd0x3hMgFqsRohb2GZvGmoEbdSEgvBjD5n5zaM,47346
4
4
  upgini/errors.py,sha256=BqpvfhW2jJW5fa5KXj0alhXatGl-WK4xTl309-QNLp8,959
5
- upgini/features_enricher.py,sha256=JqR2i8iTfd4IGC1vTt15TGeuUWi6MUlXWuXX9fyMIH0,146312
5
+ upgini/features_enricher.py,sha256=b7yCgyyebhftP1D2Hf-XHSYmteJFniZpjqCTdvtUxuE,146535
6
6
  upgini/fingerprint.js,sha256=VygVIQlN1v4NGZfjHqtRogOw8zjTnnMNJg_f7M5iGQU,33442
7
7
  upgini/http.py,sha256=5t8t9KplLzZQhaoUbxVS-C0-Q78og-aAIUoAn_8dgdw,39538
8
8
  upgini/metadata.py,sha256=9Hm9L7efMGIRSfPUYZ_RUBW7_WMeeTL1fGhylMSvR7w,6135
@@ -45,8 +45,8 @@ upgini/utils/sklearn_ext.py,sha256=IMx2La70AXAggApVpT7sMEjWqVWon5AMZt4MARDsIMQ,4
45
45
  upgini/utils/target_utils.py,sha256=cu52icjhDIPpEStHYMXrD2hIl9gzvfnxZr0Ra5osV0k,1616
46
46
  upgini/utils/track_info.py,sha256=2IGGyHPXBLhWcLO8-Q-5qir52k_kD6DtdU-sv_Z2hHY,5325
47
47
  upgini/utils/warning_counter.py,sha256=vnmdFo5-7GBkU2bK9h_uC0K0Y_wtfcYstxOdeRfacO0,228
48
- upgini-1.1.197.dist-info/LICENSE,sha256=5RRzgvdJUu3BUDfv4bzVU6FqKgwHlIay63pPCSmSgzw,1514
49
- upgini-1.1.197.dist-info/METADATA,sha256=pqdXxn40GXMVJovcA94byupKZwkukr7Q9RpIQX0HEdk,47985
50
- upgini-1.1.197.dist-info/WHEEL,sha256=G16H4A3IeoQmnOrYV4ueZGKSjhipXx8zc8nu9FGlvMA,92
51
- upgini-1.1.197.dist-info/top_level.txt,sha256=OFhTGiDIWKl5gFI49qvWq1R9IKflPaE2PekcbDXDtx4,7
52
- upgini-1.1.197.dist-info/RECORD,,
48
+ upgini-1.1.199.dist-info/LICENSE,sha256=5RRzgvdJUu3BUDfv4bzVU6FqKgwHlIay63pPCSmSgzw,1514
49
+ upgini-1.1.199.dist-info/METADATA,sha256=BADcsoeqF6vs1TLz1FX1Q3f6ofqwq-tJqIUzrixJsVQ,48306
50
+ upgini-1.1.199.dist-info/WHEEL,sha256=G16H4A3IeoQmnOrYV4ueZGKSjhipXx8zc8nu9FGlvMA,92
51
+ upgini-1.1.199.dist-info/top_level.txt,sha256=OFhTGiDIWKl5gFI49qvWq1R9IKflPaE2PekcbDXDtx4,7
52
+ upgini-1.1.199.dist-info/RECORD,,