PyPI - upgini - Versions diffs - 1.2.70a3832.dev3__py3-none-any.whl → 1.2.71a3810.dev2__py3-none-any.whl - Mend

upgini 1.2.70a3832.dev3__py3-none-any.whl → 1.2.71a3810.dev2__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of upgini might be problematic. Click here for more details.

Files changed (24) hide show

upgini/__about__.py +1 -1
upgini/autofe/date.py +15 -21
upgini/autofe/feature.py +5 -1
upgini/autofe/timeseries/base.py +1 -7
upgini/autofe/timeseries/cross.py +21 -11
upgini/autofe/timeseries/roll.py +2 -7
upgini/autofe/timeseries/trend.py +2 -1
upgini/autofe/unary.py +38 -1
upgini/autofe/utils.py +83 -0
upgini/dataset.py +9 -2
upgini/features_enricher.py +265 -259
upgini/http.py +4 -9
upgini/metadata.py +4 -0
upgini/metrics.py +48 -145
upgini/resource_bundle/strings.properties +1 -1
upgini/search_task.py +7 -1
upgini/utils/deduplicate_utils.py +0 -2
upgini/utils/feature_info.py +1 -2
upgini/utils/mstats.py +1 -1
upgini/utils/sklearn_ext.py +2 -9
{upgini-1.2.70a3832.dev3.dist-info → upgini-1.2.71a3810.dev2.dist-info}/METADATA +6 -8
{upgini-1.2.70a3832.dev3.dist-info → upgini-1.2.71a3810.dev2.dist-info}/RECORD +24 -23
{upgini-1.2.70a3832.dev3.dist-info → upgini-1.2.71a3810.dev2.dist-info}/WHEEL +1 -1
{upgini-1.2.70a3832.dev3.dist-info → upgini-1.2.71a3810.dev2.dist-info}/licenses/LICENSE +0 -0

upgini/http.py CHANGED Viewed

@@ -16,7 +16,6 @@ from typing import Any, Dict, List, Optional, Tuple
 from urllib.parse import urljoin
 import jwt
 # import pandas as pd
 import requests
 from pydantic import BaseModel
@@ -343,9 +342,7 @@ class _RestClient:
         else:
             return self._syncronized_refresh_access_token()
-    def _with_unauth_retry(
-        self, request, try_number: int = 0, need_connection_retry: bool = True, silent: bool = False
-    ):
+    def _with_unauth_retry(self, request, try_number: int = 0, need_connection_retry: bool = True):
         try:
             return request()
         except RequestException as e:
@@ -376,9 +373,8 @@ class _RestClient:
             elif "more than one concurrent search request" in e.message.lower():
                 raise ValidationError(bundle.get("concurrent_request"))
             else:
-                if not silent:
-                    print(e)
-                    show_status_error()
+                print(e)
+                show_status_error()
                 raise e
     @staticmethod
@@ -710,7 +706,6 @@ class _RestClient:
                     silent=True,
                 ),
                 need_connection_retry=False,
-                silent=True,
             )
         except Exception:
             self.send_log_event_unauth(log_event)
@@ -721,7 +716,7 @@ class _RestClient:
         try:
             requests.post(
                 url=urljoin(_RestClient.PROD_BACKEND_URL, api_path),
-                json=log_event.model_dump(exclude_none=True),
+                json=log_event.dict(exclude_none=True),
                 headers=_RestClient._get_base_headers(content_type="application/json"),
             )
         except Exception:

upgini/metadata.py CHANGED Viewed

@@ -325,6 +325,10 @@ class RuntimeParameters(BaseModel):
     properties: Dict[str, Any] = {}
+class AutoFEParameters(BaseModel):
+    ts_gap_days: Optional[int] = None
 class SearchCustomization(BaseModel):
     featuresFilter: Optional[FeaturesFilter] = None
     extractFeatures: Optional[bool] = None

upgini/metrics.py CHANGED Viewed

@@ -1,17 +1,17 @@
 from __future__ import annotations
+from dataclasses import dataclass
 import inspect
 import logging
 import re
-import warnings
 from collections import defaultdict
 from copy import deepcopy
-from dataclasses import dataclass
 from typing import Any, Callable, Dict, List, Optional, Tuple, Union
+import catboost
 import numpy as np
 import pandas as pd
-from lightgbm import LGBMClassifier, LGBMRegressor
+from catboost import CatBoost, CatBoostClassifier, CatBoostRegressor, Pool
 from numpy import log1p
 from pandas.api.types import is_numeric_dtype
 from sklearn.metrics import check_scoring, get_scorer, make_scorer, roc_auc_score
@@ -27,8 +27,11 @@ except ImportError:
     from sklearn.metrics._scorer import SCORERS
     available_scorers = SCORERS
+from sklearn.metrics._regression import (
+    _check_reg_targets,
+    check_consistent_length,
+)
 from sklearn.metrics import mean_squared_error
-from sklearn.metrics._regression import _check_reg_targets, check_consistent_length
 from sklearn.model_selection import BaseCrossValidator
 from upgini.errors import ValidationError
@@ -85,73 +88,11 @@ CATBOOST_MULTICLASS_PARAMS = {
 LIGHTGBM_PARAMS = {
     "random_state": DEFAULT_RANDOM_STATE,
-    # "num_leaves": 16,
-    # "n_estimators": 150,
-    # "min_child_weight": 1,
+    "num_leaves": 16,
     "max_depth": 4,
-    "max_cat_threshold": 80,
-    "min_data_per_group": 25,
-    "num_boost_round": 150,
-    "cat_l2": 10,
-    "cat_smooth": 12,
-    "learning_rate": 0.05,
-    "feature_fraction": 1.0,
-    "min_sum_hessian_in_leaf": 0.01,
-}
-LIGHTGBM_REGRESSION_PARAMS = {
-    "random_state": DEFAULT_RANDOM_STATE,
-    "deterministic": True,
-    "min_gain_to_split": 0.001,
-    "n_estimators": 275,
-    "max_depth": 5,
-    "max_cat_threshold": 80,
-    "min_data_per_group": 25,
-    "cat_l2": 10,
-    "cat_smooth": 12,
+    "n_estimators": 150,
     "learning_rate": 0.05,
-    "feature_fraction": 1.0,
-    "min_sum_hessian_in_leaf": 0.01,
-    "objective": "huber",
-    "verbosity": -1,
-}
-LIGHTGBM_MULTICLASS_PARAMS = {
-    "random_state": DEFAULT_RANDOM_STATE,
-    "deterministic": True,
-    "min_gain_to_split": 0.001,
-    "n_estimators": 275,
-    "max_depth": 3,
-    "max_cat_threshold": 80,
-    "min_data_per_group": 25,
-    "cat_l2": 10,
-    "cat_smooth": 12,
-    "learning_rate": 0.25,  # CatBoost 0.25
-    "min_sum_hessian_in_leaf": 0.01,
-    "class_weight": "balanced",  # TODO pass dict with weights for each class
-    "objective": "multiclass",
-    "use_quantized_grad": "true",
-    "num_grad_quant_bins": "8",
-    "stochastic_rounding": "true",
-    "verbosity": -1,
-}
-LIGHTGBM_BINARY_PARAMS = {
-    "random_state": DEFAULT_RANDOM_STATE,
-    "deterministic": True,
-    "min_gain_to_split": 0.001,
-    "n_estimators": 275,
-    "max_depth": 5,
-    "max_cat_threshold": 80,
-    "min_data_per_group": 25,
-    "cat_l2": 10,
-    "cat_smooth": 12,
-    "learning_rate": 0.05,
-    "feature_fraction": 1.0,
-    "min_sum_hessian_in_leaf": 0.01,
-    "objective": "binary",
-    "class_weight": "balanced",  # TODO pass dict with weights for each class
-    "verbosity": -1,
+    "min_child_weight": 1,
 }
 N_FOLDS = 5
@@ -270,15 +211,6 @@ SUPPORTED_CATBOOST_METRICS = {
 }
-def is_catboost_estimator(estimator):
-    try:
-        from catboost import CatBoostClassifier, CatBoostRegressor
-        return isinstance(estimator, (CatBoostClassifier, CatBoostRegressor))
-    except ImportError:
-        return False
 @dataclass
 class _CrossValResults:
     metric: Optional[float]
@@ -360,7 +292,7 @@ class EstimatorWrapper:
         self.logger.info(f"After preparing data columns: {x.columns.to_list()}")
         return x, y, groups
-    def _remove_empty_target_rows(self, x: pd.DataFrame, y: pd.Series) -> Tuple[pd.DataFrame, np.ndarray]:
+    def _remove_empty_target_rows(self, x: pd.DataFrame, y: pd.Series) -> Tuple[pd.DataFrame, pd.Series]:
         joined = pd.concat([x, y], axis=1)
         joined = joined[joined[y.name].notna()]
         joined = joined.reset_index(drop=True)
@@ -414,15 +346,12 @@ class EstimatorWrapper:
             for estimator, split in zip(self.cv_estimators, splits):
                 _, validation_idx = split
                 cv_x = x.iloc[validation_idx]
-                if isinstance(y, pd.Series):
-                    cv_y = y.iloc[validation_idx]
-                else:
-                    cv_y = y[validation_idx]
+                cv_y = y[validation_idx]
                 shaps = self.calculate_shap(cv_x, cv_y, estimator)
                 if shaps is not None:
                     for feature, shap_value in shaps.items():
                         # shap_values_all_folds[feature] = shap_values_all_folds.get(feature, []) + shap_value.tolist()
-                        shap_values_all_folds[feature].append(shap_value)
+                        shap_values_all_folds[feature].extend(shap_value.tolist())
         if shap_values_all_folds:
             average_shap_values = {
@@ -498,18 +427,21 @@ class EstimatorWrapper:
         }
         if estimator is None:
             params = {}
+            params["has_time"] = has_date
+            # if metric_name.upper() in SUPPORTED_CATBOOST_METRICS:
+            #     params["eval_metric"] = SUPPORTED_CATBOOST_METRICS[metric_name.upper()]
             if target_type == ModelTaskType.MULTICLASS:
-                params = _get_add_params(params, LIGHTGBM_MULTICLASS_PARAMS)
+                params = _get_add_params(params, CATBOOST_MULTICLASS_PARAMS)
                 params = _get_add_params(params, add_params)
-                estimator = LightGBMWrapper(LGBMClassifier(**params), **kwargs)
+                estimator = CatBoostWrapper(CatBoostClassifier(**params), **kwargs)
             elif target_type == ModelTaskType.BINARY:
-                params = _get_add_params(params, LIGHTGBM_BINARY_PARAMS)
+                params = _get_add_params(params, CATBOOST_BINARY_PARAMS)
                 params = _get_add_params(params, add_params)
-                estimator = LightGBMWrapper(LGBMClassifier(**params), **kwargs)
+                estimator = CatBoostWrapper(CatBoostClassifier(**params), **kwargs)
             elif target_type == ModelTaskType.REGRESSION:
-                params = _get_add_params(params, LIGHTGBM_REGRESSION_PARAMS)
+                params = _get_add_params(params, CATBOOST_REGRESSION_PARAMS)
                 params = _get_add_params(params, add_params)
-                estimator = LightGBMWrapper(LGBMRegressor(**params), **kwargs)
+                estimator = CatBoostWrapper(CatBoostRegressor(**params), **kwargs)
             else:
                 raise Exception(bundle.get("metrics_unsupported_target_type").format(target_type))
         else:
@@ -518,21 +450,31 @@ class EstimatorWrapper:
             else:
                 estimator_copy = deepcopy(estimator)
             kwargs["estimator"] = estimator_copy
-            if is_catboost_estimator(estimator):
+            if isinstance(estimator, (CatBoostClassifier, CatBoostRegressor)):
                 if cat_features is not None:
                     for cat_feature in cat_features:
                         if cat_feature not in x.columns:
                             logger.error(
                                 f"Client cat_feature `{cat_feature}` not found in x columns: {x.columns.to_list()}"
                             )
-                    estimator_copy.set_params(cat_features=cat_features, has_time=has_date)
+                    estimator_copy.set_params(
+                        # cat_features=[x.columns.get_loc(cat_feature) for cat_feature in cat_features]
+                        cat_features=cat_features
+                    )
                 estimator = CatBoostWrapper(**kwargs)
             else:
-                if isinstance(estimator, (LGBMClassifier, LGBMRegressor)):
-                    estimator = LightGBMWrapper(**kwargs)
-                elif is_catboost_estimator(estimator):
-                    estimator = CatBoostWrapper(**kwargs)
-                else:
+                try:
+                    from lightgbm import LGBMClassifier, LGBMRegressor
+                    if isinstance(estimator, (LGBMClassifier, LGBMRegressor)):
+                        estimator = LightGBMWrapper(**kwargs)
+                    else:
+                        logger.warning(
+                            f"Unexpected estimator is used for metrics: {estimator}. "
+                            "Default strategy for category features will be used"
+                        )
+                        estimator = OtherEstimatorWrapper(**kwargs)
+                except ModuleNotFoundError:
                     logger.warning(
                         f"Unexpected estimator is used for metrics: {estimator}. "
                         "Default strategy for category features will be used"
@@ -545,7 +487,7 @@ class EstimatorWrapper:
 class CatBoostWrapper(EstimatorWrapper):
     def __init__(
         self,
-        estimator,
+        estimator: Union[CatBoostClassifier, CatBoostRegressor],
         scorer: Callable,
         metric_name: str,
         multiplier: int,
@@ -575,9 +517,6 @@ class CatBoostWrapper(EstimatorWrapper):
         x, y, groups, params = super()._prepare_to_fit(x, y)
         # Find embeddings
-        import catboost
-        from catboost import CatBoostClassifier
         if hasattr(CatBoostClassifier, "get_embedding_feature_indices"):
             emb_pattern = r"(.+)_emb\d+"
             self.emb_features = [c for c in x.columns if re.match(emb_pattern, c) and is_numeric_dtype(x[c])]
@@ -698,10 +637,8 @@ class CatBoostWrapper(EstimatorWrapper):
             else:
                 raise e
-    def calculate_shap(self, x: pd.DataFrame, y: pd.Series, estimator) -> Optional[Dict[str, float]]:
+    def calculate_shap(self, x: pd.DataFrame, y: pd.Series, estimator: CatBoost) -> Optional[Dict[str, float]]:
         try:
-            from catboost import Pool
             # Create Pool for fold data, if need (for example, when categorical features are present)
             fold_pool = Pool(
                 x,
@@ -758,59 +695,25 @@ class LightGBMWrapper(EstimatorWrapper):
         self.cat_features = None
     def _prepare_to_fit(self, x: pd.DataFrame, y: pd.Series) -> Tuple[pd.DataFrame, pd.Series, np.ndarray, dict]:
-        x, y_numpy, groups, params = super()._prepare_to_fit(x, y)
+        x, y, groups, params = super()._prepare_to_fit(x, y)
         self.cat_features = _get_cat_features(x)
         x = fill_na_cat_features(x, self.cat_features)
         for feature in self.cat_features:
             x[feature] = x[feature].astype("category").cat.codes
-        if not is_numeric_dtype(y_numpy):
-            y_numpy = correct_string_target(y_numpy)
+        if not is_numeric_dtype(y):
+            y = correct_string_target(y)
-        return x, y_numpy, groups, params
+        return x, y, groups, params
     def _prepare_to_calculate(self, x: pd.DataFrame, y: pd.Series) -> Tuple[pd.DataFrame, np.ndarray, dict]:
-        x, y_numpy, params = super()._prepare_to_calculate(x, y)
+        x, y, params = super()._prepare_to_calculate(x, y)
         if self.cat_features is not None:
             x = fill_na_cat_features(x, self.cat_features)
             for feature in self.cat_features:
                 x[feature] = x[feature].astype("category").cat.codes
         if not is_numeric_dtype(y):
-            y_numpy = correct_string_target(y_numpy)
-        return x, y_numpy, params
-    def calculate_shap(self, x: pd.DataFrame, y: pd.Series, estimator) -> Optional[Dict[str, float]]:
-        try:
-            # Suppress specific warning from SHAP for LightGBM binary classifier
-            warnings.filterwarnings(
-                "ignore",
-                message=(
-                    "LightGBM binary classifier with TreeExplainer shap values output has changed to a list of ndarray"
-                ),
-            )
-            from shap import TreeExplainer
-            if not isinstance(estimator, (LGBMRegressor, LGBMClassifier)):
-                return None
-            explainer = TreeExplainer(estimator)
-            shap_values = explainer.shap_values(x)
-            # For classification, shap_values is returned as a list for each class
-            # Take values for the positive class
-            if isinstance(shap_values, list):
-                shap_values = shap_values[1]
-            # Calculate mean absolute SHAP value for each feature
-            feature_importance = {}
-            for i, col in enumerate(x.columns):
-                feature_importance[col] = np.mean(np.abs(shap_values[:, i]))
-            return feature_importance
-        except Exception as e:
-            self.logger.warning(f"Failed to calculate SHAP values: {str(e)}")
-            return None
+            y = correct_string_target(y)
+        return x, y, params
 class OtherEstimatorWrapper(EstimatorWrapper):

upgini/resource_bundle/strings.properties CHANGED Viewed

@@ -80,7 +80,6 @@ email_and_hem_simultanious=EMAIL and HEM search keys cannot be used simultaneous
 postal_code_without_country=COUNTRY search key required if POSTAL_CODE is present
 multiple_search_key=Search key {} passed multiple times
 unregistered_only_personal_keys=Only personal search keys used. Api_key from profile.upgini.com required for EMAIL/HEM, PHONE NUMBER or IPv4/IPv6 search keys\nSee docs https://github.com/upgini/upgini#-open-up-all-capabilities-of-upgini
-only_custom_keys=Only CUSTOM_KEY search keys were provided. At least one of DATE, COUNTRY, POSTAL_CODE, PHONE, EMAIL, HEM, IP should be provided
 search_key_not_found=Column `{}` from search_keys was not found in X dataframe: {}
 numeric_search_key_not_found=Index {} in search_keys is out of bounds for {} columns of X dataframe
 unsupported_search_key_type=Unsupported type of key in search_keys: {}
@@ -137,6 +136,7 @@ x_and_eval_x_diff_types=X and eval_set X has different types: {} and {}
 baseline_score_column_not_exists=baseline_score_column {} doesn't exist in input dataframe
 baseline_score_column_has_na=baseline_score_column contains NaN. Clear it and and retry
 missing_features_for_transform=Missing some features for transform that were presented on fit: {}
+missing_target_for_transform=Search contains features on target. Please add y to the call and try again
 missing_id_column=Id column {} not found in X
     # target validation
 empty_target=Target is empty in all rows

upgini/search_task.py CHANGED Viewed

@@ -168,7 +168,13 @@ class SearchTask:
         for meta in self.provider_metadata_v2:
             if meta.features_used_for_embeddings is not None:
                 features_for_transform.update(meta.features_used_for_embeddings)
+            if meta.generated_features:
+                features_for_transform.update(
+                    c.original_name
+                    for f in meta.generated_features
+                    for c in f.base_columns
+                    if c.ads_definition_id is None
+                )
         return list(features_for_transform)
     def get_shuffle_kfold(self) -> Optional[bool]:

upgini/utils/deduplicate_utils.py CHANGED Viewed

@@ -74,8 +74,6 @@ def remove_fintech_duplicates(
         # Checking for different dates by the same personal keys
         uniques = grouped_by_personal_cols[date_col].nunique()
         total = len(uniques)
-        if total == 0:
-            return segment_df, None
         diff_dates = len(uniques[uniques > 1])
         if diff_dates / total >= 0.6:
             return segment_df, None

upgini/utils/feature_info.py CHANGED Viewed

@@ -90,8 +90,7 @@ class FeatureInfo:
 def _get_feature_sample(feature_meta: FeaturesMetadataV2, data: Optional[pd.DataFrame]) -> str:
     if data is not None and len(data) > 0 and feature_meta.name in data.columns:
         if len(data) > 3:
-            rand = np.random.RandomState(42)
-            feature_sample = rand.choice(data[feature_meta.name].dropna().unique(), 3).tolist()
+            feature_sample = np.random.choice(data[feature_meta.name].dropna().unique(), 3).tolist()
         else:
             feature_sample = data[feature_meta.name].dropna().unique().tolist()
         if len(feature_sample) > 0 and isinstance(feature_sample[0], float):

upgini/utils/mstats.py CHANGED Viewed

@@ -118,7 +118,7 @@ def spearmanr(
     # - dof: degrees of freedom
     # - t_stat: t-statistic
     # - alternative: 'two-sided', 'greater', 'less'
-    def compute_t_pvalue(t_stat, dof, alternative='two-sided'):
+    def compute_t_pvalue(t_stat, dof, alternative="two-sided"):
         from scipy.stats import t
         if alternative == "two-sided":

upgini/utils/sklearn_ext.py CHANGED Viewed

@@ -9,6 +9,7 @@ from traceback import format_exc
 import numpy as np
 import scipy.sparse as sp
+from catboost import CatBoostClassifier, CatBoostRegressor
 from joblib import Parallel, logger
 from scipy.sparse import issparse
 from sklearn import config_context, get_config
@@ -341,14 +342,6 @@ def cross_validate(
         raise e
-def is_catboost_estimator(estimator):
-    try:
-        from catboost import CatBoostClassifier, CatBoostRegressor
-        return isinstance(estimator, (CatBoostClassifier, CatBoostRegressor))
-    except ImportError:
-        return False
 def _fit_and_score(
     estimator,
     X,
@@ -504,7 +497,7 @@ def _fit_and_score(
         if y_train is None:
             estimator.fit(X_train, **fit_params)
         else:
-            if is_catboost_estimator(estimator):
+            if isinstance(estimator, (CatBoostClassifier, CatBoostRegressor)):
                 fit_params = fit_params.copy()
                 fit_params["eval_set"] = [(X_test, y_test)]
             estimator.fit(X_train, y_train, **fit_params)

{upgini-1.2.70a3832.dev3.dist-info → upgini-1.2.71a3810.dev2.dist-info}/METADATA RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.3
 Name: upgini
-Version: 1.2.70a3832.dev3
+Version: 1.2.71a3810.dev2
 Summary: Intelligent data search & enrichment for Machine Learning
 Project-URL: Bug Reports, https://github.com/upgini/upgini/issues
 Project-URL: Homepage, https://upgini.com/
@@ -17,20 +17,19 @@ Classifier: Intended Audience :: Science/Research
 Classifier: Intended Audience :: Telecommunications Industry
 Classifier: License :: OSI Approved :: BSD License
 Classifier: Operating System :: OS Independent
-Classifier: Programming Language :: Python :: 3.8
-Classifier: Programming Language :: Python :: 3.9
 Classifier: Programming Language :: Python :: 3.10
+Classifier: Programming Language :: Python :: 3.11
 Classifier: Topic :: Scientific/Engineering :: Artificial Intelligence
 Classifier: Topic :: Scientific/Engineering :: Information Analysis
-Requires-Python: <3.12,>=3.8
+Requires-Python: <3.12,>=3.10
+Requires-Dist: catboost>=1.0.3
 Requires-Dist: fastparquet>=0.8.1
 Requires-Dist: ipywidgets>=8.1.0
 Requires-Dist: jarowinkler>=2.0.0
 Requires-Dist: levenshtein>=0.25.1
-Requires-Dist: lightgbm>=4.6.0
-Requires-Dist: numpy<3.0.0,>=1.19.0
+Requires-Dist: numpy<=1.26.4,>=1.19.0
 Requires-Dist: pandas<3.0.0,>=1.1.0
-Requires-Dist: psutil>=5.9.0
+Requires-Dist: psutil>=6.0.0
 Requires-Dist: pydantic<3.0.0,>1.0.0
 Requires-Dist: pyjwt>=2.8.0
 Requires-Dist: python-bidi==0.4.2
@@ -39,7 +38,6 @@ Requires-Dist: python-json-logger>=3.3.0
 Requires-Dist: requests>=2.8.0
 Requires-Dist: scikit-learn>=1.3.0
 Requires-Dist: scipy>=1.10.0
-Requires-Dist: shap>=0.44.0
 Requires-Dist: xhtml2pdf<0.3.0,>=0.2.11
 Description-Content-Type: text/markdown

{upgini-1.2.70a3832.dev3.dist-info → upgini-1.2.71a3810.dev2.dist-info}/RECORD RENAMED Viewed

@@ -1,14 +1,14 @@
-upgini/__about__.py,sha256=uuivsPy9A1ISVUFLN2as6edeg8kbhfwpyVZyOBxEKu0,33
+upgini/__about__.py,sha256=MTGUBBTe5h0uDXYCCEi_Ls0ph00v8U1H8Ryg234maxU,33
 upgini/__init__.py,sha256=LXSfTNU0HnlOkE69VCxkgIKDhWP-JFo_eBQ71OxTr5Y,261
 upgini/ads.py,sha256=nvuRxRx5MHDMgPr9SiU-fsqRdFaBv8p4_v1oqiysKpc,2714
-upgini/dataset.py,sha256=1rb6BzyuiQFGVCTDmKL2wox3UFRNjtNaIJOwQnZ801A,34956
+upgini/dataset.py,sha256=nCPfkQIlAanLgCpcmsDfxFXmg99dRm9m0K_ibdLUr-4,35365
 upgini/errors.py,sha256=2b_Wbo0OYhLUbrZqdLIx5jBnAsiD1Mcenh-VjR4HCTw,950
-upgini/features_enricher.py,sha256=4IstUZpQu4gN322LtVvpDMzTiMe5vmtjDr-U17588kk,205808
-upgini/http.py,sha256=RvzcShpDXssLs6ycGN8xilkKi8ZV9XGUrrk8bwdUzbw,43607
+upgini/features_enricher.py,sha256=KqDQ29sU1Aty5Z40DDqO869Y_CClQfmU58nE9rScxRc,204434
+upgini/http.py,sha256=ud0Cp7h0jNeHuuZGpU_1dAAEiabGoJjGxc1X5oeBQr4,43496
 upgini/lazy_import.py,sha256=74gQ8JuA48BGRLxAo7lNHNKY2D2emMxrUxKGdxVGhuY,1012
-upgini/metadata.py,sha256=Jh6YTaS00m_nbaOY_owvlSyn9zgkErkqu8iTr9ZjKI8,12279
-upgini/metrics.py,sha256=I0sVJLNp4fiIq7ZFcUdNTxJjFkzStdFuKbnf2niEGjc,38207
-upgini/search_task.py,sha256=qxUxAD-bed-FpZYmTB_4orW7YJsW_O6a1TcgnZIRFr4,17307
+upgini/metadata.py,sha256=Yd6iW2f7Wz6vUkg5uvR4xylN16ANnCKVKqAsAkap7p8,12354
+upgini/metrics.py,sha256=t7uOOnlDYvP6E3DLjPMQcFBjyhJfUQY8aUlx7N0Mh-s,35477
+upgini/search_task.py,sha256=EuCGp0iCWz2fpuJgN6M47aP_CtIi3Oq9zw78w0mkKiU,17595
 upgini/spinner.py,sha256=4iMd-eIe_BnkqFEMIliULTbj6rNI2HkN_VJ4qYe0cUc,1118
 upgini/version_validator.py,sha256=DvbaAvuYFoJqYt0fitpsk6Xcv-H1BYDJYHUMxaKSH_Y,1509
 upgini/ads_management/__init__.py,sha256=qzyisOToVRP-tquAJD1PblZhNtMrOB8FiyF9JvfkvgE,50
@@ -16,19 +16,20 @@ upgini/ads_management/ads_manager.py,sha256=igVbN2jz80Umb2BUJixmJVj-zx8unoKpecVo
 upgini/autofe/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
 upgini/autofe/all_operators.py,sha256=rdjF5eaE4bC6Q4eu_el5Z7ekYt8DjOFermz2bePPbUc,333
 upgini/autofe/binary.py,sha256=MnQuFiERpocjCPQUjOljlsq5FE-04GPfwtNjzvfNMyU,7671
-upgini/autofe/date.py,sha256=I07psJerrxOcHao91PdSCk9X6KWu61IBVyFRLjGNgK8,10730
-upgini/autofe/feature.py,sha256=xgu6bVIlUJ5PCUgoXQRNcGkcMOhj-_BdDRmkB_qRFS4,14766
+upgini/autofe/date.py,sha256=C86F7sPiscUGq2a45UtQA9ADWBWg0kt54mePHHzjbLE,10633
+upgini/autofe/feature.py,sha256=y1x3wijhTVBmloayQAHiscqKU9Ll8kLcGm1PdvS357I,14910
 upgini/autofe/groupby.py,sha256=IYmQV9uoCdRcpkeWZj_kI3ObzoNCNx3ff3h8sTL01tk,3603
 upgini/autofe/operator.py,sha256=EOffJw6vKXpEh5yymqb1RFNJPxGxmnHdFRo9dB5SCFo,4969
-upgini/autofe/unary.py,sha256=yVgPvtfnPSOhrii0YgezddmgWPwyOBCR0JutaIkdTTc,4658
+upgini/autofe/unary.py,sha256=_4F3ZyuPUz2nbkJFMJi2Dk5FirGZngUammstgK1Fq34,5720
+upgini/autofe/utils.py,sha256=fK1am2_tQj3fL2vDslblye8lmyfWgGIUOX1beYVBz4k,2420
 upgini/autofe/vector.py,sha256=l0KdKg-txlZxDSE4hPPfCtfGQofYbl7oaABPr830sPI,667
 upgini/autofe/timeseries/__init__.py,sha256=PGwwDAMwvkXl3el12tXVEmZUgDUvlmIPlXtROm6bD18,738
-upgini/autofe/timeseries/base.py,sha256=T9Ec8LKJbiwTUGGsd_xhM0U0NUJblqmKchkzUI1sK88,3755
-upgini/autofe/timeseries/cross.py,sha256=Sh5hAXZFWKaFRqf_JGODu9pWO2tmuV5VKyK9eX3i7-I,4931
+upgini/autofe/timeseries/base.py,sha256=MYK260n3h9kEbgunbyp0cpR0pgNHml3N2WDLGW5BLDU,3603
+upgini/autofe/timeseries/cross.py,sha256=xpHHVITXYUK20BgEZlqKN1Uy2uxKnHz72gngjt7BxVE,5316
 upgini/autofe/timeseries/delta.py,sha256=h0YhmI1TlPJnjwFpN_GQxLb6r59DQuucnG5tQAXSgjU,3520
 upgini/autofe/timeseries/lag.py,sha256=LfQtg484vuqM0mgY4Wft1swHX_Srq7OKKgZswCXoiXI,1882
-upgini/autofe/timeseries/roll.py,sha256=bNFMDszSYTWvB7EyhHbRY1DJqzSURvHlPAcBebt0y0Y,2878
-upgini/autofe/timeseries/trend.py,sha256=9p2Q5ByAi6cx9RH9teBTe8FyjSzqthznC2Lo5dsJ0ho,2051
+upgini/autofe/timeseries/roll.py,sha256=zADKXU-eYWQnQ5R3am1yEal8uU6Tm0jLAixwPb_aCHg,2794
+upgini/autofe/timeseries/trend.py,sha256=K1_iw2ko_LIUU8YCUgrvN3n0MkHtsi7-63-8x9er1k4,2129
 upgini/autofe/timeseries/volatility.py,sha256=9shUmIKjpWTHVYjj80YBsk0XheBJ9uBuLv5NW9Mchnk,7953
 upgini/data_source/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
 upgini/data_source/data_source_publisher.py,sha256=4S9qwlAklD8vg9tUU_c1pHE2_glUHAh15-wr5hMwKFw,22879
@@ -38,7 +39,7 @@ upgini/normalizer/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU
 upgini/normalizer/normalize_utils.py,sha256=Ft2MwSgVoBilXAORAOYAuwPD79GOLfwn4qQE3IUFzzg,7218
 upgini/resource_bundle/__init__.py,sha256=S5F2G47pnJd2LDpmFsjDqEwiKkP8Hm-hcseDbMka6Ko,8345
 upgini/resource_bundle/exceptions.py,sha256=5fRvx0_vWdE1-7HcSgF0tckB4A9AKyf5RiinZkInTsI,621
-upgini/resource_bundle/strings.properties,sha256=XU5ulr5ZDQfGbFk9QdFDzl3oDMaw0eDYCPoEq3ZvIkw,27687
+upgini/resource_bundle/strings.properties,sha256=LDT-jtYlrD1IXvWjFSf-dtvapje0qSrqI9W3v7y2zVo,27646
 upgini/resource_bundle/strings_widget.properties,sha256=gOdqvZWntP2LCza_tyVk1_yRYcG4c04K9sQOAVhF_gw,1577
 upgini/sampler/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
 upgini/sampler/base.py,sha256=7GpjYqjOp58vYcJLiX__1R5wjUlyQbxvHJ2klFnup_M,6389
@@ -52,25 +53,25 @@ upgini/utils/country_utils.py,sha256=lY-eXWwFVegdVENFttbvLcgGDjFO17Sex8hd2PyJaRk
 upgini/utils/custom_loss_utils.py,sha256=kieNZYBYZm5ZGBltF1F_jOSF4ea6C29rYuCyiDcqVNY,3857
 upgini/utils/cv_utils.py,sha256=w6FQb9nO8BWDx88EF83NpjPLarK4eR4ia0Wg0kLBJC4,3525
 upgini/utils/datetime_utils.py,sha256=_jq-kn_dGNFfs-DGXcWCGzy9bkplfAjrZ8SsmN28zXc,13535
-upgini/utils/deduplicate_utils.py,sha256=AcMLoObMjhOTQ_fMS1LWy0GKp6WXnZ-FNux_8V3nbZU,8914
+upgini/utils/deduplicate_utils.py,sha256=SMZx9IKIhWI5HqXepfKiQb3uDJrogQZtG6jcWuMo5Z4,8855
 upgini/utils/display_utils.py,sha256=DsBjJ8jEYAh8BPgfAbzq5imoGFV6IACP20PQ78BQCX0,11964
 upgini/utils/email_utils.py,sha256=pZ2vCfNxLIPUhxr0-OlABNXm12jjU44isBk8kGmqQzA,5277
 upgini/utils/fallback_progress_bar.py,sha256=PDaKb8dYpVZaWMroNcOHsTc3pSjgi9mOm0--cOFTwJ0,1074
-upgini/utils/feature_info.py,sha256=Q9HN6A-fvfVD-irFWrmOqqZG9RsUSvh5MTY_k0xu-tE,7287
+upgini/utils/feature_info.py,sha256=m1tQcT3hTChPAiXzpk0WQcEqElj8KgeCifEJFa7-gss,7247
 upgini/utils/features_validator.py,sha256=lEfmk4DoxZ4ooOE1HC0ZXtUb_lFKRFHIrnFULZ4_rL8,3746
 upgini/utils/format.py,sha256=Yv5cvvSs2bOLUzzNu96Pu33VMDNbabio92QepUj41jU,243
 upgini/utils/ip_utils.py,sha256=TSQ_qDsLlVnm09X1HacpabEf_HNqSWpxBF4Sdc2xs08,6580
-upgini/utils/mstats.py,sha256=dLJQr5Ak5BAoV-pDPpnfvMURZVkZ3_v250QzAsSlqY4,6286
+upgini/utils/mstats.py,sha256=u3gQVUtDRbyrOQK6V1UJ2Rx1QbkSNYGjXa6m3Z_dPVs,6286
 upgini/utils/phone_utils.py,sha256=IrbztLuOJBiePqqxllfABWfYlfAjYevPhXKipl95wUI,10432
 upgini/utils/postal_code_utils.py,sha256=5M0sUqH2DAr33kARWCTXR-ACyzWbjDq_-0mmEml6ZcU,1716
 upgini/utils/progress_bar.py,sha256=N-Sfdah2Hg8lXP_fV9EfUTXz_PyRt4lo9fAHoUDOoLc,1550
-upgini/utils/sklearn_ext.py,sha256=E7zfYqBW597LetYXHxyM-i4f8luHsGIuP6mMJ2wtSMs,44661
+upgini/utils/sklearn_ext.py,sha256=13jQS_k7v0aUtudXV6nGUEWjttPQzAW9AFYL5wgEz9k,44511
 upgini/utils/sort.py,sha256=H79A17NMoHtLbqLCPFx_MBUloLZcDKjOba_H4gCE3t8,6965
 upgini/utils/target_utils.py,sha256=b1GzO8_gMcwXSZ2v98CY50MJJBzKbWHId_BJGybXfkM,16579
 upgini/utils/track_info.py,sha256=G5Lu1xxakg2_TQjKZk4b5SvrHsATTXNVV3NbvWtT8k8,5663
 upgini/utils/ts_utils.py,sha256=26vhC0pN7vLXK6R09EEkMK3Lwb9IVPH7LRdqFIQ3kPs,1383
 upgini/utils/warning_counter.py,sha256=-GRY8EUggEBKODPSuXAkHn9KnEQwAORC0mmz_tim-PM,254
-upgini-1.2.70a3832.dev3.dist-info/METADATA,sha256=_eHvyDouLdNk5oiA0DK2HBPVmOqgjwy0Ud76LDaElGU,49149
-upgini-1.2.70a3832.dev3.dist-info/WHEEL,sha256=1yFddiXMmvYK7QYTqtRNtX66WJ0Mz8PYEiEUoOUUxRY,87
-upgini-1.2.70a3832.dev3.dist-info/licenses/LICENSE,sha256=5RRzgvdJUu3BUDfv4bzVU6FqKgwHlIay63pPCSmSgzw,1514
-upgini-1.2.70a3832.dev3.dist-info/RECORD,,
+upgini-1.2.71a3810.dev2.dist-info/METADATA,sha256=KShCDNaZiUeH7OC7TETgJwx-UCZ9QWlaMcML-eZPJGY,49075
+upgini-1.2.71a3810.dev2.dist-info/WHEEL,sha256=zEMcRr9Kr03x1ozGwg5v9NQBKn3kndp6LSoSlVg-jhU,87
+upgini-1.2.71a3810.dev2.dist-info/licenses/LICENSE,sha256=5RRzgvdJUu3BUDfv4bzVU6FqKgwHlIay63pPCSmSgzw,1514
+upgini-1.2.71a3810.dev2.dist-info/RECORD,,

{upgini-1.2.70a3832.dev3.dist-info → upgini-1.2.71a3810.dev2.dist-info}/WHEEL RENAMED Viewed

@@ -1,4 +1,4 @@
 Wheel-Version: 1.0
-Generator: hatchling 1.25.0
+Generator: hatchling 1.24.2
 Root-Is-Purelib: true
 Tag: py3-none-any

{upgini-1.2.70a3832.dev3.dist-info → upgini-1.2.71a3810.dev2.dist-info}/licenses/LICENSE RENAMED Viewed

File without changes

upgini 1.2.70a3832.dev3__py3-none-any.whl → 1.2.71a3810.dev2__py3-none-any.whl

Potentially problematic release.

upgini 1.2.70a3832.dev3__py3-none-any.whl → 1.2.71a3810.dev2__py3-none-any.whl