upgini 1.1.294__tar.gz → 1.1.296__tar.gz
This diff compares the contents of two publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between those package versions as they appear in their respective public registries.
Potentially problematic release.
This version of upgini might be problematic. Click here for more details.
- {upgini-1.1.294 → upgini-1.1.296}/PKG-INFO +1 -1
- upgini-1.1.296/src/upgini/__about__.py +1 -0
- {upgini-1.1.294 → upgini-1.1.296}/src/upgini/data_source/data_source_publisher.py +37 -0
- {upgini-1.1.294 → upgini-1.1.296}/src/upgini/features_enricher.py +1 -1
- {upgini-1.1.294 → upgini-1.1.296}/src/upgini/metrics.py +5 -0
- upgini-1.1.294/src/upgini/__about__.py +0 -1
- {upgini-1.1.294 → upgini-1.1.296}/.gitignore +0 -0
- {upgini-1.1.294 → upgini-1.1.296}/LICENSE +0 -0
- {upgini-1.1.294 → upgini-1.1.296}/README.md +0 -0
- {upgini-1.1.294 → upgini-1.1.296}/pyproject.toml +0 -0
- {upgini-1.1.294 → upgini-1.1.296}/src/upgini/__init__.py +0 -0
- {upgini-1.1.294 → upgini-1.1.296}/src/upgini/ads.py +0 -0
- {upgini-1.1.294 → upgini-1.1.296}/src/upgini/ads_management/__init__.py +0 -0
- {upgini-1.1.294 → upgini-1.1.296}/src/upgini/ads_management/ads_manager.py +0 -0
- {upgini-1.1.294 → upgini-1.1.296}/src/upgini/autofe/__init__.py +0 -0
- {upgini-1.1.294 → upgini-1.1.296}/src/upgini/autofe/all_operands.py +0 -0
- {upgini-1.1.294 → upgini-1.1.296}/src/upgini/autofe/binary.py +0 -0
- {upgini-1.1.294 → upgini-1.1.296}/src/upgini/autofe/date.py +0 -0
- {upgini-1.1.294 → upgini-1.1.296}/src/upgini/autofe/feature.py +0 -0
- {upgini-1.1.294 → upgini-1.1.296}/src/upgini/autofe/groupby.py +0 -0
- {upgini-1.1.294 → upgini-1.1.296}/src/upgini/autofe/operand.py +0 -0
- {upgini-1.1.294 → upgini-1.1.296}/src/upgini/autofe/unary.py +0 -0
- {upgini-1.1.294 → upgini-1.1.296}/src/upgini/autofe/vector.py +0 -0
- {upgini-1.1.294 → upgini-1.1.296}/src/upgini/data_source/__init__.py +0 -0
- {upgini-1.1.294 → upgini-1.1.296}/src/upgini/dataset.py +0 -0
- {upgini-1.1.294 → upgini-1.1.296}/src/upgini/errors.py +0 -0
- {upgini-1.1.294 → upgini-1.1.296}/src/upgini/http.py +0 -0
- {upgini-1.1.294 → upgini-1.1.296}/src/upgini/lazy_import.py +0 -0
- {upgini-1.1.294 → upgini-1.1.296}/src/upgini/mdc/__init__.py +0 -0
- {upgini-1.1.294 → upgini-1.1.296}/src/upgini/mdc/context.py +0 -0
- {upgini-1.1.294 → upgini-1.1.296}/src/upgini/metadata.py +0 -0
- {upgini-1.1.294 → upgini-1.1.296}/src/upgini/normalizer/__init__.py +0 -0
- {upgini-1.1.294 → upgini-1.1.296}/src/upgini/normalizer/phone_normalizer.py +0 -0
- {upgini-1.1.294 → upgini-1.1.296}/src/upgini/resource_bundle/__init__.py +0 -0
- {upgini-1.1.294 → upgini-1.1.296}/src/upgini/resource_bundle/exceptions.py +0 -0
- {upgini-1.1.294 → upgini-1.1.296}/src/upgini/resource_bundle/strings.properties +0 -0
- {upgini-1.1.294 → upgini-1.1.296}/src/upgini/resource_bundle/strings_widget.properties +0 -0
- {upgini-1.1.294 → upgini-1.1.296}/src/upgini/sampler/__init__.py +0 -0
- {upgini-1.1.294 → upgini-1.1.296}/src/upgini/sampler/base.py +0 -0
- {upgini-1.1.294 → upgini-1.1.296}/src/upgini/sampler/random_under_sampler.py +0 -0
- {upgini-1.1.294 → upgini-1.1.296}/src/upgini/sampler/utils.py +0 -0
- {upgini-1.1.294 → upgini-1.1.296}/src/upgini/search_task.py +0 -0
- {upgini-1.1.294 → upgini-1.1.296}/src/upgini/spinner.py +0 -0
- {upgini-1.1.294 → upgini-1.1.296}/src/upgini/utils/__init__.py +0 -0
- {upgini-1.1.294 → upgini-1.1.296}/src/upgini/utils/base_search_key_detector.py +0 -0
- {upgini-1.1.294 → upgini-1.1.296}/src/upgini/utils/blocked_time_series.py +0 -0
- {upgini-1.1.294 → upgini-1.1.296}/src/upgini/utils/country_utils.py +0 -0
- {upgini-1.1.294 → upgini-1.1.296}/src/upgini/utils/custom_loss_utils.py +0 -0
- {upgini-1.1.294 → upgini-1.1.296}/src/upgini/utils/cv_utils.py +0 -0
- {upgini-1.1.294 → upgini-1.1.296}/src/upgini/utils/datetime_utils.py +0 -0
- {upgini-1.1.294 → upgini-1.1.296}/src/upgini/utils/deduplicate_utils.py +0 -0
- {upgini-1.1.294 → upgini-1.1.296}/src/upgini/utils/display_utils.py +0 -0
- {upgini-1.1.294 → upgini-1.1.296}/src/upgini/utils/email_utils.py +0 -0
- {upgini-1.1.294 → upgini-1.1.296}/src/upgini/utils/fallback_progress_bar.py +0 -0
- {upgini-1.1.294 → upgini-1.1.296}/src/upgini/utils/features_validator.py +0 -0
- {upgini-1.1.294 → upgini-1.1.296}/src/upgini/utils/format.py +0 -0
- {upgini-1.1.294 → upgini-1.1.296}/src/upgini/utils/ip_utils.py +0 -0
- {upgini-1.1.294 → upgini-1.1.296}/src/upgini/utils/phone_utils.py +0 -0
- {upgini-1.1.294 → upgini-1.1.296}/src/upgini/utils/postal_code_utils.py +0 -0
- {upgini-1.1.294 → upgini-1.1.296}/src/upgini/utils/progress_bar.py +0 -0
- {upgini-1.1.294 → upgini-1.1.296}/src/upgini/utils/sklearn_ext.py +0 -0
- {upgini-1.1.294 → upgini-1.1.296}/src/upgini/utils/target_utils.py +0 -0
- {upgini-1.1.294 → upgini-1.1.296}/src/upgini/utils/track_info.py +0 -0
- {upgini-1.1.294 → upgini-1.1.296}/src/upgini/utils/warning_counter.py +0 -0
- {upgini-1.1.294 → upgini-1.1.296}/src/upgini/version_validator.py +0 -0
|
@@ -0,0 +1 @@
|
|
|
1
|
+
__version__ = "1.1.296"
|
|
@@ -59,9 +59,35 @@ class DataSourcePublisher:
|
|
|
59
59
|
features_for_embeddings: Optional[List[str]] = DEFAULT_GENERATE_EMBEDDINGS,
|
|
60
60
|
data_table_id_to_replace: Optional[str] = None,
|
|
61
61
|
keep_features: Optional[List[str]] = None,
|
|
62
|
+
date_features: Optional[List[str]] = None,
|
|
63
|
+
date_vector_features: Optional[List[str]] = None,
|
|
62
64
|
_force_generation=False,
|
|
63
65
|
_silent=False,
|
|
64
66
|
) -> str:
|
|
67
|
+
"""Register new ADS
|
|
68
|
+
|
|
69
|
+
Parameters
|
|
70
|
+
----------
|
|
71
|
+
data_table_uri - str - table name in format {project_id}.{datasource_name}.{table_name}
|
|
72
|
+
|
|
73
|
+
search_keys - dict with column names as keys and SearchKey as value
|
|
74
|
+
|
|
75
|
+
update_frequency - str - (Monthly, Weekly, Daily, Annually, Quarterly)
|
|
76
|
+
|
|
77
|
+
exclude_from_autofe_generation - optional list of features that should be excluded from AutoFE
|
|
78
|
+
|
|
79
|
+
secondary_search_keys - optional dict of secondary search keys
|
|
80
|
+
|
|
81
|
+
sort_column - optional str - name of unique column that could be used for sort
|
|
82
|
+
|
|
83
|
+
date_format - optional str - format of date if it is present in search keys
|
|
84
|
+
|
|
85
|
+
...
|
|
86
|
+
|
|
87
|
+
data_table_id_to_replace - optional str - id of registered ADS that should be replaced by new table
|
|
88
|
+
|
|
89
|
+
keep_features - optional list - features that should not be removed from ADS (even if they are personal)
|
|
90
|
+
"""
|
|
65
91
|
trace_id = str(uuid.uuid4())
|
|
66
92
|
|
|
67
93
|
with MDC(trace_id=trace_id):
|
|
@@ -124,6 +150,14 @@ class DataSourcePublisher:
|
|
|
124
150
|
request["excludeFromGeneration"] = exclude_from_autofe_generation
|
|
125
151
|
if keep_features is not None:
|
|
126
152
|
request["keepFeatures"] = keep_features
|
|
153
|
+
if date_features is not None:
|
|
154
|
+
if date_format is None:
|
|
155
|
+
raise ValidationError("date_format should be presented if you use date features")
|
|
156
|
+
request["dateFeatures"] = date_features
|
|
157
|
+
if date_vector_features is not None:
|
|
158
|
+
if date_format is None:
|
|
159
|
+
raise ValidationError("date_format should be presented if you use date vector features")
|
|
160
|
+
request["dateVectorFeatures"] = date_vector_features
|
|
127
161
|
self.logger.info(f"Start registering data table {request}")
|
|
128
162
|
|
|
129
163
|
task_id = self._rest_client.register_ads(request, trace_id)
|
|
@@ -181,6 +215,9 @@ class DataSourcePublisher:
|
|
|
181
215
|
msg = f"Data table successfully registered with id: {data_table_id}"
|
|
182
216
|
self.logger.info(msg)
|
|
183
217
|
print(msg)
|
|
218
|
+
if "warnings" in status_response and status_response["warnings"]:
|
|
219
|
+
self.logger.warning(status_response["warnings"])
|
|
220
|
+
print(status_response["warnings"])
|
|
184
221
|
return data_table_id
|
|
185
222
|
except KeyboardInterrupt:
|
|
186
223
|
if task_id is not None:
|
|
@@ -2870,7 +2870,7 @@ class FeaturesEnricher(TransformerMixin):
|
|
|
2870
2870
|
self.logger.info(f"Dates interval is ({min_date}, {max_date})")
|
|
2871
2871
|
|
|
2872
2872
|
except Exception:
|
|
2873
|
-
self.logger.
|
|
2873
|
+
self.logger.warning("Failed to log debug information", exc_info=True)
|
|
2874
2874
|
|
|
2875
2875
|
def __handle_index_search_keys(self, df: pd.DataFrame, search_keys: Dict[str, SearchKey]) -> pd.DataFrame:
|
|
2876
2876
|
index_names = df.index.names if df.index.names != [None] else [DEFAULT_INDEX]
|
|
@@ -679,6 +679,11 @@ def validate_scoring_argument(scoring: Union[Callable, str, None]):
|
|
|
679
679
|
raise ValidationError(
|
|
680
680
|
f"Invalid scoring function passed {scoring}. It should accept 3 input arguments: estimator, x, y"
|
|
681
681
|
)
|
|
682
|
+
elif scoring is not None:
|
|
683
|
+
raise ValidationError(
|
|
684
|
+
f"Invalid scoring argument passed {scoring}. It should be string with scoring name or function"
|
|
685
|
+
" that accepts 3 input arguments: estimator, x, y"
|
|
686
|
+
)
|
|
682
687
|
|
|
683
688
|
|
|
684
689
|
def _get_scorer_by_name(scoring: str) -> Tuple[Callable, str, int]:
|
|
@@ -1 +0,0 @@
|
|
|
1
|
-
__version__ = "1.1.294"
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|