upgini 1.1.296a3521.dev9__tar.gz → 1.1.296a3521.dev10__tar.gz
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Potentially problematic release.
This version of upgini might be problematic. Click here for more details.
- {upgini-1.1.296a3521.dev9 → upgini-1.1.296a3521.dev10}/PKG-INFO +1 -1
- {upgini-1.1.296a3521.dev9 → upgini-1.1.296a3521.dev10}/pyproject.toml +1 -0
- upgini-1.1.296a3521.dev10/src/upgini/__about__.py +1 -0
- {upgini-1.1.296a3521.dev9 → upgini-1.1.296a3521.dev10}/src/upgini/autofe/feature.py +1 -1
- {upgini-1.1.296a3521.dev9 → upgini-1.1.296a3521.dev10}/src/upgini/data_source/data_source_publisher.py +37 -0
- {upgini-1.1.296a3521.dev9 → upgini-1.1.296a3521.dev10}/src/upgini/features_enricher.py +1 -1
- upgini-1.1.296a3521.dev9/src/upgini/__about__.py +0 -1
- {upgini-1.1.296a3521.dev9 → upgini-1.1.296a3521.dev10}/.gitignore +0 -0
- {upgini-1.1.296a3521.dev9 → upgini-1.1.296a3521.dev10}/LICENSE +0 -0
- {upgini-1.1.296a3521.dev9 → upgini-1.1.296a3521.dev10}/README.md +0 -0
- {upgini-1.1.296a3521.dev9 → upgini-1.1.296a3521.dev10}/src/upgini/__init__.py +0 -0
- {upgini-1.1.296a3521.dev9 → upgini-1.1.296a3521.dev10}/src/upgini/ads.py +0 -0
- {upgini-1.1.296a3521.dev9 → upgini-1.1.296a3521.dev10}/src/upgini/ads_management/__init__.py +0 -0
- {upgini-1.1.296a3521.dev9 → upgini-1.1.296a3521.dev10}/src/upgini/ads_management/ads_manager.py +0 -0
- {upgini-1.1.296a3521.dev9 → upgini-1.1.296a3521.dev10}/src/upgini/autofe/__init__.py +0 -0
- {upgini-1.1.296a3521.dev9 → upgini-1.1.296a3521.dev10}/src/upgini/autofe/all_operands.py +0 -0
- {upgini-1.1.296a3521.dev9 → upgini-1.1.296a3521.dev10}/src/upgini/autofe/binary.py +0 -0
- {upgini-1.1.296a3521.dev9 → upgini-1.1.296a3521.dev10}/src/upgini/autofe/date.py +0 -0
- {upgini-1.1.296a3521.dev9 → upgini-1.1.296a3521.dev10}/src/upgini/autofe/groupby.py +0 -0
- {upgini-1.1.296a3521.dev9 → upgini-1.1.296a3521.dev10}/src/upgini/autofe/operand.py +0 -0
- {upgini-1.1.296a3521.dev9 → upgini-1.1.296a3521.dev10}/src/upgini/autofe/unary.py +0 -0
- {upgini-1.1.296a3521.dev9 → upgini-1.1.296a3521.dev10}/src/upgini/autofe/vector.py +0 -0
- {upgini-1.1.296a3521.dev9 → upgini-1.1.296a3521.dev10}/src/upgini/data_source/__init__.py +0 -0
- {upgini-1.1.296a3521.dev9 → upgini-1.1.296a3521.dev10}/src/upgini/dataset.py +0 -0
- {upgini-1.1.296a3521.dev9 → upgini-1.1.296a3521.dev10}/src/upgini/errors.py +0 -0
- {upgini-1.1.296a3521.dev9 → upgini-1.1.296a3521.dev10}/src/upgini/http.py +0 -0
- {upgini-1.1.296a3521.dev9 → upgini-1.1.296a3521.dev10}/src/upgini/lazy_import.py +0 -0
- {upgini-1.1.296a3521.dev9 → upgini-1.1.296a3521.dev10}/src/upgini/mdc/__init__.py +0 -0
- {upgini-1.1.296a3521.dev9 → upgini-1.1.296a3521.dev10}/src/upgini/mdc/context.py +0 -0
- {upgini-1.1.296a3521.dev9 → upgini-1.1.296a3521.dev10}/src/upgini/metadata.py +0 -0
- {upgini-1.1.296a3521.dev9 → upgini-1.1.296a3521.dev10}/src/upgini/metrics.py +0 -0
- {upgini-1.1.296a3521.dev9 → upgini-1.1.296a3521.dev10}/src/upgini/normalizer/__init__.py +0 -0
- {upgini-1.1.296a3521.dev9 → upgini-1.1.296a3521.dev10}/src/upgini/normalizer/phone_normalizer.py +0 -0
- {upgini-1.1.296a3521.dev9 → upgini-1.1.296a3521.dev10}/src/upgini/resource_bundle/__init__.py +0 -0
- {upgini-1.1.296a3521.dev9 → upgini-1.1.296a3521.dev10}/src/upgini/resource_bundle/exceptions.py +0 -0
- {upgini-1.1.296a3521.dev9 → upgini-1.1.296a3521.dev10}/src/upgini/resource_bundle/strings.properties +0 -0
- {upgini-1.1.296a3521.dev9 → upgini-1.1.296a3521.dev10}/src/upgini/resource_bundle/strings_widget.properties +0 -0
- {upgini-1.1.296a3521.dev9 → upgini-1.1.296a3521.dev10}/src/upgini/sampler/__init__.py +0 -0
- {upgini-1.1.296a3521.dev9 → upgini-1.1.296a3521.dev10}/src/upgini/sampler/base.py +0 -0
- {upgini-1.1.296a3521.dev9 → upgini-1.1.296a3521.dev10}/src/upgini/sampler/random_under_sampler.py +0 -0
- {upgini-1.1.296a3521.dev9 → upgini-1.1.296a3521.dev10}/src/upgini/sampler/utils.py +0 -0
- {upgini-1.1.296a3521.dev9 → upgini-1.1.296a3521.dev10}/src/upgini/search_task.py +0 -0
- {upgini-1.1.296a3521.dev9 → upgini-1.1.296a3521.dev10}/src/upgini/spinner.py +0 -0
- {upgini-1.1.296a3521.dev9 → upgini-1.1.296a3521.dev10}/src/upgini/utils/__init__.py +0 -0
- {upgini-1.1.296a3521.dev9 → upgini-1.1.296a3521.dev10}/src/upgini/utils/base_search_key_detector.py +0 -0
- {upgini-1.1.296a3521.dev9 → upgini-1.1.296a3521.dev10}/src/upgini/utils/blocked_time_series.py +0 -0
- {upgini-1.1.296a3521.dev9 → upgini-1.1.296a3521.dev10}/src/upgini/utils/country_utils.py +0 -0
- {upgini-1.1.296a3521.dev9 → upgini-1.1.296a3521.dev10}/src/upgini/utils/custom_loss_utils.py +0 -0
- {upgini-1.1.296a3521.dev9 → upgini-1.1.296a3521.dev10}/src/upgini/utils/cv_utils.py +0 -0
- {upgini-1.1.296a3521.dev9 → upgini-1.1.296a3521.dev10}/src/upgini/utils/datetime_utils.py +0 -0
- {upgini-1.1.296a3521.dev9 → upgini-1.1.296a3521.dev10}/src/upgini/utils/deduplicate_utils.py +0 -0
- {upgini-1.1.296a3521.dev9 → upgini-1.1.296a3521.dev10}/src/upgini/utils/display_utils.py +0 -0
- {upgini-1.1.296a3521.dev9 → upgini-1.1.296a3521.dev10}/src/upgini/utils/email_utils.py +0 -0
- {upgini-1.1.296a3521.dev9 → upgini-1.1.296a3521.dev10}/src/upgini/utils/fallback_progress_bar.py +0 -0
- {upgini-1.1.296a3521.dev9 → upgini-1.1.296a3521.dev10}/src/upgini/utils/features_validator.py +0 -0
- {upgini-1.1.296a3521.dev9 → upgini-1.1.296a3521.dev10}/src/upgini/utils/format.py +0 -0
- {upgini-1.1.296a3521.dev9 → upgini-1.1.296a3521.dev10}/src/upgini/utils/ip_utils.py +0 -0
- {upgini-1.1.296a3521.dev9 → upgini-1.1.296a3521.dev10}/src/upgini/utils/phone_utils.py +0 -0
- {upgini-1.1.296a3521.dev9 → upgini-1.1.296a3521.dev10}/src/upgini/utils/postal_code_utils.py +0 -0
- {upgini-1.1.296a3521.dev9 → upgini-1.1.296a3521.dev10}/src/upgini/utils/progress_bar.py +0 -0
- {upgini-1.1.296a3521.dev9 → upgini-1.1.296a3521.dev10}/src/upgini/utils/sklearn_ext.py +0 -0
- {upgini-1.1.296a3521.dev9 → upgini-1.1.296a3521.dev10}/src/upgini/utils/target_utils.py +0 -0
- {upgini-1.1.296a3521.dev9 → upgini-1.1.296a3521.dev10}/src/upgini/utils/track_info.py +0 -0
- {upgini-1.1.296a3521.dev9 → upgini-1.1.296a3521.dev10}/src/upgini/utils/warning_counter.py +0 -0
- {upgini-1.1.296a3521.dev9 → upgini-1.1.296a3521.dev10}/src/upgini/version_validator.py +0 -0
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
Metadata-Version: 2.3
|
|
2
2
|
Name: upgini
|
|
3
|
-
Version: 1.1.296a3521.dev9
|
|
3
|
+
Version: 1.1.296a3521.dev10
|
|
4
4
|
Summary: Intelligent data search & enrichment for Machine Learning
|
|
5
5
|
Project-URL: Bug Reports, https://github.com/upgini/upgini/issues
|
|
6
6
|
Project-URL: Homepage, https://upgini.com/
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
__version__ = "1.1.296a3521.dev10"
|
|
@@ -146,7 +146,7 @@ class Feature:
|
|
|
146
146
|
elif shorten and not self.op.is_unary:
|
|
147
147
|
components = ["f_autofe", self.get_op_display_name()]
|
|
148
148
|
else:
|
|
149
|
-
components = ["f_" + "_f_".join(self.get_columns())] + [
|
|
149
|
+
components = ["f_" + "_f_".join(self.get_columns(**kwargs))] + [
|
|
150
150
|
"autofe",
|
|
151
151
|
self.get_op_display_name(),
|
|
152
152
|
]
|
|
@@ -59,9 +59,35 @@ class DataSourcePublisher:
|
|
|
59
59
|
features_for_embeddings: Optional[List[str]] = DEFAULT_GENERATE_EMBEDDINGS,
|
|
60
60
|
data_table_id_to_replace: Optional[str] = None,
|
|
61
61
|
keep_features: Optional[List[str]] = None,
|
|
62
|
+
date_features: Optional[List[str]] = None,
|
|
63
|
+
date_vector_features: Optional[List[str]] = None,
|
|
62
64
|
_force_generation=False,
|
|
63
65
|
_silent=False,
|
|
64
66
|
) -> str:
|
|
67
|
+
"""Register new ADS
|
|
68
|
+
|
|
69
|
+
Parameters
|
|
70
|
+
----------
|
|
71
|
+
data_table_uri - str - table name in format {project_id}.{datasource_name}.{table_name}
|
|
72
|
+
|
|
73
|
+
search_keys - dict with column names as keys and SearchKey as value
|
|
74
|
+
|
|
75
|
+
update_frequency - str - (Monthly, Weekly, Daily, Annually, Quarterly)
|
|
76
|
+
|
|
77
|
+
exclude_from_autofe_generation - optional list of features that should be excluded from AutoFE
|
|
78
|
+
|
|
79
|
+
secondary_search_keys - optional dict of secondary search keys
|
|
80
|
+
|
|
81
|
+
sort_column - optional str - name of unique column that could be used for sort
|
|
82
|
+
|
|
83
|
+
date_format - optional str - format of date if it is present in search keys
|
|
84
|
+
|
|
85
|
+
...
|
|
86
|
+
|
|
87
|
+
data_table_id_to_replace - optional str - id of registered ADS that should be replaced by new table
|
|
88
|
+
|
|
89
|
+
keep_features - optional list - features that should not be removed from ADS (even if they are personal)
|
|
90
|
+
"""
|
|
65
91
|
trace_id = str(uuid.uuid4())
|
|
66
92
|
|
|
67
93
|
with MDC(trace_id=trace_id):
|
|
@@ -124,6 +150,14 @@ class DataSourcePublisher:
|
|
|
124
150
|
request["excludeFromGeneration"] = exclude_from_autofe_generation
|
|
125
151
|
if keep_features is not None:
|
|
126
152
|
request["keepFeatures"] = keep_features
|
|
153
|
+
if date_features is not None:
|
|
154
|
+
if date_format is None:
|
|
155
|
+
raise ValidationError("date_format should be presented if you use date features")
|
|
156
|
+
request["dateFeatures"] = date_features
|
|
157
|
+
if date_vector_features is not None:
|
|
158
|
+
if date_format is None:
|
|
159
|
+
raise ValidationError("date_format should be presented if you use date vector features")
|
|
160
|
+
request["dateVectorFeatures"] = date_vector_features
|
|
127
161
|
self.logger.info(f"Start registering data table {request}")
|
|
128
162
|
|
|
129
163
|
task_id = self._rest_client.register_ads(request, trace_id)
|
|
@@ -181,6 +215,9 @@ class DataSourcePublisher:
|
|
|
181
215
|
msg = f"Data table successfully registered with id: {data_table_id}"
|
|
182
216
|
self.logger.info(msg)
|
|
183
217
|
print(msg)
|
|
218
|
+
if "warnings" in status_response and status_response["warnings"]:
|
|
219
|
+
self.logger.warning(status_response["warnings"])
|
|
220
|
+
print(status_response["warnings"])
|
|
184
221
|
return data_table_id
|
|
185
222
|
except KeyboardInterrupt:
|
|
186
223
|
if task_id is not None:
|
|
@@ -2870,7 +2870,7 @@ class FeaturesEnricher(TransformerMixin):
|
|
|
2870
2870
|
self.logger.info(f"Dates interval is ({min_date}, {max_date})")
|
|
2871
2871
|
|
|
2872
2872
|
except Exception:
|
|
2873
|
-
self.logger.
|
|
2873
|
+
self.logger.warning("Failed to log debug information", exc_info=True)
|
|
2874
2874
|
|
|
2875
2875
|
def __handle_index_search_keys(self, df: pd.DataFrame, search_keys: Dict[str, SearchKey]) -> pd.DataFrame:
|
|
2876
2876
|
index_names = df.index.names if df.index.names != [None] else [DEFAULT_INDEX]
|
|
@@ -1 +0,0 @@
|
|
|
1
|
-
__version__ = "1.1.296a3521.dev9"
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
{upgini-1.1.296a3521.dev9 → upgini-1.1.296a3521.dev10}/src/upgini/ads_management/__init__.py
RENAMED
|
File without changes
|
{upgini-1.1.296a3521.dev9 → upgini-1.1.296a3521.dev10}/src/upgini/ads_management/ads_manager.py
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
{upgini-1.1.296a3521.dev9 → upgini-1.1.296a3521.dev10}/src/upgini/normalizer/phone_normalizer.py
RENAMED
|
File without changes
|
{upgini-1.1.296a3521.dev9 → upgini-1.1.296a3521.dev10}/src/upgini/resource_bundle/__init__.py
RENAMED
|
File without changes
|
{upgini-1.1.296a3521.dev9 → upgini-1.1.296a3521.dev10}/src/upgini/resource_bundle/exceptions.py
RENAMED
|
File without changes
|
{upgini-1.1.296a3521.dev9 → upgini-1.1.296a3521.dev10}/src/upgini/resource_bundle/strings.properties
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
{upgini-1.1.296a3521.dev9 → upgini-1.1.296a3521.dev10}/src/upgini/sampler/random_under_sampler.py
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
{upgini-1.1.296a3521.dev9 → upgini-1.1.296a3521.dev10}/src/upgini/utils/base_search_key_detector.py
RENAMED
|
File without changes
|
{upgini-1.1.296a3521.dev9 → upgini-1.1.296a3521.dev10}/src/upgini/utils/blocked_time_series.py
RENAMED
|
File without changes
|
|
File without changes
|
{upgini-1.1.296a3521.dev9 → upgini-1.1.296a3521.dev10}/src/upgini/utils/custom_loss_utils.py
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
{upgini-1.1.296a3521.dev9 → upgini-1.1.296a3521.dev10}/src/upgini/utils/deduplicate_utils.py
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
{upgini-1.1.296a3521.dev9 → upgini-1.1.296a3521.dev10}/src/upgini/utils/fallback_progress_bar.py
RENAMED
|
File without changes
|
{upgini-1.1.296a3521.dev9 → upgini-1.1.296a3521.dev10}/src/upgini/utils/features_validator.py
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
{upgini-1.1.296a3521.dev9 → upgini-1.1.296a3521.dev10}/src/upgini/utils/postal_code_utils.py
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|