upgini 1.2.140a4063.dev2__tar.gz → 1.2.142a1__tar.gz
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- {upgini-1.2.140a4063.dev2 → upgini-1.2.142a1}/PKG-INFO +2 -2
- upgini-1.2.142a1/src/upgini/__about__.py +1 -0
- {upgini-1.2.140a4063.dev2 → upgini-1.2.142a1}/src/upgini/dataset.py +8 -0
- {upgini-1.2.140a4063.dev2 → upgini-1.2.142a1}/src/upgini/features_enricher.py +502 -560
- {upgini-1.2.140a4063.dev2 → upgini-1.2.142a1}/src/upgini/metadata.py +2 -1
- {upgini-1.2.140a4063.dev2 → upgini-1.2.142a1}/src/upgini/normalizer/normalize_utils.py +1 -1
- {upgini-1.2.140a4063.dev2 → upgini-1.2.142a1}/src/upgini/resource_bundle/strings.properties +10 -9
- upgini-1.2.140a4063.dev2/src/upgini/__about__.py +0 -1
- {upgini-1.2.140a4063.dev2 → upgini-1.2.142a1}/.gitignore +0 -0
- {upgini-1.2.140a4063.dev2 → upgini-1.2.142a1}/LICENSE +0 -0
- {upgini-1.2.140a4063.dev2 → upgini-1.2.142a1}/README.md +0 -0
- {upgini-1.2.140a4063.dev2 → upgini-1.2.142a1}/pyproject.toml +0 -0
- {upgini-1.2.140a4063.dev2 → upgini-1.2.142a1}/src/upgini/__init__.py +0 -0
- {upgini-1.2.140a4063.dev2 → upgini-1.2.142a1}/src/upgini/ads.py +0 -0
- {upgini-1.2.140a4063.dev2 → upgini-1.2.142a1}/src/upgini/ads_management/__init__.py +0 -0
- {upgini-1.2.140a4063.dev2 → upgini-1.2.142a1}/src/upgini/ads_management/ads_manager.py +0 -0
- {upgini-1.2.140a4063.dev2 → upgini-1.2.142a1}/src/upgini/autofe/__init__.py +0 -0
- {upgini-1.2.140a4063.dev2 → upgini-1.2.142a1}/src/upgini/autofe/all_operators.py +0 -0
- {upgini-1.2.140a4063.dev2 → upgini-1.2.142a1}/src/upgini/autofe/binary.py +0 -0
- {upgini-1.2.140a4063.dev2 → upgini-1.2.142a1}/src/upgini/autofe/date.py +0 -0
- {upgini-1.2.140a4063.dev2 → upgini-1.2.142a1}/src/upgini/autofe/feature.py +0 -0
- {upgini-1.2.140a4063.dev2 → upgini-1.2.142a1}/src/upgini/autofe/groupby.py +0 -0
- {upgini-1.2.140a4063.dev2 → upgini-1.2.142a1}/src/upgini/autofe/operator.py +0 -0
- {upgini-1.2.140a4063.dev2 → upgini-1.2.142a1}/src/upgini/autofe/timeseries/__init__.py +0 -0
- {upgini-1.2.140a4063.dev2 → upgini-1.2.142a1}/src/upgini/autofe/timeseries/base.py +0 -0
- {upgini-1.2.140a4063.dev2 → upgini-1.2.142a1}/src/upgini/autofe/timeseries/cross.py +0 -0
- {upgini-1.2.140a4063.dev2 → upgini-1.2.142a1}/src/upgini/autofe/timeseries/delta.py +0 -0
- {upgini-1.2.140a4063.dev2 → upgini-1.2.142a1}/src/upgini/autofe/timeseries/lag.py +0 -0
- {upgini-1.2.140a4063.dev2 → upgini-1.2.142a1}/src/upgini/autofe/timeseries/roll.py +0 -0
- {upgini-1.2.140a4063.dev2 → upgini-1.2.142a1}/src/upgini/autofe/timeseries/trend.py +0 -0
- {upgini-1.2.140a4063.dev2 → upgini-1.2.142a1}/src/upgini/autofe/timeseries/volatility.py +0 -0
- {upgini-1.2.140a4063.dev2 → upgini-1.2.142a1}/src/upgini/autofe/unary.py +0 -0
- {upgini-1.2.140a4063.dev2 → upgini-1.2.142a1}/src/upgini/autofe/utils.py +0 -0
- {upgini-1.2.140a4063.dev2 → upgini-1.2.142a1}/src/upgini/autofe/vector.py +0 -0
- {upgini-1.2.140a4063.dev2 → upgini-1.2.142a1}/src/upgini/data_source/__init__.py +0 -0
- {upgini-1.2.140a4063.dev2 → upgini-1.2.142a1}/src/upgini/data_source/data_source_publisher.py +0 -0
- {upgini-1.2.140a4063.dev2 → upgini-1.2.142a1}/src/upgini/errors.py +0 -0
- {upgini-1.2.140a4063.dev2 → upgini-1.2.142a1}/src/upgini/http.py +0 -0
- {upgini-1.2.140a4063.dev2 → upgini-1.2.142a1}/src/upgini/mdc/__init__.py +0 -0
- {upgini-1.2.140a4063.dev2 → upgini-1.2.142a1}/src/upgini/mdc/context.py +0 -0
- {upgini-1.2.140a4063.dev2 → upgini-1.2.142a1}/src/upgini/metrics.py +0 -0
- {upgini-1.2.140a4063.dev2 → upgini-1.2.142a1}/src/upgini/normalizer/__init__.py +0 -0
- {upgini-1.2.140a4063.dev2 → upgini-1.2.142a1}/src/upgini/resource_bundle/__init__.py +0 -0
- {upgini-1.2.140a4063.dev2 → upgini-1.2.142a1}/src/upgini/resource_bundle/exceptions.py +0 -0
- {upgini-1.2.140a4063.dev2 → upgini-1.2.142a1}/src/upgini/resource_bundle/strings_widget.properties +0 -0
- {upgini-1.2.140a4063.dev2 → upgini-1.2.142a1}/src/upgini/sampler/__init__.py +0 -0
- {upgini-1.2.140a4063.dev2 → upgini-1.2.142a1}/src/upgini/sampler/base.py +0 -0
- {upgini-1.2.140a4063.dev2 → upgini-1.2.142a1}/src/upgini/sampler/random_under_sampler.py +0 -0
- {upgini-1.2.140a4063.dev2 → upgini-1.2.142a1}/src/upgini/sampler/utils.py +0 -0
- {upgini-1.2.140a4063.dev2 → upgini-1.2.142a1}/src/upgini/search_task.py +0 -0
- {upgini-1.2.140a4063.dev2 → upgini-1.2.142a1}/src/upgini/spinner.py +0 -0
- {upgini-1.2.140a4063.dev2 → upgini-1.2.142a1}/src/upgini/utils/Roboto-Regular.ttf +0 -0
- {upgini-1.2.140a4063.dev2 → upgini-1.2.142a1}/src/upgini/utils/__init__.py +0 -0
- {upgini-1.2.140a4063.dev2 → upgini-1.2.142a1}/src/upgini/utils/base_search_key_detector.py +0 -0
- {upgini-1.2.140a4063.dev2 → upgini-1.2.142a1}/src/upgini/utils/blocked_time_series.py +0 -0
- {upgini-1.2.140a4063.dev2 → upgini-1.2.142a1}/src/upgini/utils/config.py +0 -0
- {upgini-1.2.140a4063.dev2 → upgini-1.2.142a1}/src/upgini/utils/country_utils.py +0 -0
- {upgini-1.2.140a4063.dev2 → upgini-1.2.142a1}/src/upgini/utils/custom_loss_utils.py +0 -0
- {upgini-1.2.140a4063.dev2 → upgini-1.2.142a1}/src/upgini/utils/cv_utils.py +0 -0
- {upgini-1.2.140a4063.dev2 → upgini-1.2.142a1}/src/upgini/utils/datetime_utils.py +0 -0
- {upgini-1.2.140a4063.dev2 → upgini-1.2.142a1}/src/upgini/utils/deduplicate_utils.py +0 -0
- {upgini-1.2.140a4063.dev2 → upgini-1.2.142a1}/src/upgini/utils/display_utils.py +0 -0
- {upgini-1.2.140a4063.dev2 → upgini-1.2.142a1}/src/upgini/utils/email_utils.py +0 -0
- {upgini-1.2.140a4063.dev2 → upgini-1.2.142a1}/src/upgini/utils/fallback_progress_bar.py +0 -0
- {upgini-1.2.140a4063.dev2 → upgini-1.2.142a1}/src/upgini/utils/feature_info.py +0 -0
- {upgini-1.2.140a4063.dev2 → upgini-1.2.142a1}/src/upgini/utils/features_validator.py +0 -0
- {upgini-1.2.140a4063.dev2 → upgini-1.2.142a1}/src/upgini/utils/format.py +0 -0
- {upgini-1.2.140a4063.dev2 → upgini-1.2.142a1}/src/upgini/utils/hash_utils.py +0 -0
- {upgini-1.2.140a4063.dev2 → upgini-1.2.142a1}/src/upgini/utils/ip_utils.py +0 -0
- {upgini-1.2.140a4063.dev2 → upgini-1.2.142a1}/src/upgini/utils/mstats.py +0 -0
- {upgini-1.2.140a4063.dev2 → upgini-1.2.142a1}/src/upgini/utils/phone_utils.py +0 -0
- {upgini-1.2.140a4063.dev2 → upgini-1.2.142a1}/src/upgini/utils/postal_code_utils.py +0 -0
- {upgini-1.2.140a4063.dev2 → upgini-1.2.142a1}/src/upgini/utils/progress_bar.py +0 -0
- {upgini-1.2.140a4063.dev2 → upgini-1.2.142a1}/src/upgini/utils/psi.py +0 -0
- {upgini-1.2.140a4063.dev2 → upgini-1.2.142a1}/src/upgini/utils/sample_utils.py +0 -0
- {upgini-1.2.140a4063.dev2 → upgini-1.2.142a1}/src/upgini/utils/sklearn_ext.py +0 -0
- {upgini-1.2.140a4063.dev2 → upgini-1.2.142a1}/src/upgini/utils/sort.py +0 -0
- {upgini-1.2.140a4063.dev2 → upgini-1.2.142a1}/src/upgini/utils/target_utils.py +0 -0
- {upgini-1.2.140a4063.dev2 → upgini-1.2.142a1}/src/upgini/utils/track_info.py +0 -0
- {upgini-1.2.140a4063.dev2 → upgini-1.2.142a1}/src/upgini/utils/ts_utils.py +0 -0
- {upgini-1.2.140a4063.dev2 → upgini-1.2.142a1}/src/upgini/utils/warning_counter.py +0 -0
- {upgini-1.2.140a4063.dev2 → upgini-1.2.142a1}/src/upgini/version_validator.py +0 -0
|
@@ -1,6 +1,6 @@
|
|
|
1
|
-
Metadata-Version: 2.
|
|
1
|
+
Metadata-Version: 2.4
|
|
2
2
|
Name: upgini
|
|
3
|
-
Version: 1.2.140a4063.dev2
|
|
3
|
+
Version: 1.2.142a1
|
|
4
4
|
Summary: Intelligent data search & enrichment for Machine Learning
|
|
5
5
|
Project-URL: Bug Reports, https://github.com/upgini/upgini/issues
|
|
6
6
|
Project-URL: Homepage, https://upgini.com/
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
__version__ = "1.2.142a1"
|
|
@@ -36,6 +36,7 @@ from upgini.metadata import (
|
|
|
36
36
|
NumericInterval,
|
|
37
37
|
RuntimeParameters,
|
|
38
38
|
SearchCustomization,
|
|
39
|
+
SearchKey,
|
|
39
40
|
)
|
|
40
41
|
from upgini.resource_bundle import ResourceBundle, get_custom_bundle
|
|
41
42
|
from upgini.search_task import SearchTask
|
|
@@ -76,6 +77,7 @@ class Dataset:
|
|
|
76
77
|
id_columns: Optional[List[str]] = None,
|
|
77
78
|
is_imbalanced: bool = False,
|
|
78
79
|
dropped_columns: Optional[List[str]] = None,
|
|
80
|
+
autodetected_search_keys: Optional[Dict[str, SearchKey]] = None,
|
|
79
81
|
random_state: Optional[int] = None,
|
|
80
82
|
sample_config: Optional[SampleConfig] = None,
|
|
81
83
|
rest_client: Optional[_RestClient] = None,
|
|
@@ -124,6 +126,7 @@ class Dataset:
|
|
|
124
126
|
self.id_columns = id_columns
|
|
125
127
|
self.is_imbalanced = is_imbalanced
|
|
126
128
|
self.dropped_columns = dropped_columns
|
|
129
|
+
self.autodetected_search_keys = autodetected_search_keys
|
|
127
130
|
self.date_column = date_column
|
|
128
131
|
if logger is not None:
|
|
129
132
|
self.logger = logger
|
|
@@ -500,6 +503,10 @@ class Dataset:
|
|
|
500
503
|
|
|
501
504
|
deterministic_digest = file_hash(parquet_file_path)
|
|
502
505
|
|
|
506
|
+
autodetected_search_keys = (
|
|
507
|
+
{k: v.name for k, v in self.autodetected_search_keys.items()} if self.autodetected_search_keys else None
|
|
508
|
+
)
|
|
509
|
+
|
|
503
510
|
return FileMetadata(
|
|
504
511
|
name=self.dataset_name,
|
|
505
512
|
description=self.description,
|
|
@@ -510,6 +517,7 @@ class Dataset:
|
|
|
510
517
|
hierarchicalSubgroupKeys=self.hierarchical_subgroup_keys,
|
|
511
518
|
taskType=self.task_type,
|
|
512
519
|
droppedColumns=self.dropped_columns,
|
|
520
|
+
autodetectedSearchKeys=autodetected_search_keys,
|
|
513
521
|
deterministicDigest=deterministic_digest,
|
|
514
522
|
)
|
|
515
523
|
|