upgini 1.2.140a4063.dev2__py3-none-any.whl → 1.2.142__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Potentially problematic release.
This version of upgini might be problematic. Click here for more details.
- upgini/__about__.py +1 -1
- upgini/dataset.py +8 -0
- upgini/features_enricher.py +503 -560
- upgini/metadata.py +2 -1
- upgini/normalizer/normalize_utils.py +1 -1
- upgini/resource_bundle/strings.properties +10 -9
- upgini/utils/datetime_utils.py +7 -4
- {upgini-1.2.140a4063.dev2.dist-info → upgini-1.2.142.dist-info}/METADATA +2 -2
- {upgini-1.2.140a4063.dev2.dist-info → upgini-1.2.142.dist-info}/RECORD +11 -11
- {upgini-1.2.140a4063.dev2.dist-info → upgini-1.2.142.dist-info}/WHEEL +1 -1
- {upgini-1.2.140a4063.dev2.dist-info → upgini-1.2.142.dist-info}/licenses/LICENSE +0 -0
upgini/__about__.py
CHANGED
|
@@ -1 +1 @@
|
|
|
1
|
-
__version__ = "1.2.140a4063.dev2"
|
|
1
|
+
__version__ = "1.2.142"
|
upgini/dataset.py
CHANGED
|
@@ -36,6 +36,7 @@ from upgini.metadata import (
|
|
|
36
36
|
NumericInterval,
|
|
37
37
|
RuntimeParameters,
|
|
38
38
|
SearchCustomization,
|
|
39
|
+
SearchKey,
|
|
39
40
|
)
|
|
40
41
|
from upgini.resource_bundle import ResourceBundle, get_custom_bundle
|
|
41
42
|
from upgini.search_task import SearchTask
|
|
@@ -76,6 +77,7 @@ class Dataset:
|
|
|
76
77
|
id_columns: Optional[List[str]] = None,
|
|
77
78
|
is_imbalanced: bool = False,
|
|
78
79
|
dropped_columns: Optional[List[str]] = None,
|
|
80
|
+
autodetected_search_keys: Optional[Dict[str, SearchKey]] = None,
|
|
79
81
|
random_state: Optional[int] = None,
|
|
80
82
|
sample_config: Optional[SampleConfig] = None,
|
|
81
83
|
rest_client: Optional[_RestClient] = None,
|
|
@@ -124,6 +126,7 @@ class Dataset:
|
|
|
124
126
|
self.id_columns = id_columns
|
|
125
127
|
self.is_imbalanced = is_imbalanced
|
|
126
128
|
self.dropped_columns = dropped_columns
|
|
129
|
+
self.autodetected_search_keys = autodetected_search_keys
|
|
127
130
|
self.date_column = date_column
|
|
128
131
|
if logger is not None:
|
|
129
132
|
self.logger = logger
|
|
@@ -500,6 +503,10 @@ class Dataset:
|
|
|
500
503
|
|
|
501
504
|
deterministic_digest = file_hash(parquet_file_path)
|
|
502
505
|
|
|
506
|
+
autodetected_search_keys = (
|
|
507
|
+
{k: v.name for k, v in self.autodetected_search_keys.items()} if self.autodetected_search_keys else None
|
|
508
|
+
)
|
|
509
|
+
|
|
503
510
|
return FileMetadata(
|
|
504
511
|
name=self.dataset_name,
|
|
505
512
|
description=self.description,
|
|
@@ -510,6 +517,7 @@ class Dataset:
|
|
|
510
517
|
hierarchicalSubgroupKeys=self.hierarchical_subgroup_keys,
|
|
511
518
|
taskType=self.task_type,
|
|
512
519
|
droppedColumns=self.dropped_columns,
|
|
520
|
+
autodetectedSearchKeys=autodetected_search_keys,
|
|
513
521
|
deterministicDigest=deterministic_digest,
|
|
514
522
|
)
|
|
515
523
|
|