upgini 1.2.3__py3-none-any.whl → 1.2.4__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Potentially problematic release.
This version of upgini might be problematic. Click here for more details.
- upgini/__about__.py +1 -1
- upgini/__init__.py +8 -6
- {upgini-1.2.3.dist-info → upgini-1.2.4.dist-info}/METADATA +22 -9
- {upgini-1.2.3.dist-info → upgini-1.2.4.dist-info}/RECORD +6 -6
- {upgini-1.2.3.dist-info → upgini-1.2.4.dist-info}/WHEEL +0 -0
- {upgini-1.2.3.dist-info → upgini-1.2.4.dist-info}/licenses/LICENSE +0 -0
upgini/__about__.py
CHANGED
|
@@ -1 +1 @@
|
|
|
1
|
-
__version__ = "1.2.3"
|
|
1
|
+
__version__ = "1.2.4"
|
upgini/__init__.py
CHANGED
|
@@ -1,11 +1,13 @@
|
|
|
1
1
|
import os
|
|
2
2
|
|
|
3
|
-
from .lazy_import import LazyImport
|
|
3
|
+
from upgini.features_enricher import FeaturesEnricher # noqa: F401
|
|
4
|
+
from upgini.metadata import SearchKey, CVType, RuntimeParameters, ModelTaskType # noqa: F401
|
|
5
|
+
# from .lazy_import import LazyImport
|
|
4
6
|
|
|
5
7
|
os.environ["SETUPTOOLS_USE_DISTUTILS"] = "stdlib"
|
|
6
8
|
|
|
7
|
-
FeaturesEnricher = LazyImport("upgini.features_enricher", "FeaturesEnricher")
|
|
8
|
-
SearchKey = LazyImport("upgini.metadata", "SearchKey")
|
|
9
|
-
RuntimeParameters = LazyImport("upgini.metadata", "RuntimeParameters")
|
|
10
|
-
CVType = LazyImport("upgini.metadata", "CVType")
|
|
11
|
-
ModelTaskType = LazyImport("upgini.metadata", "ModelTaskType")
|
|
9
|
+
# FeaturesEnricher = LazyImport("upgini.features_enricher", "FeaturesEnricher")
|
|
10
|
+
# SearchKey = LazyImport("upgini.metadata", "SearchKey")
|
|
11
|
+
# RuntimeParameters = LazyImport("upgini.metadata", "RuntimeParameters")
|
|
12
|
+
# CVType = LazyImport("upgini.metadata", "CVType")
|
|
13
|
+
# ModelTaskType = LazyImport("upgini.metadata", "ModelTaskType")
|
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
Metadata-Version: 2.3
|
|
2
2
|
Name: upgini
|
|
3
|
-
Version: 1.2.3
|
|
3
|
+
Version: 1.2.4
|
|
4
4
|
Summary: Intelligent data search & enrichment for Machine Learning
|
|
5
5
|
Project-URL: Bug Reports, https://github.com/upgini/upgini/issues
|
|
6
6
|
Project-URL: Homepage, https://upgini.com/
|
|
@@ -260,7 +260,9 @@ We do dataset verification and cleaning under the hood, but still there are some
|
|
|
260
260
|
*Search keys* columns will be used to match records from all potential external data sources / features.
|
|
261
261
|
Define one or multiple columns as search keys with `FeaturesEnricher` class initialization.
|
|
262
262
|
```python
|
|
263
|
-
from upgini import FeaturesEnricher
|
|
263
|
+
from upgini.features_enricher import FeaturesEnricher
|
|
264
|
+
from upgini.metadata import SearchKey
|
|
265
|
+
|
|
264
266
|
enricher = FeaturesEnricher(
|
|
265
267
|
search_keys={
|
|
266
268
|
"subscription_activation_date": SearchKey.DATE,
|
|
@@ -346,7 +348,9 @@ enricher = FeaturesEnricher(
|
|
|
346
348
|
|
|
347
349
|
For the meaning types <tt>SearchKey.DATE</tt>/<tt>SearchKey.DATETIME</tt> with dtypes <tt>object</tt> or <tt>string</tt> you have to clarify date/datetime format by passing <tt>date_format</tt> parameter to `FeaturesEnricher`. For example:
|
|
348
350
|
```python
|
|
349
|
-
from upgini import FeaturesEnricher
|
|
351
|
+
from upgini.features_enricher import FeaturesEnricher
|
|
352
|
+
from upgini.metadata import SearchKey
|
|
353
|
+
|
|
350
354
|
enricher = FeaturesEnricher(
|
|
351
355
|
search_keys={
|
|
352
356
|
"subscription_activation_date": SearchKey.DATE,
|
|
@@ -367,7 +371,9 @@ df["date"] = df.date.astype("datetime64").dt.tz_localize("Europe/Warsaw")
|
|
|
367
371
|
|
|
368
372
|
Single country for the whole training dataset can be passed with `country_code` parameter:
|
|
369
373
|
```python
|
|
370
|
-
from upgini import FeaturesEnricher
|
|
374
|
+
from upgini.features_enricher import FeaturesEnricher
|
|
375
|
+
from upgini.metadata import SearchKey
|
|
376
|
+
|
|
371
377
|
enricher = FeaturesEnricher(
|
|
372
378
|
search_keys={
|
|
373
379
|
"subscription_activation_date": SearchKey.DATE,
|
|
@@ -386,7 +392,8 @@ Create instance of the `FeaturesEnricher` class and call:
|
|
|
386
392
|
Let's try it out!
|
|
387
393
|
```python
|
|
388
394
|
import pandas as pd
|
|
389
|
-
from upgini import FeaturesEnricher
|
|
395
|
+
from upgini.features_enricher import FeaturesEnricher
|
|
396
|
+
from upgini.metadata import SearchKey
|
|
390
397
|
|
|
391
398
|
# load labeled training dataset to initiate search
|
|
392
399
|
train_df = pd.read_csv("customer_churn_prediction_train.csv")
|
|
@@ -477,7 +484,9 @@ We detect ML task under the hood based on label column values. Currently we supp
|
|
|
477
484
|
|
|
478
485
|
But for certain search datasets you can pass parameter to `FeaturesEnricher` with correct ML task type:
|
|
479
486
|
```python
|
|
480
|
-
from upgini import
|
|
487
|
+
from upgini.features_enricher import FeaturesEnricher
|
|
488
|
+
from upgini.metadata import SearchKey, ModelTaskType
|
|
489
|
+
|
|
481
490
|
enricher = FeaturesEnricher(
|
|
482
491
|
search_keys={"subscription_activation_date": SearchKey.DATE},
|
|
483
492
|
model_task_type=ModelTaskType.REGRESSION
|
|
@@ -490,7 +499,9 @@ enricher = FeaturesEnricher(
|
|
|
490
499
|
|
|
491
500
|
To initiate feature search you can pass cross-validation type parameter to `FeaturesEnricher` with time series specific CV type:
|
|
492
501
|
```python
|
|
493
|
-
from upgini.
|
|
502
|
+
from upgini.features_enricher import FeaturesEnricher
|
|
503
|
+
from upgini.metadata import SearchKey, CVType
|
|
504
|
+
|
|
494
505
|
enricher = FeaturesEnricher(
|
|
495
506
|
search_keys={"sales_date": SearchKey.DATE},
|
|
496
507
|
cv=CVType.time_series
|
|
@@ -624,7 +635,9 @@ But you can easily define new split by passing child of BaseCrossValidator to pa
|
|
|
624
635
|
|
|
625
636
|
Example with more tips-and-tricks:
|
|
626
637
|
```python
|
|
627
|
-
from upgini import FeaturesEnricher
|
|
638
|
+
from upgini.features_enricher import FeaturesEnricher
|
|
639
|
+
from upgini.metadata import SearchKey
|
|
640
|
+
|
|
628
641
|
enricher = FeaturesEnricher(search_keys={"registration_date": SearchKey.DATE})
|
|
629
642
|
|
|
630
643
|
# Fit with default setup for metrics calculation
|
|
@@ -797,7 +810,7 @@ You may publish ANY data which you consider as royalty / license free ([Open Dat
|
|
|
797
810
|
2. Copy *Upgini API key* from profile and upload your data from Upgini python library with this key:
|
|
798
811
|
```python
|
|
799
812
|
import pandas as pd
|
|
800
|
-
from upgini import SearchKey
|
|
813
|
+
from upgini.metadata import SearchKey
|
|
801
814
|
from upgini.ads import upload_user_ads
|
|
802
815
|
import os
|
|
803
816
|
os.environ["UPGINI_API_KEY"] = "your_long_string_api_key_goes_here"
|
|
@@ -1,5 +1,5 @@
|
|
|
1
|
-
upgini/__about__.py,sha256=
|
|
2
|
-
upgini/__init__.py,sha256=
|
|
1
|
+
upgini/__about__.py,sha256=XBKH8E1LmDxv06U39yqMBbXZapOERFgICEDYZs_kRso,22
|
|
2
|
+
upgini/__init__.py,sha256=M64LwQTBa-5Jz24Zm2h8rWwlKQQ1J8nP7gGgIciS0WU,589
|
|
3
3
|
upgini/ads.py,sha256=nvuRxRx5MHDMgPr9SiU-fsqRdFaBv8p4_v1oqiysKpc,2714
|
|
4
4
|
upgini/dataset.py,sha256=olZ-OHSfBNoBSCo7R5t7uCLukI2nO7afpx_A-HCiJLk,31067
|
|
5
5
|
upgini/errors.py,sha256=2b_Wbo0OYhLUbrZqdLIx5jBnAsiD1Mcenh-VjR4HCTw,950
|
|
@@ -57,7 +57,7 @@ upgini/utils/sklearn_ext.py,sha256=13jQS_k7v0aUtudXV6nGUEWjttPQzAW9AFYL5wgEz9k,4
|
|
|
57
57
|
upgini/utils/target_utils.py,sha256=BVtDmrmFMKerSUWaNOIEdzsYHIFiODdpnWbE50QDPDc,7864
|
|
58
58
|
upgini/utils/track_info.py,sha256=G5Lu1xxakg2_TQjKZk4b5SvrHsATTXNVV3NbvWtT8k8,5663
|
|
59
59
|
upgini/utils/warning_counter.py,sha256=dIWBB4dI5XRRJZudvIlqlIYKEiwLLPcXarsZuYRt338,227
|
|
60
|
-
upgini-1.2.
|
|
61
|
-
upgini-1.2.
|
|
62
|
-
upgini-1.2.
|
|
63
|
-
upgini-1.2.
|
|
60
|
+
upgini-1.2.4.dist-info/METADATA,sha256=lkpbktCHJa5iZbdcK4ZSxKJgL_dGPYTyLcAT3t16ko0,48607
|
|
61
|
+
upgini-1.2.4.dist-info/WHEEL,sha256=1yFddiXMmvYK7QYTqtRNtX66WJ0Mz8PYEiEUoOUUxRY,87
|
|
62
|
+
upgini-1.2.4.dist-info/licenses/LICENSE,sha256=5RRzgvdJUu3BUDfv4bzVU6FqKgwHlIay63pPCSmSgzw,1514
|
|
63
|
+
upgini-1.2.4.dist-info/RECORD,,
|
|
File without changes
|
|
File without changes
|