upgini 1.2.2__py3-none-any.whl → 1.2.4__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.


This version of upgini might be problematic. Click here for more details.

upgini/__about__.py CHANGED
@@ -1 +1 @@
1
- __version__ = "1.2.2"
1
+ __version__ = "1.2.4"
upgini/__init__.py CHANGED
@@ -1,11 +1,13 @@
1
1
  import os
2
2
 
3
- from .lazy_import import LazyImport
3
+ from upgini.features_enricher import FeaturesEnricher # noqa: F401
4
+ from upgini.metadata import SearchKey, CVType, RuntimeParameters, ModelTaskType # noqa: F401
5
+ # from .lazy_import import LazyImport
4
6
 
5
7
  os.environ["SETUPTOOLS_USE_DISTUTILS"] = "stdlib"
6
8
 
7
- FeaturesEnricher = LazyImport("upgini.features_enricher", "FeaturesEnricher")
8
- SearchKey = LazyImport("upgini.metadata", "SearchKey")
9
- RuntimeParameters = LazyImport("upgini.metadata", "RuntimeParameters")
10
- CVType = LazyImport("upgini.metadata", "CVType")
11
- ModelTaskType = LazyImport("upgini.metadata", "ModelTaskType")
9
+ # FeaturesEnricher = LazyImport("upgini.features_enricher", "FeaturesEnricher")
10
+ # SearchKey = LazyImport("upgini.metadata", "SearchKey")
11
+ # RuntimeParameters = LazyImport("upgini.metadata", "RuntimeParameters")
12
+ # CVType = LazyImport("upgini.metadata", "CVType")
13
+ # ModelTaskType = LazyImport("upgini.metadata", "ModelTaskType")
upgini/autofe/unary.py CHANGED
@@ -136,7 +136,7 @@ class Norm(PandasOperand):
136
136
  def set_params(self, params: Dict[str, str]):
137
137
  super().set_params(params)
138
138
  if params is not None and "norm" in params:
139
- self.norm = params["norm"]
139
+ self.norm = float(params["norm"])
140
140
  return self
141
141
 
142
142
  def get_params(self) -> Dict[str, Optional[str]]:
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.3
2
2
  Name: upgini
3
- Version: 1.2.2
3
+ Version: 1.2.4
4
4
  Summary: Intelligent data search & enrichment for Machine Learning
5
5
  Project-URL: Bug Reports, https://github.com/upgini/upgini/issues
6
6
  Project-URL: Homepage, https://upgini.com/
@@ -260,7 +260,9 @@ We do dataset verification and cleaning under the hood, but still there are some
260
260
  *Search keys* columns will be used to match records from all potential external data sources / features.
261
261
  Define one or more columns as search keys when initializing the `FeaturesEnricher` class.
262
262
  ```python
263
- from upgini import FeaturesEnricher, SearchKey
263
+ from upgini.features_enricher import FeaturesEnricher
264
+ from upgini.metadata import SearchKey
265
+
264
266
  enricher = FeaturesEnricher(
265
267
  search_keys={
266
268
  "subscription_activation_date": SearchKey.DATE,
@@ -346,7 +348,9 @@ enricher = FeaturesEnricher(
346
348
 
347
349
  For the meaning types <tt>SearchKey.DATE</tt>/<tt>SearchKey.DATETIME</tt> with dtypes <tt>object</tt> or <tt>string</tt>, you have to specify the date/datetime format by passing the <tt>date_format</tt> parameter to `FeaturesEnricher`. For example:
348
350
  ```python
349
- from upgini import FeaturesEnricher, SearchKey
351
+ from upgini.features_enricher import FeaturesEnricher
352
+ from upgini.metadata import SearchKey
353
+
350
354
  enricher = FeaturesEnricher(
351
355
  search_keys={
352
356
  "subscription_activation_date": SearchKey.DATE,
@@ -367,7 +371,9 @@ df["date"] = df.date.astype("datetime64").dt.tz_localize("Europe/Warsaw")
367
371
 
368
372
  A single country for the whole training dataset can be passed with the `country_code` parameter:
369
373
  ```python
370
- from upgini import FeaturesEnricher, SearchKey
374
+ from upgini.features_enricher import FeaturesEnricher
375
+ from upgini.metadata import SearchKey
376
+
371
377
  enricher = FeaturesEnricher(
372
378
  search_keys={
373
379
  "subscription_activation_date": SearchKey.DATE,
@@ -386,7 +392,8 @@ Create instance of the `FeaturesEnricher` class and call:
386
392
  Let's try it out!
387
393
  ```python
388
394
  import pandas as pd
389
- from upgini import FeaturesEnricher, SearchKey
395
+ from upgini.features_enricher import FeaturesEnricher
396
+ from upgini.metadata import SearchKey
390
397
 
391
398
  # load labeled training dataset to initiate search
392
399
  train_df = pd.read_csv("customer_churn_prediction_train.csv")
@@ -477,7 +484,9 @@ We detect ML task under the hood based on label column values. Currently we supp
477
484
 
478
485
  But for certain search datasets you can pass a parameter to `FeaturesEnricher` with the correct ML task type:
479
486
  ```python
480
- from upgini import ModelTaskType
487
+ from upgini.features_enricher import FeaturesEnricher
488
+ from upgini.metadata import SearchKey, ModelTaskType
489
+
481
490
  enricher = FeaturesEnricher(
482
491
  search_keys={"subscription_activation_date": SearchKey.DATE},
483
492
  model_task_type=ModelTaskType.REGRESSION
@@ -490,7 +499,9 @@ enricher = FeaturesEnricher(
490
499
 
491
500
  To initiate a feature search, you can pass the cross-validation type parameter to `FeaturesEnricher` with a time-series-specific CV type:
492
501
  ```python
493
- from upgini.metadata import CVType
502
+ from upgini.features_enricher import FeaturesEnricher
503
+ from upgini.metadata import SearchKey, CVType
504
+
494
505
  enricher = FeaturesEnricher(
495
506
  search_keys={"sales_date": SearchKey.DATE},
496
507
  cv=CVType.time_series
@@ -624,7 +635,9 @@ But you can easily define new split by passing child of BaseCrossValidator to pa
624
635
 
625
636
  Example with more tips-and-tricks:
626
637
  ```python
627
- from upgini import FeaturesEnricher, SearchKey
638
+ from upgini.features_enricher import FeaturesEnricher
639
+ from upgini.metadata import SearchKey
640
+
628
641
  enricher = FeaturesEnricher(search_keys={"registration_date": SearchKey.DATE})
629
642
 
630
643
  # Fit with default setup for metrics calculation
@@ -797,7 +810,7 @@ You may publish ANY data which you consider as royalty / license free ([Open Dat
797
810
  2. Copy *Upgini API key* from profile and upload your data from Upgini python library with this key:
798
811
  ```python
799
812
  import pandas as pd
800
- from upgini import SearchKey
813
+ from upgini.metadata import SearchKey
801
814
  from upgini.ads import upload_user_ads
802
815
  import os
803
816
  os.environ["UPGINI_API_KEY"] = "your_long_string_api_key_goes_here"
@@ -1,5 +1,5 @@
1
- upgini/__about__.py,sha256=uuf4VNtTNA93fMhoAur9YafzaKJFnczY-H1SSCSuRVQ,22
2
- upgini/__init__.py,sha256=Xs0YFVBu1KUdtZzbStGRPQtLt3YLzJnjx5nIUBlX8BE,415
1
+ upgini/__about__.py,sha256=XBKH8E1LmDxv06U39yqMBbXZapOERFgICEDYZs_kRso,22
2
+ upgini/__init__.py,sha256=M64LwQTBa-5Jz24Zm2h8rWwlKQQ1J8nP7gGgIciS0WU,589
3
3
  upgini/ads.py,sha256=nvuRxRx5MHDMgPr9SiU-fsqRdFaBv8p4_v1oqiysKpc,2714
4
4
  upgini/dataset.py,sha256=olZ-OHSfBNoBSCo7R5t7uCLukI2nO7afpx_A-HCiJLk,31067
5
5
  upgini/errors.py,sha256=2b_Wbo0OYhLUbrZqdLIx5jBnAsiD1Mcenh-VjR4HCTw,950
@@ -20,7 +20,7 @@ upgini/autofe/date.py,sha256=OpFc3Al0xO3qlESn2Uokfxw51ArVqmh3xngWwdrsaqE,9762
20
20
  upgini/autofe/feature.py,sha256=gwGWY2UcX_0wHAvfEiu1rRU7GFZyzMWZIaPVcf6kD80,14223
21
21
  upgini/autofe/groupby.py,sha256=r-xl_keZZgm_tpiEoDhjYSkT6NHv7a4cRQR4wJ4uCp8,3263
22
22
  upgini/autofe/operand.py,sha256=uk883RaNqgXqtkaRqA1re1d9OFnnpv0JVvelYx09Yw0,2943
23
- upgini/autofe/unary.py,sha256=aMKgsitM_SnaJWzGfcberTJaqwG7yzAJBkAfsei8pPM,4545
23
+ upgini/autofe/unary.py,sha256=LFtjgL4yU_n062QOm9ZHXPa_Vz-c0BaGWqUeJt_EaL0,4552
24
24
  upgini/autofe/vector.py,sha256=ehcZUDqV71TfbU8EmKfdYp603gS2dJY_-fpr10ho5sI,663
25
25
  upgini/data_source/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
26
26
  upgini/data_source/data_source_publisher.py,sha256=Vg0biG86YB0OEaoxbK9YYrr4yARm11_h3bTWIBgoScA,22115
@@ -57,7 +57,7 @@ upgini/utils/sklearn_ext.py,sha256=13jQS_k7v0aUtudXV6nGUEWjttPQzAW9AFYL5wgEz9k,4
57
57
  upgini/utils/target_utils.py,sha256=BVtDmrmFMKerSUWaNOIEdzsYHIFiODdpnWbE50QDPDc,7864
58
58
  upgini/utils/track_info.py,sha256=G5Lu1xxakg2_TQjKZk4b5SvrHsATTXNVV3NbvWtT8k8,5663
59
59
  upgini/utils/warning_counter.py,sha256=dIWBB4dI5XRRJZudvIlqlIYKEiwLLPcXarsZuYRt338,227
60
- upgini-1.2.2.dist-info/METADATA,sha256=ebR2S_ee9oODpdVzWouTsjnliU8Cea_hO81mgyebyiE,48228
61
- upgini-1.2.2.dist-info/WHEEL,sha256=1yFddiXMmvYK7QYTqtRNtX66WJ0Mz8PYEiEUoOUUxRY,87
62
- upgini-1.2.2.dist-info/licenses/LICENSE,sha256=5RRzgvdJUu3BUDfv4bzVU6FqKgwHlIay63pPCSmSgzw,1514
63
- upgini-1.2.2.dist-info/RECORD,,
60
+ upgini-1.2.4.dist-info/METADATA,sha256=lkpbktCHJa5iZbdcK4ZSxKJgL_dGPYTyLcAT3t16ko0,48607
61
+ upgini-1.2.4.dist-info/WHEEL,sha256=1yFddiXMmvYK7QYTqtRNtX66WJ0Mz8PYEiEUoOUUxRY,87
62
+ upgini-1.2.4.dist-info/licenses/LICENSE,sha256=5RRzgvdJUu3BUDfv4bzVU6FqKgwHlIay63pPCSmSgzw,1514
63
+ upgini-1.2.4.dist-info/RECORD,,
File without changes