upgini 1.2.111__py3-none-any.whl → 1.2.113__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
upgini/__about__.py CHANGED
@@ -1 +1 @@
1
- __version__ = "1.2.111"
1
+ __version__ = "1.2.113"
upgini/autofe/date.py CHANGED
@@ -244,7 +244,8 @@ class DateListDiffBounded(DateListDiff, ParametrizedOperator):
244
244
 
245
245
  class DatePercentileBase(PandasOperator, abc.ABC):
246
246
  is_binary: bool = True
247
- output_type: Optional[str] = "float"
247
+ is_categorical: bool = True
248
+ output_type: Optional[str] = "category"
248
249
 
249
250
  date_unit: Optional[str] = None
250
251
 
@@ -254,7 +255,12 @@ class DatePercentileBase(PandasOperator, abc.ABC):
254
255
 
255
256
  bounds = self._get_bounds(left)
256
257
 
257
- return right.index.to_series().apply(lambda i: self._perc(right[i], bounds[i]))
258
+ return (
259
+ right.index.to_series()
260
+ .apply(lambda i: self._perc(right[i], bounds[i]))
261
+ .astype(pd.Int64Dtype())
262
+ .astype("category")
263
+ )
258
264
 
259
265
  @abc.abstractmethod
260
266
  def _get_bounds(self, date_col: pd.Series) -> pd.Series:
upgini/dataset.py CHANGED
@@ -50,7 +50,7 @@ except Exception:
50
50
 
51
51
  class Dataset:
52
52
  MIN_ROWS_COUNT = 100
53
- MAX_ROWS = 200_000
53
+ MAX_ROWS = 100_000
54
54
  IMBALANCE_THESHOLD = 0.6
55
55
  MIN_TARGET_CLASS_ROWS = 100
56
56
  MAX_MULTICLASS_CLASS_COUNT = 100
@@ -22,10 +22,10 @@ MULTICLASS_MIN_SAMPLE_THRESHOLD = 25_000
22
22
  BINARY_BOOTSTRAP_LOOPS = 5
23
23
  MULTICLASS_BOOTSTRAP_LOOPS = 2
24
24
 
25
- FIT_SAMPLE_THRESHOLD = 200_000
26
- FIT_SAMPLE_ROWS = 200_000
27
- FIT_SAMPLE_ROWS_WITH_EVAL_SET = 200_000
28
- FIT_SAMPLE_THRESHOLD_WITH_EVAL_SET = 200_000
25
+ FIT_SAMPLE_THRESHOLD = 100_000
26
+ FIT_SAMPLE_ROWS = 100_000
27
+ FIT_SAMPLE_ROWS_WITH_EVAL_SET = 100_000
28
+ FIT_SAMPLE_THRESHOLD_WITH_EVAL_SET = 100_000
29
29
 
30
30
 
31
31
  @dataclass
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.3
2
2
  Name: upgini
3
- Version: 1.2.111
3
+ Version: 1.2.113
4
4
  Summary: Intelligent data search & enrichment for Machine Learning
5
5
  Project-URL: Bug Reports, https://github.com/upgini/upgini/issues
6
6
  Project-URL: Homepage, https://upgini.com/
@@ -874,7 +874,7 @@ Some convenient ways to start contributing are:
874
874
  ⚙️ **Gitpod** [![Gitpod Ready-to-Code](https://img.shields.io/badge/Gitpod-Ready--to--Code-blue?logo=gitpod)](https://gitpod.io/#https://github.com/upgini/upgini) You can use Gitpod to launch a fully functional development environment right in your browser.
875
875
 
876
876
  ## 🔗 Useful links
877
- - [Simple sales predictions as a template notebook](#-simple-sales-predictions-use-as-a-template)
877
+ - [Simple sales predictions as a template notebook](#-simple-sales-prediction-for-retail-stores)
878
878
  - [Full list of Kaggle Guides & Examples](https://www.kaggle.com/romaupgini/code)
879
879
  - [Project on PyPI](https://pypi.org/project/upgini)
880
880
  - [More perks for registered users](https://profile.upgini.com)
@@ -1,7 +1,7 @@
1
- upgini/__about__.py,sha256=4KgOTmI-DrbwzTYsi8NTo4T_nHot9MIavj4EH29sgYA,24
1
+ upgini/__about__.py,sha256=kaFCe2X7oNqZHww74j5Dd4YV4nG48zI57948z7H1dl4,24
2
2
  upgini/__init__.py,sha256=LXSfTNU0HnlOkE69VCxkgIKDhWP-JFo_eBQ71OxTr5Y,261
3
3
  upgini/ads.py,sha256=nvuRxRx5MHDMgPr9SiU-fsqRdFaBv8p4_v1oqiysKpc,2714
4
- upgini/dataset.py,sha256=e6JDYTZ2AwC5aF-dqclKZKkiKrHo2f6cFmMQO2ZZmjM,32724
4
+ upgini/dataset.py,sha256=xFi0a-A3uvtxVwFM6JOyitkEPd1I2slIBj5SWfys3hQ,32724
5
5
  upgini/errors.py,sha256=2b_Wbo0OYhLUbrZqdLIx5jBnAsiD1Mcenh-VjR4HCTw,950
6
6
  upgini/features_enricher.py,sha256=rfVdHgUYEq9saqhWcI04jUmNQcAAn5Kto4w3WpxlOpA,221762
7
7
  upgini/http.py,sha256=zeAZvT6IAzOs9jQ3WG8mJBANLajgvv2LZePFzKz004w,45482
@@ -15,7 +15,7 @@ upgini/ads_management/ads_manager.py,sha256=igVbN2jz80Umb2BUJixmJVj-zx8unoKpecVo
15
15
  upgini/autofe/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
16
16
  upgini/autofe/all_operators.py,sha256=rdjF5eaE4bC6Q4eu_el5Z7ekYt8DjOFermz2bePPbUc,333
17
17
  upgini/autofe/binary.py,sha256=oOEECc4nRzZN2tYaiqx8F2XHnfWpk1bVvb7ZkZJ0lO8,7709
18
- upgini/autofe/date.py,sha256=Ga022BUSgXJ4W3P8uWkPNo6k6J0IuEZw6Ezs9KNikPk,11188
18
+ upgini/autofe/date.py,sha256=RvexgrL1_6ISYPVrl9HUQmPgpVSGQsTNv8YhNQWs-5M,11329
19
19
  upgini/autofe/feature.py,sha256=b4Ps_sCPui9b4h0K3ya85cfL1SWpLVrlHc40zkKVfAY,16329
20
20
  upgini/autofe/groupby.py,sha256=IYmQV9uoCdRcpkeWZj_kI3ObzoNCNx3ff3h8sTL01tk,3603
21
21
  upgini/autofe/operator.py,sha256=RB3rKMjFi5Cx81RiYXN3OTCuXjmvzmFKQrxn4h0Oclo,5219
@@ -64,14 +64,14 @@ upgini/utils/mstats.py,sha256=u3gQVUtDRbyrOQK6V1UJ2Rx1QbkSNYGjXa6m3Z_dPVs,6286
64
64
  upgini/utils/phone_utils.py,sha256=IrbztLuOJBiePqqxllfABWfYlfAjYevPhXKipl95wUI,10432
65
65
  upgini/utils/postal_code_utils.py,sha256=5M0sUqH2DAr33kARWCTXR-ACyzWbjDq_-0mmEml6ZcU,1716
66
66
  upgini/utils/progress_bar.py,sha256=N-Sfdah2Hg8lXP_fV9EfUTXz_PyRt4lo9fAHoUDOoLc,1550
67
- upgini/utils/sample_utils.py,sha256=ETLPKQU_YngiYbdlnEoF2h7QS-3oN8et54q3Qs2ZAbA,15417
67
+ upgini/utils/sample_utils.py,sha256=lZJ4yf9Jiq9Em2Ny9m3RIiF7WSxBPrc4E3xxn_8sQk8,15417
68
68
  upgini/utils/sklearn_ext.py,sha256=jLJWAKkqQinV15Z4y1ZnsN3c-fKFwXTsprs00COnyVU,49315
69
69
  upgini/utils/sort.py,sha256=8uuHs2nfSMVnz8GgvbOmgMB1PgEIZP1uhmeRFxcwnYw,7039
70
70
  upgini/utils/target_utils.py,sha256=i3Xt5l9ybB2_nF_ma5cfPuL3OeFTs2dY2xDI0p4Azpg,9049
71
71
  upgini/utils/track_info.py,sha256=G5Lu1xxakg2_TQjKZk4b5SvrHsATTXNVV3NbvWtT8k8,5663
72
72
  upgini/utils/ts_utils.py,sha256=26vhC0pN7vLXK6R09EEkMK3Lwb9IVPH7LRdqFIQ3kPs,1383
73
73
  upgini/utils/warning_counter.py,sha256=-GRY8EUggEBKODPSuXAkHn9KnEQwAORC0mmz_tim-PM,254
74
- upgini-1.2.111.dist-info/METADATA,sha256=FFU_9hZGBiuvJFZpxnlMJVkWlZ4ykBOnA0KcGqOBSyQ,49529
75
- upgini-1.2.111.dist-info/WHEEL,sha256=1yFddiXMmvYK7QYTqtRNtX66WJ0Mz8PYEiEUoOUUxRY,87
76
- upgini-1.2.111.dist-info/licenses/LICENSE,sha256=5RRzgvdJUu3BUDfv4bzVU6FqKgwHlIay63pPCSmSgzw,1514
77
- upgini-1.2.111.dist-info/RECORD,,
74
+ upgini-1.2.113.dist-info/METADATA,sha256=p2gvqfKWenNyt1s95-ZalIp6mYCaq0LSVrzphZAQvH4,49528
75
+ upgini-1.2.113.dist-info/WHEEL,sha256=zEMcRr9Kr03x1ozGwg5v9NQBKn3kndp6LSoSlVg-jhU,87
76
+ upgini-1.2.113.dist-info/licenses/LICENSE,sha256=5RRzgvdJUu3BUDfv4bzVU6FqKgwHlIay63pPCSmSgzw,1514
77
+ upgini-1.2.113.dist-info/RECORD,,
@@ -1,4 +1,4 @@
1
1
  Wheel-Version: 1.0
2
- Generator: hatchling 1.25.0
2
+ Generator: hatchling 1.24.2
3
3
  Root-Is-Purelib: true
4
4
  Tag: py3-none-any