dragon-ml-toolbox 10.12.0__py3-none-any.whl → 10.13.0__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Potentially problematic release.
This version of dragon-ml-toolbox might be problematic. Click here for more details.
- {dragon_ml_toolbox-10.12.0.dist-info → dragon_ml_toolbox-10.13.0.dist-info}/METADATA +3 -28
- {dragon_ml_toolbox-10.12.0.dist-info → dragon_ml_toolbox-10.13.0.dist-info}/RECORD +8 -8
- {dragon_ml_toolbox-10.12.0.dist-info → dragon_ml_toolbox-10.13.0.dist-info}/licenses/LICENSE +1 -1
- {dragon_ml_toolbox-10.12.0.dist-info → dragon_ml_toolbox-10.13.0.dist-info}/licenses/LICENSE-THIRD-PARTY.md +1 -0
- ml_tools/ETL_cleaning.py +5 -3
- ml_tools/ensemble_inference.py +1 -1
- {dragon_ml_toolbox-10.12.0.dist-info → dragon_ml_toolbox-10.13.0.dist-info}/WHEEL +0 -0
- {dragon_ml_toolbox-10.12.0.dist-info → dragon_ml_toolbox-10.13.0.dist-info}/top_level.txt +0 -0
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
Metadata-Version: 2.4
|
|
2
2
|
Name: dragon-ml-toolbox
|
|
3
|
-
Version: 10.12.0
|
|
3
|
+
Version: 10.13.0
|
|
4
4
|
Summary: A collection of tools for data science and machine learning projects.
|
|
5
5
|
Author-email: Karl Loza <luigiloza@gmail.com>
|
|
6
6
|
License-Expression: MIT
|
|
@@ -12,12 +12,6 @@ Requires-Python: >=3.10
|
|
|
12
12
|
Description-Content-Type: text/markdown
|
|
13
13
|
License-File: LICENSE
|
|
14
14
|
License-File: LICENSE-THIRD-PARTY.md
|
|
15
|
-
Provides-Extra: base
|
|
16
|
-
Requires-Dist: pandas; extra == "base"
|
|
17
|
-
Requires-Dist: numpy; extra == "base"
|
|
18
|
-
Requires-Dist: polars; extra == "base"
|
|
19
|
-
Requires-Dist: joblib; extra == "base"
|
|
20
|
-
Requires-Dist: colorlog; extra == "base"
|
|
21
15
|
Provides-Extra: ml
|
|
22
16
|
Requires-Dist: numpy>=2.0; extra == "ml"
|
|
23
17
|
Requires-Dist: pandas; extra == "ml"
|
|
@@ -38,6 +32,7 @@ Requires-Dist: shap; extra == "ml"
|
|
|
38
32
|
Requires-Dist: tqdm; extra == "ml"
|
|
39
33
|
Requires-Dist: Pillow; extra == "ml"
|
|
40
34
|
Requires-Dist: evotorch; extra == "ml"
|
|
35
|
+
Requires-Dist: pyarrow; extra == "ml"
|
|
41
36
|
Requires-Dist: colorlog; extra == "ml"
|
|
42
37
|
Provides-Extra: mice
|
|
43
38
|
Requires-Dist: numpy<2.0; extra == "mice"
|
|
@@ -51,6 +46,7 @@ Requires-Dist: statsmodels; extra == "mice"
|
|
|
51
46
|
Requires-Dist: lightgbm<=4.5.0; extra == "mice"
|
|
52
47
|
Requires-Dist: shap; extra == "mice"
|
|
53
48
|
Requires-Dist: colorlog; extra == "mice"
|
|
49
|
+
Requires-Dist: pyarrow; extra == "mice"
|
|
54
50
|
Provides-Extra: pytorch
|
|
55
51
|
Requires-Dist: torch; extra == "pytorch"
|
|
56
52
|
Requires-Dist: torchvision; extra == "pytorch"
|
|
@@ -255,27 +251,6 @@ path_manager
|
|
|
255
251
|
|
|
256
252
|
---
|
|
257
253
|
|
|
258
|
-
### 🎫 Base Tools [base]
|
|
259
|
-
|
|
260
|
-
General purpose functions and classes.
|
|
261
|
-
|
|
262
|
-
```Bash
|
|
263
|
-
pip install "dragon-ml-toolbox[base]"
|
|
264
|
-
```
|
|
265
|
-
|
|
266
|
-
#### Modules:
|
|
267
|
-
|
|
268
|
-
```Bash
|
|
269
|
-
ETL_cleaning
|
|
270
|
-
ETL_engineering
|
|
271
|
-
custom_logger
|
|
272
|
-
SQL
|
|
273
|
-
utilities
|
|
274
|
-
path_manager
|
|
275
|
-
```
|
|
276
|
-
|
|
277
|
-
---
|
|
278
|
-
|
|
279
254
|
### ⚒️ APP bundlers
|
|
280
255
|
|
|
281
256
|
Choose one if needed.
|
|
@@ -1,6 +1,6 @@
|
|
|
1
|
-
dragon_ml_toolbox-10.
|
|
2
|
-
dragon_ml_toolbox-10.
|
|
3
|
-
ml_tools/ETL_cleaning.py,sha256=
|
|
1
|
+
dragon_ml_toolbox-10.13.0.dist-info/licenses/LICENSE,sha256=L35WDmmLZNTlJvxF6Vy7Uy4SYNi6rCfWUqlTHpoRMoU,1081
|
|
2
|
+
dragon_ml_toolbox-10.13.0.dist-info/licenses/LICENSE-THIRD-PARTY.md,sha256=iy2r_R7wjzsCbz_Q_jMsp_jfZ6oP8XW9QhwzRBH0mGY,1904
|
|
3
|
+
ml_tools/ETL_cleaning.py,sha256=mkbcSTBspGWnHQUAj6hNqJdZ4VXLPFNk1qEY-8rmnZ8,19368
|
|
4
4
|
ml_tools/ETL_engineering.py,sha256=a6KCWH6kRatZtjaFEF_o917ApPMK5_vRD-BjfCDAl-E,49400
|
|
5
5
|
ml_tools/GUI_tools.py,sha256=kEQWg-bog3pB5tI22gMGKWaCGHnz9TB2Lvvfhf5F2CI,45412
|
|
6
6
|
ml_tools/MICE_imputation.py,sha256=kVSythWfxJFR4-2mtcYCWQaQ1Oz5yyx_SJu5gjnS7H8,11670
|
|
@@ -23,14 +23,14 @@ ml_tools/_script_info.py,sha256=21r83LV3RubsNZ_RTEUON6RbDf7Mh4_udweNcvdF_Fk,212
|
|
|
23
23
|
ml_tools/custom_logger.py,sha256=ry43hk54K6xKo8jRAgq1sFxUpOA9T0LIJ7sw0so2BW0,5880
|
|
24
24
|
ml_tools/data_exploration.py,sha256=-aTi5jmv4AepPgi2k_85qEJsSLx5zPOtTbhorqzUvGQ,38542
|
|
25
25
|
ml_tools/ensemble_evaluation.py,sha256=FGHSe8LBI8_w8LjNeJWOcYQ1UK_mc6fVah8gmSvNVGg,26853
|
|
26
|
-
ml_tools/ensemble_inference.py,sha256=
|
|
26
|
+
ml_tools/ensemble_inference.py,sha256=Hun_ipIZaaLrHxSo63J6NKS_O1fMWi_6HkuSHs4RywI,9349
|
|
27
27
|
ml_tools/ensemble_learning.py,sha256=3s0kH4i_naj0IVl_T4knst-Hwg4TScWjEdsXX5KAi7I,21929
|
|
28
28
|
ml_tools/handle_excel.py,sha256=He4UT15sCGhaG-JKfs7uYVAubxWjrqgJ6U7OhMR2fuE,14005
|
|
29
29
|
ml_tools/keys.py,sha256=FDpbS3Jb0pjrVvvp2_8nZi919mbob_-xwuy5OOtKM_A,1848
|
|
30
30
|
ml_tools/optimization_tools.py,sha256=P3I6lIpvZ8Xf2kX5FvvBKBmrK2pB6idBpkTzfUJxTeE,5073
|
|
31
31
|
ml_tools/path_manager.py,sha256=ke0MYOhYheRPX599GUbrvRsYHn2JKUmMDldS5LP6LQA,18431
|
|
32
32
|
ml_tools/utilities.py,sha256=uheMUjQJ1zI69gASsE-mCq4KlRPVGgrgqson02rGNYM,30755
|
|
33
|
-
dragon_ml_toolbox-10.
|
|
34
|
-
dragon_ml_toolbox-10.
|
|
35
|
-
dragon_ml_toolbox-10.
|
|
36
|
-
dragon_ml_toolbox-10.
|
|
33
|
+
dragon_ml_toolbox-10.13.0.dist-info/METADATA,sha256=6WXvcXmw1klTCInH807lZGyWg6cjgmoV6uEeKsBqlq8,6608
|
|
34
|
+
dragon_ml_toolbox-10.13.0.dist-info/WHEEL,sha256=_zCd3N1l69ArxyTb8rzEoP9TpbYXkqRFSNOD5OuxnTs,91
|
|
35
|
+
dragon_ml_toolbox-10.13.0.dist-info/top_level.txt,sha256=wm-oxax3ciyez6VoO4zsFd-gSok2VipYXnbg3TH9PtU,9
|
|
36
|
+
dragon_ml_toolbox-10.13.0.dist-info/RECORD,,
|
|
@@ -26,3 +26,4 @@ This project depends on the following third-party packages. Each is governed by
|
|
|
26
26
|
- [polars](https://github.com/pola-rs/polars/blob/main/LICENSE)
|
|
27
27
|
- [plotnine](https://github.com/has2k1/plotnine/blob/main/LICENSE)
|
|
28
28
|
- [tqdm](https://github.com/tqdm/tqdm/blob/master/LICENSE)
|
|
29
|
+
- [pyarrow](https://github.com/apache/arrow/blob/main/LICENSE.txt)
|
ml_tools/ETL_cleaning.py
CHANGED
|
@@ -142,8 +142,8 @@ def _cleaner_core(df_in: pl.DataFrame) -> pl.DataFrame:
|
|
|
142
142
|
r'[°˚]': '',
|
|
143
143
|
|
|
144
144
|
# Replace special characters in entries
|
|
145
|
-
r'\\': '
|
|
146
|
-
'/': '
|
|
145
|
+
r'\\': '_',
|
|
146
|
+
# '/': '_', # keep forward slash
|
|
147
147
|
|
|
148
148
|
# Typographical standardization
|
|
149
149
|
# Unify various dashes and hyphens to a standard hyphen
|
|
@@ -157,6 +157,8 @@ def _cleaner_core(df_in: pl.DataFrame) -> pl.DataFrame:
|
|
|
157
157
|
r'\.{2,}': '.', # Replace two or more dots with a single dot
|
|
158
158
|
r'\?{2,}': '?', # Replace two or more question marks with a single question mark
|
|
159
159
|
r'!{2,}': '!', # Replace two or more exclamation marks with a single one
|
|
160
|
+
r';{2,}': ';',
|
|
161
|
+
r'-{2,}': '-',
|
|
160
162
|
|
|
161
163
|
# 2. Internal Whitespace Consolidation
|
|
162
164
|
# Collapse any sequence of whitespace chars (including non-breaking spaces) to a single space
|
|
@@ -168,7 +170,7 @@ def _cleaner_core(df_in: pl.DataFrame) -> pl.DataFrame:
|
|
|
168
170
|
|
|
169
171
|
# 4. Textual Null Standardization (New Step)
|
|
170
172
|
# Convert common null-like text to actual nulls.
|
|
171
|
-
r'^(N/A|无|NA|NULL|NONE|NIL)$': None,
|
|
173
|
+
r'^(N/A|无|NA|NULL|NONE|NIL|-|\.|;)$': None,
|
|
172
174
|
|
|
173
175
|
# 5. Final Nullification of Empty Strings
|
|
174
176
|
# After all cleaning, if a string is now empty, convert it to a null
|
ml_tools/ensemble_inference.py
CHANGED
|
@@ -219,7 +219,7 @@ def model_report(
|
|
|
219
219
|
return report_data
|
|
220
220
|
|
|
221
221
|
|
|
222
|
-
# Local implementation to avoid calling utilities
|
|
222
|
+
# Local implementation to avoid calling utilities dependencies
|
|
223
223
|
def _deserialize_object(filepath: Union[str,Path], verbose: bool=True, raise_on_error: bool=True) -> Optional[Any]:
|
|
224
224
|
"""
|
|
225
225
|
Loads a serialized object from a .joblib file.
|
|
File without changes
|
|
File without changes
|