dragon-ml-toolbox 10.12.0__tar.gz → 10.13.0__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.


This version of dragon-ml-toolbox might be problematic. Click here for more details.

Files changed (41)
  1. {dragon_ml_toolbox-10.12.0 → dragon_ml_toolbox-10.13.0}/LICENSE +1 -1
  2. {dragon_ml_toolbox-10.12.0 → dragon_ml_toolbox-10.13.0}/LICENSE-THIRD-PARTY.md +1 -0
  3. {dragon_ml_toolbox-10.12.0/dragon_ml_toolbox.egg-info → dragon_ml_toolbox-10.13.0}/PKG-INFO +3 -28
  4. {dragon_ml_toolbox-10.12.0 → dragon_ml_toolbox-10.13.0}/README.md +0 -21
  5. {dragon_ml_toolbox-10.12.0 → dragon_ml_toolbox-10.13.0/dragon_ml_toolbox.egg-info}/PKG-INFO +3 -28
  6. {dragon_ml_toolbox-10.12.0 → dragon_ml_toolbox-10.13.0}/dragon_ml_toolbox.egg-info/requires.txt +2 -7
  7. {dragon_ml_toolbox-10.12.0 → dragon_ml_toolbox-10.13.0}/ml_tools/ETL_cleaning.py +5 -3
  8. {dragon_ml_toolbox-10.12.0 → dragon_ml_toolbox-10.13.0}/ml_tools/ensemble_inference.py +1 -1
  9. {dragon_ml_toolbox-10.12.0 → dragon_ml_toolbox-10.13.0}/pyproject.toml +5 -12
  10. {dragon_ml_toolbox-10.12.0 → dragon_ml_toolbox-10.13.0}/dragon_ml_toolbox.egg-info/SOURCES.txt +0 -0
  11. {dragon_ml_toolbox-10.12.0 → dragon_ml_toolbox-10.13.0}/dragon_ml_toolbox.egg-info/dependency_links.txt +0 -0
  12. {dragon_ml_toolbox-10.12.0 → dragon_ml_toolbox-10.13.0}/dragon_ml_toolbox.egg-info/top_level.txt +0 -0
  13. {dragon_ml_toolbox-10.12.0 → dragon_ml_toolbox-10.13.0}/ml_tools/ETL_engineering.py +0 -0
  14. {dragon_ml_toolbox-10.12.0 → dragon_ml_toolbox-10.13.0}/ml_tools/GUI_tools.py +0 -0
  15. {dragon_ml_toolbox-10.12.0 → dragon_ml_toolbox-10.13.0}/ml_tools/MICE_imputation.py +0 -0
  16. {dragon_ml_toolbox-10.12.0 → dragon_ml_toolbox-10.13.0}/ml_tools/ML_callbacks.py +0 -0
  17. {dragon_ml_toolbox-10.12.0 → dragon_ml_toolbox-10.13.0}/ml_tools/ML_datasetmaster.py +0 -0
  18. {dragon_ml_toolbox-10.12.0 → dragon_ml_toolbox-10.13.0}/ml_tools/ML_evaluation.py +0 -0
  19. {dragon_ml_toolbox-10.12.0 → dragon_ml_toolbox-10.13.0}/ml_tools/ML_evaluation_multi.py +0 -0
  20. {dragon_ml_toolbox-10.12.0 → dragon_ml_toolbox-10.13.0}/ml_tools/ML_inference.py +0 -0
  21. {dragon_ml_toolbox-10.12.0 → dragon_ml_toolbox-10.13.0}/ml_tools/ML_models.py +0 -0
  22. {dragon_ml_toolbox-10.12.0 → dragon_ml_toolbox-10.13.0}/ml_tools/ML_optimization.py +0 -0
  23. {dragon_ml_toolbox-10.12.0 → dragon_ml_toolbox-10.13.0}/ml_tools/ML_scaler.py +0 -0
  24. {dragon_ml_toolbox-10.12.0 → dragon_ml_toolbox-10.13.0}/ml_tools/ML_trainer.py +0 -0
  25. {dragon_ml_toolbox-10.12.0 → dragon_ml_toolbox-10.13.0}/ml_tools/PSO_optimization.py +0 -0
  26. {dragon_ml_toolbox-10.12.0 → dragon_ml_toolbox-10.13.0}/ml_tools/RNN_forecast.py +0 -0
  27. {dragon_ml_toolbox-10.12.0 → dragon_ml_toolbox-10.13.0}/ml_tools/SQL.py +0 -0
  28. {dragon_ml_toolbox-10.12.0 → dragon_ml_toolbox-10.13.0}/ml_tools/VIF_factor.py +0 -0
  29. {dragon_ml_toolbox-10.12.0 → dragon_ml_toolbox-10.13.0}/ml_tools/__init__.py +0 -0
  30. {dragon_ml_toolbox-10.12.0 → dragon_ml_toolbox-10.13.0}/ml_tools/_logger.py +0 -0
  31. {dragon_ml_toolbox-10.12.0 → dragon_ml_toolbox-10.13.0}/ml_tools/_script_info.py +0 -0
  32. {dragon_ml_toolbox-10.12.0 → dragon_ml_toolbox-10.13.0}/ml_tools/custom_logger.py +0 -0
  33. {dragon_ml_toolbox-10.12.0 → dragon_ml_toolbox-10.13.0}/ml_tools/data_exploration.py +0 -0
  34. {dragon_ml_toolbox-10.12.0 → dragon_ml_toolbox-10.13.0}/ml_tools/ensemble_evaluation.py +0 -0
  35. {dragon_ml_toolbox-10.12.0 → dragon_ml_toolbox-10.13.0}/ml_tools/ensemble_learning.py +0 -0
  36. {dragon_ml_toolbox-10.12.0 → dragon_ml_toolbox-10.13.0}/ml_tools/handle_excel.py +0 -0
  37. {dragon_ml_toolbox-10.12.0 → dragon_ml_toolbox-10.13.0}/ml_tools/keys.py +0 -0
  38. {dragon_ml_toolbox-10.12.0 → dragon_ml_toolbox-10.13.0}/ml_tools/optimization_tools.py +0 -0
  39. {dragon_ml_toolbox-10.12.0 → dragon_ml_toolbox-10.13.0}/ml_tools/path_manager.py +0 -0
  40. {dragon_ml_toolbox-10.12.0 → dragon_ml_toolbox-10.13.0}/ml_tools/utilities.py +0 -0
  41. {dragon_ml_toolbox-10.12.0 → dragon_ml_toolbox-10.13.0}/setup.cfg +0 -0
@@ -1,6 +1,6 @@
1
1
  MIT License
2
2
 
3
- Copyright (c) 2025 Karl Loza
3
+ Copyright (c) 2025 Karl Luigi Loza Vidaurre
4
4
 
5
5
  Permission is hereby granted, free of charge, to any person obtaining a copy
6
6
  of this software and associated documentation files (the "Software"), to deal
@@ -26,3 +26,4 @@ This project depends on the following third-party packages. Each is governed by
26
26
  - [polars](https://github.com/pola-rs/polars/blob/main/LICENSE)
27
27
  - [plotnine](https://github.com/has2k1/plotnine/blob/main/LICENSE)
28
28
  - [tqdm](https://github.com/tqdm/tqdm/blob/master/LICENSE)
29
+ - [pyarrow](https://github.com/apache/arrow/blob/main/LICENSE.txt)
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.4
2
2
  Name: dragon-ml-toolbox
3
- Version: 10.12.0
3
+ Version: 10.13.0
4
4
  Summary: A collection of tools for data science and machine learning projects.
5
5
  Author-email: Karl Loza <luigiloza@gmail.com>
6
6
  License-Expression: MIT
@@ -12,12 +12,6 @@ Requires-Python: >=3.10
12
12
  Description-Content-Type: text/markdown
13
13
  License-File: LICENSE
14
14
  License-File: LICENSE-THIRD-PARTY.md
15
- Provides-Extra: base
16
- Requires-Dist: pandas; extra == "base"
17
- Requires-Dist: numpy; extra == "base"
18
- Requires-Dist: polars; extra == "base"
19
- Requires-Dist: joblib; extra == "base"
20
- Requires-Dist: colorlog; extra == "base"
21
15
  Provides-Extra: ml
22
16
  Requires-Dist: numpy>=2.0; extra == "ml"
23
17
  Requires-Dist: pandas; extra == "ml"
@@ -38,6 +32,7 @@ Requires-Dist: shap; extra == "ml"
38
32
  Requires-Dist: tqdm; extra == "ml"
39
33
  Requires-Dist: Pillow; extra == "ml"
40
34
  Requires-Dist: evotorch; extra == "ml"
35
+ Requires-Dist: pyarrow; extra == "ml"
41
36
  Requires-Dist: colorlog; extra == "ml"
42
37
  Provides-Extra: mice
43
38
  Requires-Dist: numpy<2.0; extra == "mice"
@@ -51,6 +46,7 @@ Requires-Dist: statsmodels; extra == "mice"
51
46
  Requires-Dist: lightgbm<=4.5.0; extra == "mice"
52
47
  Requires-Dist: shap; extra == "mice"
53
48
  Requires-Dist: colorlog; extra == "mice"
49
+ Requires-Dist: pyarrow; extra == "mice"
54
50
  Provides-Extra: pytorch
55
51
  Requires-Dist: torch; extra == "pytorch"
56
52
  Requires-Dist: torchvision; extra == "pytorch"
@@ -255,27 +251,6 @@ path_manager
255
251
 
256
252
  ---
257
253
 
258
- ### 🎫 Base Tools [base]
259
-
260
- General purpose functions and classes.
261
-
262
- ```Bash
263
- pip install "dragon-ml-toolbox[base]"
264
- ```
265
-
266
- #### Modules:
267
-
268
- ```Bash
269
- ETL_cleaning
270
- ETL_engineering
271
- custom_logger
272
- SQL
273
- utilities
274
- path_manager
275
- ```
276
-
277
- ---
278
-
279
254
  ### ⚒️ APP bundlers
280
255
 
281
256
  Choose one if needed.
@@ -170,27 +170,6 @@ path_manager
170
170
 
171
171
  ---
172
172
 
173
- ### 🎫 Base Tools [base]
174
-
175
- General purpose functions and classes.
176
-
177
- ```Bash
178
- pip install "dragon-ml-toolbox[base]"
179
- ```
180
-
181
- #### Modules:
182
-
183
- ```Bash
184
- ETL_cleaning
185
- ETL_engineering
186
- custom_logger
187
- SQL
188
- utilities
189
- path_manager
190
- ```
191
-
192
- ---
193
-
194
173
  ### ⚒️ APP bundlers
195
174
 
196
175
  Choose one if needed.
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.4
2
2
  Name: dragon-ml-toolbox
3
- Version: 10.12.0
3
+ Version: 10.13.0
4
4
  Summary: A collection of tools for data science and machine learning projects.
5
5
  Author-email: Karl Loza <luigiloza@gmail.com>
6
6
  License-Expression: MIT
@@ -12,12 +12,6 @@ Requires-Python: >=3.10
12
12
  Description-Content-Type: text/markdown
13
13
  License-File: LICENSE
14
14
  License-File: LICENSE-THIRD-PARTY.md
15
- Provides-Extra: base
16
- Requires-Dist: pandas; extra == "base"
17
- Requires-Dist: numpy; extra == "base"
18
- Requires-Dist: polars; extra == "base"
19
- Requires-Dist: joblib; extra == "base"
20
- Requires-Dist: colorlog; extra == "base"
21
15
  Provides-Extra: ml
22
16
  Requires-Dist: numpy>=2.0; extra == "ml"
23
17
  Requires-Dist: pandas; extra == "ml"
@@ -38,6 +32,7 @@ Requires-Dist: shap; extra == "ml"
38
32
  Requires-Dist: tqdm; extra == "ml"
39
33
  Requires-Dist: Pillow; extra == "ml"
40
34
  Requires-Dist: evotorch; extra == "ml"
35
+ Requires-Dist: pyarrow; extra == "ml"
41
36
  Requires-Dist: colorlog; extra == "ml"
42
37
  Provides-Extra: mice
43
38
  Requires-Dist: numpy<2.0; extra == "mice"
@@ -51,6 +46,7 @@ Requires-Dist: statsmodels; extra == "mice"
51
46
  Requires-Dist: lightgbm<=4.5.0; extra == "mice"
52
47
  Requires-Dist: shap; extra == "mice"
53
48
  Requires-Dist: colorlog; extra == "mice"
49
+ Requires-Dist: pyarrow; extra == "mice"
54
50
  Provides-Extra: pytorch
55
51
  Requires-Dist: torch; extra == "pytorch"
56
52
  Requires-Dist: torchvision; extra == "pytorch"
@@ -255,27 +251,6 @@ path_manager
255
251
 
256
252
  ---
257
253
 
258
- ### 🎫 Base Tools [base]
259
-
260
- General purpose functions and classes.
261
-
262
- ```Bash
263
- pip install "dragon-ml-toolbox[base]"
264
- ```
265
-
266
- #### Modules:
267
-
268
- ```Bash
269
- ETL_cleaning
270
- ETL_engineering
271
- custom_logger
272
- SQL
273
- utilities
274
- path_manager
275
- ```
276
-
277
- ---
278
-
279
254
  ### ⚒️ APP bundlers
280
255
 
281
256
  Choose one if needed.
@@ -19,13 +19,7 @@ shap
19
19
  tqdm
20
20
  Pillow
21
21
  evotorch
22
- colorlog
23
-
24
- [base]
25
- pandas
26
- numpy
27
- polars
28
- joblib
22
+ pyarrow
29
23
  colorlog
30
24
 
31
25
  [excel]
@@ -61,6 +55,7 @@ statsmodels
61
55
  lightgbm<=4.5.0
62
56
  shap
63
57
  colorlog
58
+ pyarrow
64
59
 
65
60
  [nuitka]
66
61
  nuitka
@@ -142,8 +142,8 @@ def _cleaner_core(df_in: pl.DataFrame) -> pl.DataFrame:
142
142
  r'[°˚]': '',
143
143
 
144
144
  # Replace special characters in entries
145
- r'\\': '-',
146
- '/': '-',
145
+ r'\\': '_',
146
+ # '/': '_', # keep forward slash
147
147
 
148
148
  # Typographical standardization
149
149
  # Unify various dashes and hyphens to a standard hyphen
@@ -157,6 +157,8 @@ def _cleaner_core(df_in: pl.DataFrame) -> pl.DataFrame:
157
157
  r'\.{2,}': '.', # Replace two or more dots with a single dot
158
158
  r'\?{2,}': '?', # Replace two or more question marks with a single question mark
159
159
  r'!{2,}': '!', # Replace two or more exclamation marks with a single one
160
+ r';{2,}': ';',
161
+ r'-{2,}': '-',
160
162
 
161
163
  # 2. Internal Whitespace Consolidation
162
164
  # Collapse any sequence of whitespace chars (including non-breaking spaces) to a single space
@@ -168,7 +170,7 @@ def _cleaner_core(df_in: pl.DataFrame) -> pl.DataFrame:
168
170
 
169
171
  # 4. Textual Null Standardization (New Step)
170
172
  # Convert common null-like text to actual nulls.
171
- r'^(N/A|无|NA|NULL|NONE|NIL|)$': None,
173
+ r'^(N/A|无|NA|NULL|NONE|NIL|-|\.|;)$': None,
172
174
 
173
175
  # 5. Final Nullification of Empty Strings
174
176
  # After all cleaning, if a string is now empty, convert it to a null
@@ -219,7 +219,7 @@ def model_report(
219
219
  return report_data
220
220
 
221
221
 
222
- # Local implementation to avoid calling utilities' dependencies
222
+ # Local implementation to avoid calling utilities dependencies
223
223
  def _deserialize_object(filepath: Union[str,Path], verbose: bool=True, raise_on_error: bool=True) -> Optional[Any]:
224
224
  """
225
225
  Loads a serialized object from a .joblib file.
@@ -1,6 +1,6 @@
1
1
  [project]
2
2
  name = "dragon-ml-toolbox"
3
- version = "10.12.0"
3
+ version = "10.13.0"
4
4
  description = "A collection of tools for data science and machine learning projects."
5
5
  authors = [
6
6
  { name = "Karl Loza", email = "luigiloza@gmail.com" }
@@ -19,15 +19,6 @@ Homepage = "https://github.com/DrAg0n-BoRn/ML_tools"
19
19
  Changelog = "https://github.com/DrAg0n-BoRn/ML_tools/blob/master/CHANGELOG.md"
20
20
 
21
21
  [project.optional-dependencies]
22
- # Base all purpose tools
23
- base = [
24
- "pandas",
25
- "numpy",
26
- "polars",
27
- "joblib",
28
- "colorlog"
29
- ]
30
-
31
22
  # Machine Learning main toolbox. Additionally Requires PyTorch with CUDA / MPS support
32
23
  ML = [
33
24
  "numpy>=2.0",
@@ -48,7 +39,8 @@ ML = [
48
39
  "shap",
49
40
  "tqdm",
50
41
  "Pillow",
51
- "evotorch",
42
+ "evotorch",
43
+ "pyarrow",
52
44
  "colorlog"
53
45
  ]
54
46
 
@@ -64,7 +56,8 @@ mice = [
64
56
  "statsmodels",
65
57
  "lightgbm<=4.5.0",
66
58
  "shap",
67
- "colorlog"
59
+ "colorlog",
60
+ "pyarrow"
68
61
  ]
69
62
 
70
63
  # pytorch base CPU installations - not recommended