dragon-ml-toolbox 10.0.0__py3-none-any.whl → 10.0.1__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Potentially problematic release.
This version of dragon-ml-toolbox might be problematic. Click here for more details.
- {dragon_ml_toolbox-10.0.0.dist-info → dragon_ml_toolbox-10.0.1.dist-info}/METADATA +4 -2
- {dragon_ml_toolbox-10.0.0.dist-info → dragon_ml_toolbox-10.0.1.dist-info}/RECORD +7 -7
- ml_tools/ETL_cleaning.py +2 -2
- {dragon_ml_toolbox-10.0.0.dist-info → dragon_ml_toolbox-10.0.1.dist-info}/WHEEL +0 -0
- {dragon_ml_toolbox-10.0.0.dist-info → dragon_ml_toolbox-10.0.1.dist-info}/licenses/LICENSE +0 -0
- {dragon_ml_toolbox-10.0.0.dist-info → dragon_ml_toolbox-10.0.1.dist-info}/licenses/LICENSE-THIRD-PARTY.md +0 -0
- {dragon_ml_toolbox-10.0.0.dist-info → dragon_ml_toolbox-10.0.1.dist-info}/top_level.txt +0 -0
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
Metadata-Version: 2.4
|
|
2
2
|
Name: dragon-ml-toolbox
|
|
3
|
-
Version: 10.0.0
|
|
3
|
+
Version: 10.0.1
|
|
4
4
|
Summary: A collection of tools for data science and machine learning projects.
|
|
5
5
|
Author-email: Karl Loza <luigiloza@gmail.com>
|
|
6
6
|
License-Expression: MIT
|
|
@@ -148,6 +148,7 @@ data_exploration
|
|
|
148
148
|
ensemble_evaluation
|
|
149
149
|
ensemble_inference
|
|
150
150
|
ensemble_learning
|
|
151
|
+
ETL_cleaning
|
|
151
152
|
ETL_engineering
|
|
152
153
|
ML_callbacks
|
|
153
154
|
ML_datasetmaster
|
|
@@ -265,7 +266,8 @@ pip install "dragon-ml-toolbox[base]"
|
|
|
265
266
|
#### Modules:
|
|
266
267
|
|
|
267
268
|
```Bash
|
|
268
|
-
|
|
269
|
+
ETL_cleaning
|
|
270
|
+
ETL_engineering
|
|
269
271
|
custom_logger
|
|
270
272
|
SQL
|
|
271
273
|
utilities
|
|
@@ -1,6 +1,6 @@
|
|
|
1
|
-
dragon_ml_toolbox-10.0.0.dist-info/licenses/LICENSE,sha256=2uUFNy7D0TLgHim1K5s3DIJ4q_KvxEXVilnU20cWliY,1066
|
|
2
|
-
dragon_ml_toolbox-10.0.0.dist-info/licenses/LICENSE-THIRD-PARTY.md,sha256=lY4_rJPnLnMu7YBQaY-_iz1JRDcLdQzNCyeLAF1glJY,1837
|
|
3
|
-
ml_tools/ETL_cleaning.py,sha256=
|
|
1
|
+
dragon_ml_toolbox-10.0.1.dist-info/licenses/LICENSE,sha256=2uUFNy7D0TLgHim1K5s3DIJ4q_KvxEXVilnU20cWliY,1066
|
|
2
|
+
dragon_ml_toolbox-10.0.1.dist-info/licenses/LICENSE-THIRD-PARTY.md,sha256=lY4_rJPnLnMu7YBQaY-_iz1JRDcLdQzNCyeLAF1glJY,1837
|
|
3
|
+
ml_tools/ETL_cleaning.py,sha256=g_6BH0amK4aQwX8aEM2z4JYyskjbSg5ktu8n0YbrM3w,14905
|
|
4
4
|
ml_tools/ETL_engineering.py,sha256=sgpIhlFIeId4eSJ-a33MnVuPNXs50msxFWa8-kw2hOI,36369
|
|
5
5
|
ml_tools/GUI_tools.py,sha256=kEQWg-bog3pB5tI22gMGKWaCGHnz9TB2Lvvfhf5F2CI,45412
|
|
6
6
|
ml_tools/MICE_imputation.py,sha256=kVSythWfxJFR4-2mtcYCWQaQ1Oz5yyx_SJu5gjnS7H8,11670
|
|
@@ -30,7 +30,7 @@ ml_tools/keys.py,sha256=HtPG8-MWh89C32A7eIlfuuA-DLwkxGkoDfwR2TGN9CQ,1074
|
|
|
30
30
|
ml_tools/optimization_tools.py,sha256=P3I6lIpvZ8Xf2kX5FvvBKBmrK2pB6idBpkTzfUJxTeE,5073
|
|
31
31
|
ml_tools/path_manager.py,sha256=TJgoqMAryc5F0dal8W_zvJgE1TpOzlskIyYJk614WW4,13809
|
|
32
32
|
ml_tools/utilities.py,sha256=SVMaSDigh6SUoAeig2_sXLLIj5w5mUs5KuVWpHvFDec,19816
|
|
33
|
-
dragon_ml_toolbox-10.0.
|
|
34
|
-
dragon_ml_toolbox-10.0.0.dist-info/WHEEL,sha256=_zCd3N1l69ArxyTb8rzEoP9TpbYXkqRFSNOD5OuxnTs,91
|
|
35
|
-
dragon_ml_toolbox-10.0.0.dist-info/top_level.txt,sha256=wm-oxax3ciyez6VoO4zsFd-gSok2VipYXnbg3TH9PtU,9
|
|
36
|
-
dragon_ml_toolbox-10.0.0.dist-info/RECORD,,
|
|
33
|
+
dragon_ml_toolbox-10.0.1.dist-info/METADATA,sha256=aWKOlsr3Ru2rUeadnl_uhKNbjFTPTtYDHv4zg7kcM9c,6968
|
|
34
|
+
dragon_ml_toolbox-10.0.1.dist-info/WHEEL,sha256=_zCd3N1l69ArxyTb8rzEoP9TpbYXkqRFSNOD5OuxnTs,91
|
|
35
|
+
dragon_ml_toolbox-10.0.1.dist-info/top_level.txt,sha256=wm-oxax3ciyez6VoO4zsFd-gSok2VipYXnbg3TH9PtU,9
|
|
36
|
+
dragon_ml_toolbox-10.0.1.dist-info/RECORD,,
|
ml_tools/ETL_cleaning.py
CHANGED
|
@@ -140,7 +140,7 @@ def basic_clean(input_filepath: Union[str,Path], output_filepath: Union[str,Path
|
|
|
140
140
|
'®': '',
|
|
141
141
|
'™': '',
|
|
142
142
|
|
|
143
|
-
# Collapse repeating punctuation
|
|
143
|
+
# Collapse repeating punctuation
|
|
144
144
|
r'\.{2,}': '.', # Replace two or more dots with a single dot
|
|
145
145
|
r'\?{2,}': '?', # Replace two or more question marks with a single question mark
|
|
146
146
|
r'!{2,}': '!', # Replace two or more exclamation marks with a single one
|
|
@@ -192,7 +192,7 @@ def basic_clean(input_filepath: Union[str,Path], output_filepath: Union[str,Path
|
|
|
192
192
|
# Save cleaned dataframe
|
|
193
193
|
save_dataframe(df=df_final, save_dir=output_path.parent, filename=output_path.name)
|
|
194
194
|
|
|
195
|
-
_LOGGER.info(f"
|
|
195
|
+
_LOGGER.info(f"Data successfully cleaned.")
|
|
196
196
|
|
|
197
197
|
|
|
198
198
|
########## EXTRACT and CLEAN ##########
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|