dragon-ml-toolbox 10.12.0__py3-none-any.whl → 10.12.1__py3-none-any.whl
This diff shows the contents of publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.
Potentially problematic release.
This version of dragon-ml-toolbox might be problematic. Click here for more details.
- {dragon_ml_toolbox-10.12.0.dist-info → dragon_ml_toolbox-10.12.1.dist-info}/METADATA +1 -1
- {dragon_ml_toolbox-10.12.0.dist-info → dragon_ml_toolbox-10.12.1.dist-info}/RECORD +7 -7
- ml_tools/ETL_cleaning.py +5 -3
- {dragon_ml_toolbox-10.12.0.dist-info → dragon_ml_toolbox-10.12.1.dist-info}/WHEEL +0 -0
- {dragon_ml_toolbox-10.12.0.dist-info → dragon_ml_toolbox-10.12.1.dist-info}/licenses/LICENSE +0 -0
- {dragon_ml_toolbox-10.12.0.dist-info → dragon_ml_toolbox-10.12.1.dist-info}/licenses/LICENSE-THIRD-PARTY.md +0 -0
- {dragon_ml_toolbox-10.12.0.dist-info → dragon_ml_toolbox-10.12.1.dist-info}/top_level.txt +0 -0
|
@@ -1,6 +1,6 @@
|
|
|
1
|
-
dragon_ml_toolbox-10.12.
|
|
2
|
-
dragon_ml_toolbox-10.12.
|
|
3
|
-
ml_tools/ETL_cleaning.py,sha256=
|
|
1
|
+
dragon_ml_toolbox-10.12.1.dist-info/licenses/LICENSE,sha256=2uUFNy7D0TLgHim1K5s3DIJ4q_KvxEXVilnU20cWliY,1066
|
|
2
|
+
dragon_ml_toolbox-10.12.1.dist-info/licenses/LICENSE-THIRD-PARTY.md,sha256=lY4_rJPnLnMu7YBQaY-_iz1JRDcLdQzNCyeLAF1glJY,1837
|
|
3
|
+
ml_tools/ETL_cleaning.py,sha256=mkbcSTBspGWnHQUAj6hNqJdZ4VXLPFNk1qEY-8rmnZ8,19368
|
|
4
4
|
ml_tools/ETL_engineering.py,sha256=a6KCWH6kRatZtjaFEF_o917ApPMK5_vRD-BjfCDAl-E,49400
|
|
5
5
|
ml_tools/GUI_tools.py,sha256=kEQWg-bog3pB5tI22gMGKWaCGHnz9TB2Lvvfhf5F2CI,45412
|
|
6
6
|
ml_tools/MICE_imputation.py,sha256=kVSythWfxJFR4-2mtcYCWQaQ1Oz5yyx_SJu5gjnS7H8,11670
|
|
@@ -30,7 +30,7 @@ ml_tools/keys.py,sha256=FDpbS3Jb0pjrVvvp2_8nZi919mbob_-xwuy5OOtKM_A,1848
|
|
|
30
30
|
ml_tools/optimization_tools.py,sha256=P3I6lIpvZ8Xf2kX5FvvBKBmrK2pB6idBpkTzfUJxTeE,5073
|
|
31
31
|
ml_tools/path_manager.py,sha256=ke0MYOhYheRPX599GUbrvRsYHn2JKUmMDldS5LP6LQA,18431
|
|
32
32
|
ml_tools/utilities.py,sha256=uheMUjQJ1zI69gASsE-mCq4KlRPVGgrgqson02rGNYM,30755
|
|
33
|
-
dragon_ml_toolbox-10.12.
|
|
34
|
-
dragon_ml_toolbox-10.12.
|
|
35
|
-
dragon_ml_toolbox-10.12.
|
|
36
|
-
dragon_ml_toolbox-10.12.
|
|
33
|
+
dragon_ml_toolbox-10.12.1.dist-info/METADATA,sha256=UIbMyYOgyuJjl1XBoVwWEYg_P-FQQJJmuLsrRNz4Mb4,6969
|
|
34
|
+
dragon_ml_toolbox-10.12.1.dist-info/WHEEL,sha256=_zCd3N1l69ArxyTb8rzEoP9TpbYXkqRFSNOD5OuxnTs,91
|
|
35
|
+
dragon_ml_toolbox-10.12.1.dist-info/top_level.txt,sha256=wm-oxax3ciyez6VoO4zsFd-gSok2VipYXnbg3TH9PtU,9
|
|
36
|
+
dragon_ml_toolbox-10.12.1.dist-info/RECORD,,
|
ml_tools/ETL_cleaning.py
CHANGED
|
@@ -142,8 +142,8 @@ def _cleaner_core(df_in: pl.DataFrame) -> pl.DataFrame:
|
|
|
142
142
|
r'[°˚]': '',
|
|
143
143
|
|
|
144
144
|
# Replace special characters in entries
|
|
145
|
-
r'\\': '
|
|
146
|
-
'/': '
|
|
145
|
+
r'\\': '_',
|
|
146
|
+
# '/': '_', # keep forward slash
|
|
147
147
|
|
|
148
148
|
# Typographical standardization
|
|
149
149
|
# Unify various dashes and hyphens to a standard hyphen
|
|
@@ -157,6 +157,8 @@ def _cleaner_core(df_in: pl.DataFrame) -> pl.DataFrame:
|
|
|
157
157
|
r'\.{2,}': '.', # Replace two or more dots with a single dot
|
|
158
158
|
r'\?{2,}': '?', # Replace two or more question marks with a single question mark
|
|
159
159
|
r'!{2,}': '!', # Replace two or more exclamation marks with a single one
|
|
160
|
+
r';{2,}': ';',
|
|
161
|
+
r'-{2,}': '-',
|
|
160
162
|
|
|
161
163
|
# 2. Internal Whitespace Consolidation
|
|
162
164
|
# Collapse any sequence of whitespace chars (including non-breaking spaces) to a single space
|
|
@@ -168,7 +170,7 @@ def _cleaner_core(df_in: pl.DataFrame) -> pl.DataFrame:
|
|
|
168
170
|
|
|
169
171
|
# 4. Textual Null Standardization (New Step)
|
|
170
172
|
# Convert common null-like text to actual nulls.
|
|
171
|
-
r'^(N/A|无|NA|NULL|NONE|NIL
|
|
173
|
+
r'^(N/A|无|NA|NULL|NONE|NIL|-|\.|;)$': None,
|
|
172
174
|
|
|
173
175
|
# 5. Final Nullification of Empty Strings
|
|
174
176
|
# After all cleaning, if a string is now empty, convert it to a null
|
|
File without changes
|
{dragon_ml_toolbox-10.12.0.dist-info → dragon_ml_toolbox-10.12.1.dist-info}/licenses/LICENSE
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|