PyPI - rgwfuncs - Versions diffs - 0.0.9__tar.gz → 0.0.11__tar.gz - Mend

rgwfuncs 0.0.9 (tar.gz) → 0.0.11 (tar.gz)

This diff compares the contents of publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.

Files changed (13) hide show

{rgwfuncs-0.0.9/src/rgwfuncs.egg-info → rgwfuncs-0.0.11}/PKG-INFO RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.2
 Name: rgwfuncs
-Version: 0.0.9
+Version: 0.0.11
 Summary: A functional programming paradigm for mathematical modelling and data science
 Home-page: https://github.com/ryangerardwilson/rgwfunc
 Author: Ryan Gerard Wilson

{rgwfuncs-0.0.9 → rgwfuncs-0.0.11}/pyproject.toml RENAMED Viewed

@@ -4,7 +4,7 @@ build-backend = "setuptools.build_meta"
 [project]
 name = "rgwfuncs"
-version = "0.0.9"
+version = "0.0.11"
 authors = [
   { name = "Ryan Gerard Wilson", email = "ryangerardwilson@gmail.com" },
 ]

{rgwfuncs-0.0.9 → rgwfuncs-0.0.11}/setup.cfg RENAMED Viewed

@@ -1,6 +1,6 @@
 [metadata]
 name = rgwfuncs
-version = 0.0.9
+version = 0.0.11
 author = Ryan Gerard Wilson
 author_email = ryangerardwilson@gmail.com
 description = A functional programming paradigm for mathematical modelling and data science

{rgwfuncs-0.0.9 → rgwfuncs-0.0.11}/src/rgwfuncs/df_lib.py RENAMED Viewed

@@ -1631,10 +1631,27 @@ def union_join(df1: pd.DataFrame, df2: pd.DataFrame) -> pd.DataFrame:
     if set(df1.columns) != set(df2.columns):
         raise ValueError("Both DataFrames must have the same columns for a union join")
-    result_df = pd.concat([df1, df2], ignore_index=True).drop_duplicates()
+    # Inspect initial columns
+    print("Initial df1 columns:", df1.columns)
+    print("Initial df2 columns:", df2.columns)
+    # Drop all-NA columns, if any
+    df1_clean = df1.dropna(axis=1, how='all')
+    df2_clean = df2.dropna(axis=1, how='all')
+    # Inspect resulting columns after dropping all-NA columns
+    print("Cleaned df1 columns:", df1_clean.columns)
+    print("Cleaned df2 columns:", df2_clean.columns)
+    # Ensure they still have the same columns after dropping all-NA columns
+    if set(df1_clean.columns) != set(df2_clean.columns):
+        raise ValueError("Both DataFrames must have the same columns after dropping all-NA columns")
+    result_df = pd.concat([df1_clean, df2_clean], ignore_index=True).drop_duplicates()
     return result_df
 def bag_union_join(df1: pd.DataFrame, df2: pd.DataFrame) -> pd.DataFrame:
     """
     Perform a bag union join, concatenating the two DataFrames without dropping duplicates.
@@ -1652,7 +1669,15 @@ def bag_union_join(df1: pd.DataFrame, df2: pd.DataFrame) -> pd.DataFrame:
     if set(df1.columns) != set(df2.columns):
         raise ValueError("Both DataFrames must have the same columns for a bag union join")
-    result_df = pd.concat([df1, df2], ignore_index=True)
+    # Drop all-NA columns, if any
+    df1_clean = df1.dropna(axis=1, how='all')
+    df2_clean = df2.dropna(axis=1, how='all')
+    # Ensure they still have the same columns after dropping all-NA columns
+    if set(df1_clean.columns) != set(df2_clean.columns):
+        raise ValueError("Both DataFrames must have the same columns after dropping all-NA columns")
+    result_df = pd.concat([df1_clean, df2_clean], ignore_index=True)
     return result_df

{rgwfuncs-0.0.9 → rgwfuncs-0.0.11/src/rgwfuncs.egg-info}/PKG-INFO RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.2
 Name: rgwfuncs
-Version: 0.0.9
+Version: 0.0.11
 Summary: A functional programming paradigm for mathematical modelling and data science
 Home-page: https://github.com/ryangerardwilson/rgwfunc
 Author: Ryan Gerard Wilson