rgwfuncs 0.0.13__py3-none-any.whl → 0.0.15__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
rgwfuncs/df_lib.py CHANGED
@@ -1614,7 +1614,6 @@ def mask_against_dataframe_converse(df: pd.DataFrame, other_df: pd.DataFrame, co
1614
1614
 
1615
1615
  return df[~df[column_name].isin(other_df[column_name])]
1616
1616
 
1617
-
1618
1617
  def union_join(df1: pd.DataFrame, df2: pd.DataFrame) -> pd.DataFrame:
1619
1618
  """
1620
1619
  Perform a union join, concatenating the two DataFrames and dropping duplicates.
@@ -1633,19 +1632,19 @@ def union_join(df1: pd.DataFrame, df2: pd.DataFrame) -> pd.DataFrame:
1633
1632
  # print("Initial df1 columns:", df1.columns)
1634
1633
  # print("Initial df2 columns:", df2.columns)
1635
1634
 
1636
- # Standardize columns by adding missing columns filled with NaN
1635
+ # Standardize columns by adding missing columns filled with empty strings
1637
1636
  for col in df2.columns:
1638
1637
  if col not in df1:
1639
- df1[col] = pd.NA
1638
+ df1[col] = ""
1640
1639
 
1641
1640
  for col in df1.columns:
1642
1641
  if col not in df2:
1643
- df2[col] = pd.NA
1642
+ df2[col] = ""
1644
1643
 
1645
1644
  # print("Standardized df1 columns:", df1.columns)
1646
1645
  # print("Standardized df2 columns:", df2.columns)
1647
1646
 
1648
- # Check if columns match now
1647
+ # Ensure they have the same columns after standardizing
1649
1648
  if set(df1.columns) != set(df2.columns):
1650
1649
  raise ValueError("Both DataFrames must have the same columns after standardizing columns")
1651
1650
 
@@ -1653,7 +1652,6 @@ def union_join(df1: pd.DataFrame, df2: pd.DataFrame) -> pd.DataFrame:
1653
1652
  result_df = pd.concat([df1, df2], ignore_index=True).drop_duplicates()
1654
1653
  return result_df
1655
1654
 
1656
-
1657
1655
  def bag_union_join(df1: pd.DataFrame, df2: pd.DataFrame) -> pd.DataFrame:
1658
1656
  """
1659
1657
  Perform a bag union join, concatenating the two DataFrames without dropping duplicates.
@@ -1672,14 +1670,14 @@ def bag_union_join(df1: pd.DataFrame, df2: pd.DataFrame) -> pd.DataFrame:
1672
1670
  # print("Initial df1 columns:", df1.columns)
1673
1671
  # print("Initial df2 columns:", df2.columns)
1674
1672
 
1675
- # Standardize columns by adding missing columns filled with NaN
1673
+ # Standardize columns by adding missing columns filled with empty strings
1676
1674
  for col in df2.columns:
1677
1675
  if col not in df1:
1678
- df1[col] = pd.NA
1676
+ df1[col] = ""
1679
1677
 
1680
1678
  for col in df1.columns:
1681
1679
  if col not in df2:
1682
- df2[col] = pd.NA
1680
+ df2[col] = ""
1683
1681
 
1684
1682
  # print("Standardized df1 columns:", df1.columns)
1685
1683
  # print("Standardized df2 columns:", df2.columns)
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.2
2
2
  Name: rgwfuncs
3
- Version: 0.0.13
3
+ Version: 0.0.15
4
4
  Summary: A functional programming paradigm for mathematical modelling and data science
5
5
  Home-page: https://github.com/ryangerardwilson/rgwfunc
6
6
  Author: Ryan Gerard Wilson
@@ -0,0 +1,8 @@
1
+ rgwfuncs/__init__.py,sha256=BP8Nh8ivyCCz8Ga-21JW3NWInJFOElKoIfRuioJRWbA,1076
2
+ rgwfuncs/df_lib.py,sha256=VtCoaxx-ft864ChNZA3YEmvC8muVhFePqJX-j-zCzi0,64110
3
+ rgwfuncs-0.0.15.dist-info/LICENSE,sha256=7EI8xVBu6h_7_JlVw-yPhhOZlpY9hP8wal7kHtqKT_E,1074
4
+ rgwfuncs-0.0.15.dist-info/METADATA,sha256=ULUa8AcemlFS6tmNsG_Oxxvk2USzEsclQgznEC3QKNQ,32059
5
+ rgwfuncs-0.0.15.dist-info/WHEEL,sha256=In9FTNxeP60KnTkGw7wk6mJPYd_dQSjEZmXdBdMCI-8,91
6
+ rgwfuncs-0.0.15.dist-info/entry_points.txt,sha256=j-c5IOPIQ0252EaOV6j6STio56sbXl2C4ym_fQ0lXx0,43
7
+ rgwfuncs-0.0.15.dist-info/top_level.txt,sha256=aGuVIzWsKiV1f2gCb6mynx0zx5ma0B1EwPGFKVEMTi4,9
8
+ rgwfuncs-0.0.15.dist-info/RECORD,,
@@ -1,8 +0,0 @@
1
- rgwfuncs/__init__.py,sha256=BP8Nh8ivyCCz8Ga-21JW3NWInJFOElKoIfRuioJRWbA,1076
2
- rgwfuncs/df_lib.py,sha256=2JU1Z0wjBrpcmLuJgY6-Bi1OFXHyNk1XeRGESkDI934,64077
3
- rgwfuncs-0.0.13.dist-info/LICENSE,sha256=7EI8xVBu6h_7_JlVw-yPhhOZlpY9hP8wal7kHtqKT_E,1074
4
- rgwfuncs-0.0.13.dist-info/METADATA,sha256=TZoSn8ANcHG2IOAW1SwNbu3ZnPKxdWbKzoCAXLTB06w,32059
5
- rgwfuncs-0.0.13.dist-info/WHEEL,sha256=In9FTNxeP60KnTkGw7wk6mJPYd_dQSjEZmXdBdMCI-8,91
6
- rgwfuncs-0.0.13.dist-info/entry_points.txt,sha256=j-c5IOPIQ0252EaOV6j6STio56sbXl2C4ym_fQ0lXx0,43
7
- rgwfuncs-0.0.13.dist-info/top_level.txt,sha256=aGuVIzWsKiV1f2gCb6mynx0zx5ma0B1EwPGFKVEMTi4,9
8
- rgwfuncs-0.0.13.dist-info/RECORD,,