PyPI - imsciences - Versions diffs - 0.6.1.9__py3-none-any.whl → 0.6.2.1__py3-none-any.whl - Mend

imsciences 0.6.1.9__py3-none-any.whl → 0.6.2.1__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (5) hide show

imsciences/datafunctions.py CHANGED Viewed

@@ -1431,40 +1431,37 @@ class dataprocessing:
         return df
-    def apply_lookup_table_based_on_substring(df, column_name, category_dict, new_col_name='Category', other_label='Other'):
+    def apply_lookup_table_based_on_substring(self, df, column_name, category_dict, new_col_name='Category', other_label='Other'):
         """
         Categorizes text in a specified DataFrame column by applying a lookup table based on substrings.
-        Parameters:
-        - df (pd.DataFrame): The DataFrame containing the column to categorize.
-        - column_name (str): The name of the column in the DataFrame that contains the text data to categorize.
-        - category_dict (dict): A dictionary where keys are substrings to search for in the text and values are
-            the categories to assign when a substring is found.
-        - new_col_name (str): The name of the new column to be created in the DataFrame, which will hold the
-            resulting categories. Default is 'Category'.
+        Args:
+        df (pd.DataFrame): The DataFrame containing the column to categorize.
+        column_name (str): The name of the column in the DataFrame that contains the text data to categorize.
+        category_dict (dict): A dictionary where keys are substrings to search for in the text and values are the categories to assign when a substring is found.
+        new_col_name (str, optional): The name of the new column to be created in the DataFrame, which will hold the resulting categories. Default is 'Category'.
+        other_label (str, optional): The category assigned when no substring from the dictionary is found in the cell. Default is 'Other'.
         Returns:
-        - pd.DataFrame: The original DataFrame with an additional column containing the assigned categories.
+        pd.DataFrame: The original DataFrame with an additional column containing the assigned categories.
         """
-        def categorize_text(text, category_dict):
+        def categorize_text(text):
             """
             Assigns a category to a single text string based on the presence of substrings from a dictionary.
-            Parameters:
-            - text (str): The text string to categorize.
-            - category_dict (dict): A dictionary where keys are substrings to search for in the text and
-            values are the categories to assign if a substring is found.
+            Args:
+            text (str): The text string to categorize.
             Returns:
-            - str: The category assigned based on the first matching substring found in the text. If no
-            matching substring is found, returns 'Full Funnel'.
+            str: The category assigned based on the first matching substring found in the text. If no
+            matching substring is found, returns other_label.
             """
             for key, category in category_dict.items():
                 if key.lower() in text.lower():  # Check if the substring is in the text (case-insensitive)
                     return category
             return other_label  # Default category if no match is found
         # Apply the categorize_text function to each element in the specified column
         df[new_col_name] = df[column_name].apply(categorize_text)
         return df

{imsciences-0.6.1.9.dist-info → imsciences-0.6.2.1.dist-info}/METADATA RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.1
 Name: imsciences
-Version: 0.6.1.9
+Version: 0.6.2.1
 Summary: IMS Data Processing Package
 Author: IMS
 Author-email: cam@im-sciences.com

{imsciences-0.6.1.9.dist-info → imsciences-0.6.2.1.dist-info}/RECORD RENAMED Viewed

@@ -2,13 +2,13 @@ dataprocessing/__init__.py,sha256=quSwsLs6IuLoA5Rzi0ZD40xZaQudwDteF7_ai9JfTPk,32
 dataprocessing/data-processing-functions.py,sha256=vE1vsZ8xOSbR9Bwlp9SWXwEHXQ0nFydwGkvzHXf2f1Y,41
 dataprocessing/datafunctions.py,sha256=vE1vsZ8xOSbR9Bwlp9SWXwEHXQ0nFydwGkvzHXf2f1Y,41
 imsciences/__init__.py,sha256=GIPbLmWc06sVcOySWwNvMNUr6XGOHqPLryFIWgtpHh8,78
-imsciences/datafunctions.py,sha256=6cBVui4HOCg-ATpnyAQ4BTdRpKr5aJxLbdK9LXy08Xs,139764
+imsciences/datafunctions.py,sha256=zI_vhjBQfa4Lef2NucUViYAJFenEB2RlJ1rnXIIBG5Y,139645
 imsciences/datapull.py,sha256=TPY0LDgOkcKTBk8OekbD0Grg5x0SomAK2dZ7MuT6X1E,19000
 imsciencesdataprocessing/__init__.py,sha256=quSwsLs6IuLoA5Rzi0ZD40xZaQudwDteF7_ai9JfTPk,32
 imsciencesdataprocessing/datafunctions.py,sha256=vE1vsZ8xOSbR9Bwlp9SWXwEHXQ0nFydwGkvzHXf2f1Y,41
 imsdataprocessing/__init__.py,sha256=quSwsLs6IuLoA5Rzi0ZD40xZaQudwDteF7_ai9JfTPk,32
 imsdataprocessing/datafunctions.py,sha256=vE1vsZ8xOSbR9Bwlp9SWXwEHXQ0nFydwGkvzHXf2f1Y,41
-imsciences-0.6.1.9.dist-info/METADATA,sha256=Gl-LWNhdZdav1qd0CYbd6AxI-WbuQ35xvZ-fu-Y02CE,854
-imsciences-0.6.1.9.dist-info/WHEEL,sha256=GJ7t_kWBFywbagK5eo9IoUwLW6oyOeTKmQ-9iHFVNxQ,92
-imsciences-0.6.1.9.dist-info/top_level.txt,sha256=hsENS-AlDVRh8tQJ6-426iUQlla9bPcGc0-UlFF0_iU,11
-imsciences-0.6.1.9.dist-info/RECORD,,
+imsciences-0.6.2.1.dist-info/METADATA,sha256=4p9HLTYPZbsBAkr2dzC1dvvQL-GWZsjTrNXEKGb_5hc,854
+imsciences-0.6.2.1.dist-info/WHEEL,sha256=GJ7t_kWBFywbagK5eo9IoUwLW6oyOeTKmQ-9iHFVNxQ,92
+imsciences-0.6.2.1.dist-info/top_level.txt,sha256=hsENS-AlDVRh8tQJ6-426iUQlla9bPcGc0-UlFF0_iU,11
+imsciences-0.6.2.1.dist-info/RECORD,,

{imsciences-0.6.1.9.dist-info → imsciences-0.6.2.1.dist-info}/WHEEL RENAMED Viewed

File without changes

{imsciences-0.6.1.9.dist-info → imsciences-0.6.2.1.dist-info}/top_level.txt RENAMED Viewed

File without changes

imsciences 0.6.1.9__py3-none-any.whl → 0.6.2.1__py3-none-any.whl

imsciences 0.6.1.9__py3-none-any.whl → 0.6.2.1__py3-none-any.whl