PyPI - dragon-ml-toolbox - Versions diffs - 19.14.0__py3-none-any.whl → 20.0.0__py3-none-any.whl - Mend

dragon-ml-toolbox 19.14.0-py3-none-any.whl → 20.0.0-py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (219)

{dragon_ml_toolbox-19.14.0.dist-info → dragon_ml_toolbox-20.0.0.dist-info}/METADATA +29 -46
dragon_ml_toolbox-20.0.0.dist-info/RECORD +178 -0
ml_tools/{ETL_cleaning.py → ETL_cleaning/__init__.py} +13 -5
ml_tools/ETL_cleaning/_basic_clean.py +351 -0
ml_tools/ETL_cleaning/_clean_tools.py +128 -0
ml_tools/ETL_cleaning/_dragon_cleaner.py +245 -0
ml_tools/ETL_cleaning/_imprimir.py +13 -0
ml_tools/{ETL_engineering.py → ETL_engineering/__init__.py} +8 -4
ml_tools/ETL_engineering/_dragon_engineering.py +261 -0
ml_tools/ETL_engineering/_imprimir.py +24 -0
ml_tools/{_core/_ETL_engineering.py → ETL_engineering/_transforms.py} +14 -267
ml_tools/{_core → GUI_tools}/_GUI_tools.py +37 -40
ml_tools/{GUI_tools.py → GUI_tools/__init__.py} +7 -5
ml_tools/GUI_tools/_imprimir.py +12 -0
ml_tools/IO_tools/_IO_loggers.py +235 -0
ml_tools/IO_tools/_IO_save_load.py +151 -0
ml_tools/IO_tools/_IO_utils.py +140 -0
ml_tools/{IO_tools.py → IO_tools/__init__.py} +13 -5
ml_tools/IO_tools/_imprimir.py +14 -0
ml_tools/MICE/_MICE_imputation.py +132 -0
ml_tools/{MICE_imputation.py → MICE/__init__.py} +6 -7
ml_tools/{_core/_MICE_imputation.py → MICE/_dragon_mice.py} +243 -322
ml_tools/MICE/_imprimir.py +11 -0
ml_tools/{ML_callbacks.py → ML_callbacks/__init__.py} +12 -4
ml_tools/ML_callbacks/_base.py +101 -0
ml_tools/ML_callbacks/_checkpoint.py +232 -0
ml_tools/ML_callbacks/_early_stop.py +208 -0
ml_tools/ML_callbacks/_imprimir.py +12 -0
ml_tools/ML_callbacks/_scheduler.py +197 -0
ml_tools/{ML_chaining_utilities.py → ML_chain/__init__.py} +8 -3
ml_tools/{_core/_ML_chaining_utilities.py → ML_chain/_chaining_tools.py} +5 -129
ml_tools/ML_chain/_dragon_chain.py +140 -0
ml_tools/ML_chain/_imprimir.py +11 -0
ml_tools/ML_configuration/__init__.py +90 -0
ml_tools/ML_configuration/_base_model_config.py +69 -0
ml_tools/ML_configuration/_finalize.py +366 -0
ml_tools/ML_configuration/_imprimir.py +47 -0
ml_tools/ML_configuration/_metrics.py +593 -0
ml_tools/ML_configuration/_models.py +206 -0
ml_tools/ML_configuration/_training.py +124 -0
ml_tools/ML_datasetmaster/__init__.py +28 -0
ml_tools/ML_datasetmaster/_base_datasetmaster.py +337 -0
ml_tools/{_core/_ML_datasetmaster.py → ML_datasetmaster/_datasetmaster.py} +9 -329
ml_tools/ML_datasetmaster/_imprimir.py +15 -0
ml_tools/{_core/_ML_sequence_datasetmaster.py → ML_datasetmaster/_sequence_datasetmaster.py} +13 -15
ml_tools/{_core/_ML_vision_datasetmaster.py → ML_datasetmaster/_vision_datasetmaster.py} +63 -65
ml_tools/ML_evaluation/__init__.py +53 -0
ml_tools/ML_evaluation/_classification.py +629 -0
ml_tools/ML_evaluation/_feature_importance.py +409 -0
ml_tools/ML_evaluation/_imprimir.py +25 -0
ml_tools/ML_evaluation/_loss.py +92 -0
ml_tools/ML_evaluation/_regression.py +273 -0
ml_tools/{_core/_ML_sequence_evaluation.py → ML_evaluation/_sequence.py} +8 -11
ml_tools/{_core/_ML_vision_evaluation.py → ML_evaluation/_vision.py} +12 -17
ml_tools/{_core → ML_evaluation_captum}/_ML_evaluation_captum.py +11 -38
ml_tools/{ML_evaluation_captum.py → ML_evaluation_captum/__init__.py} +6 -4
ml_tools/ML_evaluation_captum/_imprimir.py +10 -0
ml_tools/{_core → ML_finalize_handler}/_ML_finalize_handler.py +3 -7
ml_tools/ML_finalize_handler/__init__.py +10 -0
ml_tools/ML_finalize_handler/_imprimir.py +8 -0
ml_tools/ML_inference/__init__.py +22 -0
ml_tools/ML_inference/_base_inference.py +166 -0
ml_tools/{_core/_ML_chaining_inference.py → ML_inference/_chain_inference.py} +14 -17
ml_tools/ML_inference/_dragon_inference.py +332 -0
ml_tools/ML_inference/_imprimir.py +11 -0
ml_tools/ML_inference/_multi_inference.py +180 -0
ml_tools/ML_inference_sequence/__init__.py +10 -0
ml_tools/ML_inference_sequence/_imprimir.py +8 -0
ml_tools/{_core/_ML_sequence_inference.py → ML_inference_sequence/_sequence_inference.py} +11 -15
ml_tools/ML_inference_vision/__init__.py +10 -0
ml_tools/ML_inference_vision/_imprimir.py +8 -0
ml_tools/{_core/_ML_vision_inference.py → ML_inference_vision/_vision_inference.py} +15 -19
ml_tools/ML_models/__init__.py +32 -0
ml_tools/{_core/_ML_models_advanced.py → ML_models/_advanced_models.py} +22 -18
ml_tools/ML_models/_base_mlp_attention.py +198 -0
ml_tools/{_core/_models_advanced_base.py → ML_models/_base_save_load.py} +73 -49
ml_tools/ML_models/_dragon_tabular.py +248 -0
ml_tools/ML_models/_imprimir.py +18 -0
ml_tools/ML_models/_mlp_attention.py +134 -0
ml_tools/{_core → ML_models}/_models_advanced_helpers.py +13 -13
ml_tools/ML_models_sequence/__init__.py +10 -0
ml_tools/ML_models_sequence/_imprimir.py +8 -0
ml_tools/{_core/_ML_sequence_models.py → ML_models_sequence/_sequence_models.py} +5 -8
ml_tools/ML_models_vision/__init__.py +29 -0
ml_tools/ML_models_vision/_base_wrapper.py +254 -0
ml_tools/ML_models_vision/_image_classification.py +182 -0
ml_tools/ML_models_vision/_image_segmentation.py +108 -0
ml_tools/ML_models_vision/_imprimir.py +16 -0
ml_tools/ML_models_vision/_object_detection.py +135 -0
ml_tools/ML_optimization/__init__.py +21 -0
ml_tools/ML_optimization/_imprimir.py +13 -0
ml_tools/{_core/_ML_optimization_pareto.py → ML_optimization/_multi_dragon.py} +18 -24
ml_tools/ML_optimization/_single_dragon.py +203 -0
ml_tools/{_core/_ML_optimization.py → ML_optimization/_single_manual.py} +75 -213
ml_tools/{_core → ML_scaler}/_ML_scaler.py +8 -11
ml_tools/ML_scaler/__init__.py +10 -0
ml_tools/ML_scaler/_imprimir.py +8 -0
ml_tools/ML_trainer/__init__.py +20 -0
ml_tools/ML_trainer/_base_trainer.py +297 -0
ml_tools/ML_trainer/_dragon_detection_trainer.py +402 -0
ml_tools/ML_trainer/_dragon_sequence_trainer.py +540 -0
ml_tools/ML_trainer/_dragon_trainer.py +1160 -0
ml_tools/ML_trainer/_imprimir.py +10 -0
ml_tools/{ML_utilities.py → ML_utilities/__init__.py} +14 -6
ml_tools/ML_utilities/_artifact_finder.py +382 -0
ml_tools/ML_utilities/_imprimir.py +16 -0
ml_tools/ML_utilities/_inspection.py +325 -0
ml_tools/ML_utilities/_train_tools.py +205 -0
ml_tools/{ML_vision_transformers.py → ML_vision_transformers/__init__.py} +9 -6
ml_tools/{_core/_ML_vision_transformers.py → ML_vision_transformers/_core_transforms.py} +11 -155
ml_tools/ML_vision_transformers/_imprimir.py +14 -0
ml_tools/ML_vision_transformers/_offline_augmentation.py +159 -0
ml_tools/{_core/_PSO_optimization.py → PSO_optimization/_PSO.py} +58 -15
ml_tools/{PSO_optimization.py → PSO_optimization/__init__.py} +5 -3
ml_tools/PSO_optimization/_imprimir.py +10 -0
ml_tools/SQL/__init__.py +7 -0
ml_tools/{_core/_SQL.py → SQL/_dragon_SQL.py} +7 -11
ml_tools/SQL/_imprimir.py +8 -0
ml_tools/{_core → VIF}/_VIF_factor.py +5 -8
ml_tools/{VIF_factor.py → VIF/__init__.py} +4 -2
ml_tools/VIF/_imprimir.py +10 -0
ml_tools/_core/__init__.py +7 -1
ml_tools/_core/_logger.py +8 -18
ml_tools/_core/_schema_load_ops.py +43 -0
ml_tools/_core/_script_info.py +2 -2
ml_tools/{data_exploration.py → data_exploration/__init__.py} +32 -16
ml_tools/data_exploration/_analysis.py +214 -0
ml_tools/data_exploration/_cleaning.py +566 -0
ml_tools/data_exploration/_features.py +583 -0
ml_tools/data_exploration/_imprimir.py +32 -0
ml_tools/data_exploration/_plotting.py +487 -0
ml_tools/data_exploration/_schema_ops.py +176 -0
ml_tools/{ensemble_evaluation.py → ensemble_evaluation/__init__.py} +6 -4
ml_tools/{_core → ensemble_evaluation}/_ensemble_evaluation.py +3 -7
ml_tools/ensemble_evaluation/_imprimir.py +14 -0
ml_tools/{ensemble_inference.py → ensemble_inference/__init__.py} +5 -3
ml_tools/{_core → ensemble_inference}/_ensemble_inference.py +15 -18
ml_tools/ensemble_inference/_imprimir.py +9 -0
ml_tools/{ensemble_learning.py → ensemble_learning/__init__.py} +4 -6
ml_tools/{_core → ensemble_learning}/_ensemble_learning.py +7 -10
ml_tools/ensemble_learning/_imprimir.py +10 -0
ml_tools/{excel_handler.py → excel_handler/__init__.py} +5 -3
ml_tools/{_core → excel_handler}/_excel_handler.py +6 -10
ml_tools/excel_handler/_imprimir.py +13 -0
ml_tools/{keys.py → keys/__init__.py} +4 -1
ml_tools/keys/_imprimir.py +11 -0
ml_tools/{_core → keys}/_keys.py +2 -0
ml_tools/{math_utilities.py → math_utilities/__init__.py} +5 -2
ml_tools/math_utilities/_imprimir.py +11 -0
ml_tools/{_core → math_utilities}/_math_utilities.py +1 -5
ml_tools/{optimization_tools.py → optimization_tools/__init__.py} +9 -4
ml_tools/optimization_tools/_imprimir.py +13 -0
ml_tools/optimization_tools/_optimization_bounds.py +236 -0
ml_tools/optimization_tools/_optimization_plots.py +218 -0
ml_tools/{path_manager.py → path_manager/__init__.py} +6 -3
ml_tools/{_core/_path_manager.py → path_manager/_dragonmanager.py} +11 -347
ml_tools/path_manager/_imprimir.py +15 -0
ml_tools/path_manager/_path_tools.py +346 -0
ml_tools/plot_fonts/__init__.py +8 -0
ml_tools/plot_fonts/_imprimir.py +8 -0
ml_tools/{_core → plot_fonts}/_plot_fonts.py +2 -5
ml_tools/schema/__init__.py +15 -0
ml_tools/schema/_feature_schema.py +223 -0
ml_tools/schema/_gui_schema.py +191 -0
ml_tools/schema/_imprimir.py +10 -0
ml_tools/{serde.py → serde/__init__.py} +4 -2
ml_tools/serde/_imprimir.py +10 -0
ml_tools/{_core → serde}/_serde.py +3 -8
ml_tools/{utilities.py → utilities/__init__.py} +11 -6
ml_tools/utilities/_imprimir.py +18 -0
ml_tools/{_core/_utilities.py → utilities/_utility_save_load.py} +13 -190
ml_tools/utilities/_utility_tools.py +192 -0
dragon_ml_toolbox-19.14.0.dist-info/RECORD +0 -111
ml_tools/ML_chaining_inference.py +0 -8
ml_tools/ML_configuration.py +0 -86
ml_tools/ML_configuration_pytab.py +0 -14
ml_tools/ML_datasetmaster.py +0 -10
ml_tools/ML_evaluation.py +0 -16
ml_tools/ML_evaluation_multi.py +0 -12
ml_tools/ML_finalize_handler.py +0 -8
ml_tools/ML_inference.py +0 -12
ml_tools/ML_models.py +0 -14
ml_tools/ML_models_advanced.py +0 -14
ml_tools/ML_models_pytab.py +0 -14
ml_tools/ML_optimization.py +0 -14
ml_tools/ML_optimization_pareto.py +0 -8
ml_tools/ML_scaler.py +0 -8
ml_tools/ML_sequence_datasetmaster.py +0 -8
ml_tools/ML_sequence_evaluation.py +0 -10
ml_tools/ML_sequence_inference.py +0 -8
ml_tools/ML_sequence_models.py +0 -8
ml_tools/ML_trainer.py +0 -12
ml_tools/ML_vision_datasetmaster.py +0 -12
ml_tools/ML_vision_evaluation.py +0 -10
ml_tools/ML_vision_inference.py +0 -8
ml_tools/ML_vision_models.py +0 -18
ml_tools/SQL.py +0 -8
ml_tools/_core/_ETL_cleaning.py +0 -694
ml_tools/_core/_IO_tools.py +0 -498
ml_tools/_core/_ML_callbacks.py +0 -702
ml_tools/_core/_ML_configuration.py +0 -1332
ml_tools/_core/_ML_configuration_pytab.py +0 -102
ml_tools/_core/_ML_evaluation.py +0 -867
ml_tools/_core/_ML_evaluation_multi.py +0 -544
ml_tools/_core/_ML_inference.py +0 -646
ml_tools/_core/_ML_models.py +0 -668
ml_tools/_core/_ML_models_pytab.py +0 -693
ml_tools/_core/_ML_trainer.py +0 -2323
ml_tools/_core/_ML_utilities.py +0 -886
ml_tools/_core/_ML_vision_models.py +0 -644
ml_tools/_core/_data_exploration.py +0 -1909
ml_tools/_core/_optimization_tools.py +0 -493
ml_tools/_core/_schema.py +0 -359
ml_tools/plot_fonts.py +0 -8
ml_tools/schema.py +0 -12
{dragon_ml_toolbox-19.14.0.dist-info → dragon_ml_toolbox-20.0.0.dist-info}/WHEEL +0 -0
{dragon_ml_toolbox-19.14.0.dist-info → dragon_ml_toolbox-20.0.0.dist-info}/licenses/LICENSE +0 -0
{dragon_ml_toolbox-19.14.0.dist-info → dragon_ml_toolbox-20.0.0.dist-info}/licenses/LICENSE-THIRD-PARTY.md +0 -0
{dragon_ml_toolbox-19.14.0.dist-info → dragon_ml_toolbox-20.0.0.dist-info}/top_level.txt +0 -0

ml_tools/{_core/_ETL_engineering.py → ETL_engineering/_transforms.py} RENAMED Viewed

@@ -1,22 +1,16 @@
 import polars as pl
 import re
-from pathlib import Path
-from typing import Literal, Union, Optional, Any, Callable, List, Dict, Tuple
+from typing import Literal, Union, Optional
-from ._utilities import load_dataframe, save_dataframe_filename
-from ._path_manager import make_fullpath
-from ._script_info import _script_info
-from ._logger import get_logger
 from ..constants import CHEMICAL_ELEMENT_SYMBOLS
-from ._keys import MagicWords
+from .._core import get_logger
-_LOGGER = get_logger("ETL Engineering")
+_LOGGER = get_logger("ETL Transforms")
 __all__ = [
-    "DragonTransformRecipe",
-    "DragonProcessor",
     "BinaryTransformer",
     "MultiBinaryDummifier",
     "AutoDummifier",
@@ -34,250 +28,6 @@ __all__ = [
     "MolecularFormulaTransformer"
 ]
-############ TRANSFORM MAIN ####################
-class DragonTransformRecipe:
-    """
-    A builder class for creating a data transformation recipe.
-    This class provides a structured way to define a series of transformation
-    steps, with validation performed at the time of addition. It is designed
-    to be passed to a `DragonProcessor`.
-    Use the method `add()` to add recipes.
-    """
-    def __init__(self):
-        self._steps: List[Dict[str, Any]] = []
-    def add(
-        self,
-        input_col_name: str,
-        transform: Union[str, Callable],
-        output_col_names: Optional[Union[str, List[str]]] = None
-    ) -> "DragonTransformRecipe":
-        """
-        Adds a new transformation step to the recipe.
-        Args:
-            input_col_name: The name of the column from the source DataFrame.
-            output_col_names: The desired name(s) for the output column(s).
-                        - A string for a 1-to-1 mapping.
-                        - A list of strings for a 1-to-many mapping.
-                        - A string prefix for 1-to-many mapping.
-                        - If None, the input name is used for 1-to-1 transforms,
-                          or the transformer's default names are used for 1-to-many.
-            transform: The transformation to apply:
-                - Use "rename" for simple column renaming
-                - If callable, must accept a `pl.Series` as the only parameter and return either a `pl.Series` or `pl.DataFrame`.
-        Returns:
-            The instance of the recipe itself to allow for method chaining.
-        """
-        # --- Validation ---
-        if not isinstance(input_col_name, str) or not input_col_name:
-            _LOGGER.error("'input_col' must be a non-empty string.")
-            raise TypeError()
-        if transform == MagicWords.RENAME:
-            if not isinstance(output_col_names, str):
-                _LOGGER.error("For a RENAME operation, 'output_col' must be a string.")
-                raise TypeError()
-        elif not isinstance(transform, Callable):
-            _LOGGER.error(f"'transform' must be a callable function or the string '{MagicWords.RENAME}'.")
-            raise TypeError()
-        # --- Add Step ---
-        step = {
-            "input_col": input_col_name,
-            "output_col": output_col_names,
-            "transform": transform,
-        }
-        self._steps.append(step)
-        return self  # Allow chaining: recipe.add(...).add(...)
-    def __iter__(self):
-        """Allows the class to be iterated over, like a list."""
-        return iter(self._steps)
-    def __len__(self):
-        """Allows the len() function to be used on an instance."""
-        return len(self._steps)
-class DragonProcessor:
-    """
-    Transforms a Polars DataFrame based on a provided `DragonTransformRecipe` object.
-    Use the methods `transform()` or `load_transform_save()`.
-    """
-    def __init__(self, recipe: DragonTransformRecipe):
-        """
-        Initializes the DragonProcessor with a transformation recipe.
-        Args:
-            recipe: An instance of the `DragonTransformRecipe` class that has
-                    been populated with transformation steps.
-        """
-        if not isinstance(recipe, DragonTransformRecipe):
-            _LOGGER.error("The recipe must be an instance of DragonTransformRecipe.")
-            raise TypeError()
-        if len(recipe) == 0:
-            _LOGGER.error("The recipe cannot be empty.")
-            raise ValueError()
-        self._recipe = recipe
-    def transform(self, df: pl.DataFrame) -> pl.DataFrame:
-        """
-        Applies the transformation recipe to the input DataFrame.
-        """
-        processed_columns = []
-        # Recipe object is iterable
-        for step in self._recipe:
-            input_col_name = step["input_col"]
-            output_col_spec = step["output_col"]
-            transform_action = step["transform"]
-            if input_col_name not in df.columns:
-                _LOGGER.error(f"Input column '{input_col_name}' not found in DataFrame.")
-                raise ValueError()
-            input_series = df.get_column(input_col_name)
-            if transform_action == MagicWords.RENAME:
-                processed_columns.append(input_series.alias(output_col_spec))
-                continue
-            if isinstance(transform_action, Callable):
-                result = transform_action(input_series)
-                if isinstance(result, pl.Series):
-                    # Default to input name if spec is None
-                    output_name = output_col_spec if output_col_spec is not None else input_col_name
-                    if not isinstance(output_name, str):
-                        _LOGGER.error(f"Function for '{input_col_name}' returned a Series but 'output_col' must be a string or None.")
-                        raise TypeError()
-                    processed_columns.append(result.alias(output_name))
-                elif isinstance(result, pl.DataFrame):
-                    # 1. Handle None in output names
-                    if output_col_spec is None:
-                        # Use the column names generated by the transformer directly
-                        processed_columns.extend(result.get_columns())
-                    # 2. Handle list-based renaming
-                    elif isinstance(output_col_spec, list):
-                        if len(result.columns) != len(output_col_spec):
-                            _LOGGER.error(f"Mismatch in '{input_col_name}': function produced {len(result.columns)} columns, but recipe specifies {len(output_col_spec)} output names.")
-                            raise ValueError()
-                        renamed_df = result.rename(dict(zip(result.columns, output_col_spec)))
-                        processed_columns.extend(renamed_df.get_columns())
-                    # 3. Global logic for adding a single prefix to all columns.
-                    elif isinstance(output_col_spec, str):
-                        prefix = output_col_spec
-                        new_names = {}
-                        for col in result.columns:
-                            # Case 1: Transformer's output column name contains the input name.
-                            # Action: Replace the input name with the desired prefix.
-                            # Example: input='color', output='color_red', prefix='spec' -> 'spec_red'
-                            # if input_col_name in col:
-                            if col.startswith(input_col_name):
-                                new_names[col] = col.replace(input_col_name, prefix, 1)
-                            # Case 2: Transformer's output is an independent name.
-                            # Action: Prepend the prefix to the output name.
-                            # Example: input='ratio', output='A_B', prefix='spec' -> 'spec_A_B'
-                            else:
-                                new_names[col] = f"{prefix}_{col}"
-                        renamed_df = result.rename(new_names)
-                        processed_columns.extend(renamed_df.get_columns())
-                    else:
-                        _LOGGER.error(f"Function for '{input_col_name}' returned a DataFrame, so 'output_col' must be a list of names, a string prefix, or None.")
-                        raise TypeError()
-                else:
-                    _LOGGER.error(f"Function for '{input_col_name}' returned an unexpected type: {type(result)}.")
-                    raise TypeError()
-            else: # This case is unlikely due to builder validation.
-                _LOGGER.error(f"Invalid 'transform' action for '{input_col_name}': {transform_action}")
-                raise TypeError()
-        if not processed_columns:
-            _LOGGER.error("The transformation resulted in an empty DataFrame.")
-            return pl.DataFrame()
-        _LOGGER.info(f"Processed dataframe with {len(processed_columns)} columns.")
-        return pl.DataFrame(processed_columns)
-    def load_transform_save(self, input_path: Union[str,Path], output_path: Union[str,Path]):
-        """
-        Convenience wrapper for the transform method that includes automatic dataframe loading and saving.
-        """
-        # Validate paths
-        in_path = make_fullpath(input_path, enforce="file")
-        out_path = make_fullpath(output_path, make=True, enforce="file")
-        # load df
-        df, _ = load_dataframe(df_path=in_path, kind="polars", all_strings=True)
-        # Process
-        df_processed = self.transform(df)
-        # save processed df
-        save_dataframe_filename(df=df_processed, save_dir=out_path.parent, filename=out_path.name)
-    def __str__(self) -> str:
-        """
-        Provides a detailed, human-readable string representation of the
-        entire processing pipeline.
-        """
-        header = "DragonProcessor Pipeline"
-        divider = "-" * len(header)
-        num_steps = len(self._recipe)
-        lines = [
-            header,
-            divider,
-            f"Number of steps: {num_steps}\n"
-        ]
-        if num_steps == 0:
-            lines.append("No transformation steps defined.")
-            return "\n".join(lines)
-        for i, step in enumerate(self._recipe, 1):
-            transform_action = step["transform"]
-            # Get a clean name for the transformation action
-            if transform_action == MagicWords.RENAME: # "rename"
-                transform_name = "Rename"
-            else:
-                # This works for both functions and class instances
-                transform_name = type(transform_action).__name__
-            lines.append(f"[{i}] Input: '{step['input_col']}'")
-            lines.append(f"    - Transform: {transform_name}")
-            lines.append(f"    - Output(s): {step['output_col']}")
-            if i < num_steps:
-                lines.append("") # Add a blank line between steps
-        return "\n".join(lines)
-    def inspect(self) -> None:
-        """
-        Prints the detailed string representation of the pipeline to the console.
-        """
-        print(self)
-############ TRANSFORMERS ####################
 class BinaryTransformer:
     """
@@ -285,8 +35,8 @@ class BinaryTransformer:
     """
     def __init__(
         self,
-        true_keywords: Optional[List[str]] = None,
-        false_keywords: Optional[List[str]] = None,
+        true_keywords: Optional[list[str]] = None,
+        false_keywords: Optional[list[str]] = None,
         case_insensitive: bool = True,
         use_regex: bool = False
     ):
@@ -407,7 +157,7 @@ class MultiBinaryDummifier:
     text column based on a list of keywords or regex patterns.
     """
     def __init__(self,
-                 keywords: List[str],
+                 keywords: list[str],
                  case_insensitive: bool = True,
                  use_regex: bool = False):
         """
@@ -499,8 +249,8 @@ class KeywordDummifier:
     """
     def __init__(
         self,
-        group_names: List[str],
-        group_keywords: List[List[str]],
+        group_names: list[str],
+        group_keywords: list[list[str]],
         case_insensitive: bool = True,
         use_regex: bool = False
     ):
@@ -1099,7 +849,7 @@ class CategoryMapper:
     """
     def __init__(
         self,
-        mapping: Dict[str, Union[int, float]],
+        mapping: dict[str, Union[int, float]],
         unseen_value: Optional[Union[int, float]] = None,
     ):
         if not isinstance(mapping, dict):
@@ -1160,7 +910,7 @@ class RegexMapper:
     """
     def __init__(
         self,
-        mapping: Dict[str, Union[int, float]],
+        mapping: dict[str, Union[int, float]],
         unseen_value: Optional[Union[int, float]] = None,
         case_insensitive: bool = True,
     ):
@@ -1173,7 +923,7 @@ class RegexMapper:
         # --- Process and validate patterns ---
         # Process patterns here to be more efficient, avoiding reprocessing on every __call__.
-        self.processed_mapping: List[Tuple[str, Union[int, float]]] = []
+        self.processed_mapping: list[tuple[str, Union[int, float]]] = []
         for pattern, value in mapping.items():
             final_pattern = f"(?i){pattern}" if case_insensitive else pattern
@@ -1224,7 +974,7 @@ class ValueBinner:
     """
     def __init__(
         self,
-        breaks: List[Union[int, float]],
+        breaks: list[Union[int, float]],
         left_closed: bool = False,
     ):
         """
@@ -1294,7 +1044,7 @@ class DateFeatureExtractor:
     def __init__(
         self,
-        features: List[str],
+        features: list[str],
         format: Optional[str] = None,
     ):
         """
@@ -1422,6 +1172,3 @@ class MolecularFormulaTransformer:
         return base_df.select(select_expressions)
-def info():
-    _script_info(__all__)

ml_tools/{_core → GUI_tools}/_GUI_tools.py RENAMED Viewed

@@ -3,14 +3,13 @@ from pathlib import Path
 import traceback
 import FreeSimpleGUI as sg
 from functools import wraps
-from typing import Any, Dict, Tuple, List, Literal, Union, Optional, Callable
+from typing import Any, Literal, Union, Optional, Callable
 import numpy as np
 import json
-from ._script_info import _script_info
-from ._path_manager import make_fullpath
-from ._logger import get_logger
-from ._keys import _OneHotOtherPlaceholder, SchemaKeys
+from ..path_manager import make_fullpath
+from .._core import get_logger
+from ..keys._keys import _OneHotOtherPlaceholder, SchemaKeys
 _LOGGER = get_logger("GUI Tools")
@@ -19,9 +18,9 @@ _LOGGER = get_logger("GUI Tools")
 __all__ = [
     "DragonGUIConfig",
     "DragonGUIFactory",
-    "catch_exceptions",
     "DragonFeatureMaster",
-    "DragonGUIHandler"
+    "DragonGUIHandler",
+    "catch_exceptions",
 ]
 # --- Configuration Management ---
@@ -197,7 +196,7 @@ class DragonGUIFactory:
         }
         return sg.Button(text.title(), key=key, **style_args)
-    def make_frame(self, title: str, layout: List[List[Union[sg.Element, sg.Column]]], center_layout: bool = False, **kwargs) -> sg.Frame:
+    def make_frame(self, title: str, layout: list[list[Union[sg.Element, sg.Column]]], center_layout: bool = False, **kwargs) -> sg.Frame:
         """
         Creates a styled frame around a given layout.
@@ -226,12 +225,12 @@ class DragonGUIFactory:
     # --- General-Purpose Layout Generators ---
     def generate_continuous_layout(
         self,
-        data_dict: Dict[str, Union[Tuple[Union[int,float,None], Union[int,float,None]],List[Union[int,float,None]]]],
+        data_dict: dict[str, Union[tuple[Union[int,float,None], Union[int,float,None]],list[Union[int,float,None]]]],
         is_target: bool = False,
         layout_mode: Literal["grid", "row"] = 'grid',
         number_columns: int = 5,
         center_layout: bool = True
-    ) -> List[List[sg.Column]]:
+    ) -> list[list[sg.Column]]:
         """
         Generates a layout for continuous features or targets.
@@ -292,11 +291,11 @@ class DragonGUIFactory:
     def generate_combo_layout(
         self,
-        data_dict: Dict[str, Union[List[Any],Tuple[Any,...]]],
+        data_dict: dict[str, Union[list[Any],tuple[Any,...]]],
         layout_mode: Literal["grid", "row"] = 'grid',
         number_columns: int = 5,
         center_layout: bool = True
-    ) -> List[List[sg.Column]]:
+    ) -> list[list[sg.Column]]:
         """
         Generates a layout for categorical or binary features using Combo boxes.
@@ -334,11 +333,11 @@ class DragonGUIFactory:
     def generate_multiselect_layout(
         self,
-        data_dict: Dict[str, Union[List[Any], Tuple[Any, ...]]],
+        data_dict: dict[str, Union[list[Any], tuple[Any, ...]]],
         layout_mode: Literal["grid", "row"] = 'grid',
         number_columns: int = 5,
         center_layout: bool = True
-    ) -> List[List[sg.Column]]:
+    ) -> list[list[sg.Column]]:
         """
         Generates a layout for features using Listbox elements for multiple selections.
@@ -386,7 +385,7 @@ class DragonGUIFactory:
         return self._build_grid_layout(all_feature_layouts, number_columns, bg_color, center_layout) # type: ignore
     # --- Window Creation ---
-    def create_window(self, title: str, layout: List[List[sg.Element]], **kwargs) -> sg.Window:
+    def create_window(self, title: str, layout: list[list[sg.Element]], **kwargs) -> sg.Window:
         """
         Creates and finalizes the main application window.
@@ -413,7 +412,7 @@ class DragonGUIFactory:
         return window
-    def _build_grid_layout(self, all_feature_layouts: List[sg.Column], num_columns: int, bg_color: str, center_layout: bool = True) -> List[List[sg.Column]]:
+    def _build_grid_layout(self, all_feature_layouts: list[sg.Column], num_columns: int, bg_color: str, center_layout: bool = True) -> list[list[sg.Column]]:
         """
         Private helper to distribute feature layouts vertically into a grid of columns.
         """
@@ -485,12 +484,12 @@ class DragonFeatureMaster:
     for each feature type.
     """
     def __init__(self,
-                 targets: Dict[str, str],
-                 continuous_features: Optional[Dict[str, Tuple[str, float, float]]] = None,
-                 binary_features: Optional[Dict[str, str]] = None,
-                 multi_binary_features: Optional[Dict[str, Dict[str, str]]] = None,
-                 one_hot_features: Optional[Dict[str, Dict[str, str]]] = None,
-                 categorical_features: Optional[List[Tuple[str, str, Dict[str, int]]]] = None,
+                 targets: dict[str, str],
+                 continuous_features: Optional[dict[str, tuple[str, float, float]]] = None,
+                 binary_features: Optional[dict[str, str]] = None,
+                 multi_binary_features: Optional[dict[str, dict[str, str]]] = None,
+                 one_hot_features: Optional[dict[str, dict[str, str]]] = None,
+                 categorical_features: Optional[list[tuple[str, str, dict[str, int]]]] = None,
                  add_one_hot_other_placeholder: bool = True) -> None:
         """
         Initializes the DragonFeatureMaster instance by processing feature and target definitions.
@@ -690,26 +689,26 @@ class DragonFeatureMaster:
             add_one_hot_other_placeholder=False
         )
-    def _handle_targets(self, targets: Dict[str, str]):
+    def _handle_targets(self, targets: dict[str, str]):
         # Make dictionary GUI name: range values
         gui_values: dict[str, tuple[None,None]] = {gui_key: (None, None) for gui_key in targets.keys()}
         # Map GUI name to Model name (same as input)
         return gui_values
-    def _handle_continuous_features(self, continuous_features: Dict[str, Tuple[str, float, float]]):
+    def _handle_continuous_features(self, continuous_features: dict[str, tuple[str, float, float]]):
         # Make dictionary GUI name: range values
         gui_values: dict[str, tuple[float,float]] = {gui_key: (tuple_values[1], tuple_values[2]) for gui_key, tuple_values in continuous_features.items()}
         # Map GUI name to Model name
         gui_to_model: dict[str,str] = {gui_key: tuple_values[0] for gui_key, tuple_values in continuous_features.items()}
         return gui_values, gui_to_model
-    def _handle_binary_features(self, binary_features: Dict[str, str]):
+    def _handle_binary_features(self, binary_features: dict[str, str]):
         # Make dictionary GUI name: range values
         gui_values: dict[str, tuple[Literal["False"],Literal["True"]]] = {gui_key: ("False", "True") for gui_key in binary_features.keys()}
         # Map GUI name to Model name (same as input)
         return gui_values
-    def _handle_multi_binary_features(self, multi_binary_features: Dict[str, Dict[str, str]]):
+    def _handle_multi_binary_features(self, multi_binary_features: dict[str, dict[str, str]]):
         # Make dictionary GUI name: range values
         gui_values: dict[str, tuple[str,...]] = {
             gui_key: tuple(nested_dict.keys())
@@ -717,13 +716,13 @@ class DragonFeatureMaster:
         # Map GUI name to Model name and preserve internal mapping (same as input)
         return gui_values
-    def _handle_one_hot_features(self, one_hot_features: Dict[str, Dict[str,str]]):
+    def _handle_one_hot_features(self, one_hot_features: dict[str, dict[str,str]]):
         # Make dictionary GUI name: range values
         gui_values: dict[str, tuple[str,...]] = {gui_key: tuple(nested_dict.keys()) for gui_key, nested_dict in one_hot_features.items()}
         # Map GUI name to Model name and preserve internal mapping (same as input)
         return gui_values
-    def _handle_categorical_features(self, categorical_features: List[Tuple[str, str, Dict[str, int]]]):
+    def _handle_categorical_features(self, categorical_features: list[tuple[str, str, dict[str, int]]]):
         # Make dictionary GUI name: range values
         gui_values: dict[str, tuple[str,...]] = {gui_key: tuple(gui_options.keys()) for gui_key, _, gui_options in categorical_features}
         # Map GUI name to Model name and preserve internal mapping
@@ -939,7 +938,7 @@ class DragonGUIHandler:
         # Feature master instance
         self.master = feature_handler
-    def _process_continuous(self, gui_feature: str, chosen_value: Any) -> Tuple[str,float]:
+    def _process_continuous(self, gui_feature: str, chosen_value: Any) -> tuple[str,float]:
         """
         Maps GUI name to model expected name and casts the value to float.
         """
@@ -955,7 +954,7 @@ class DragonGUIHandler:
         else:
             return model_name, float_value
-    def _process_binary(self, gui_feature: str, chosen_value: str) -> Tuple[str,int]:
+    def _process_binary(self, gui_feature: str, chosen_value: str) -> tuple[str,int]:
         """
         Maps GUI name to model expected name and casts the value to binary (0,1).
         """
@@ -996,7 +995,7 @@ class DragonGUIHandler:
             return results
-    def _process_one_hot(self, gui_feature: str, chosen_value: str) -> Dict[str,int]:
+    def _process_one_hot(self, gui_feature: str, chosen_value: str) -> dict[str,int]:
         """
         Maps GUI names to model expected names and casts values to one-hot encoding.
         """
@@ -1019,7 +1018,7 @@ class DragonGUIHandler:
             return results
-    def _process_categorical(self, gui_feature: str, chosen_value: str) -> Tuple[str,int]:
+    def _process_categorical(self, gui_feature: str, chosen_value: str) -> tuple[str,int]:
         """
         Maps GUI name to model expected name and casts the value to a categorical number.
         """
@@ -1034,7 +1033,7 @@ class DragonGUIHandler:
             result = categorical_mapping[chosen_value]
             return model_name, result
-    def update_target_fields(self, window: sg.Window, inference_results: Dict[str, Any]):
+    def update_target_fields(self, window: sg.Window, inference_results: dict[str, Any]):
         """
         Updates the GUI's target fields with inference results.
@@ -1051,8 +1050,8 @@ class DragonGUIHandler:
             display_value = f"{result:.2f}" if isinstance(result, (int, float)) else result
             window[gui_key].update(display_value) # type: ignore
-    def _call_subprocess(self, window_values: Dict[str,Any], master_feature: Dict[str,str], processor: Callable) -> Dict[str, Union[float,int]]:
-        processed_features_subset: Dict[str, Union[float,int]] = dict()
+    def _call_subprocess(self, window_values: dict[str,Any], master_feature: dict[str,str], processor: Callable) -> dict[str, Union[float,int]]:
+        processed_features_subset: dict[str, Union[float,int]] = dict()
         for gui_name in master_feature.keys():
             chosen_value = window_values.get(gui_name)
@@ -1071,12 +1070,12 @@ class DragonGUIHandler:
         return processed_features_subset
-    def process_features(self,  window_values: Dict[str, Any]) -> np.ndarray:
+    def process_features(self,  window_values: dict[str, Any]) -> np.ndarray:
         """
         Translates GUI values to a model-expected input array, returning a 1D numpy array.
         """
         # Stage 1: Process GUI inputs into a dictionary
-        processed_features: Dict[str, Union[float,int]] = {}
+        processed_features: dict[str, Union[float,int]] = {}
         if self.master.has_continuous:
             processed_subset = self._call_subprocess(window_values=window_values,
@@ -1109,7 +1108,7 @@ class DragonGUIHandler:
             processed_features.update(processed_subset)
         # Stage 2: Assemble the final vector using the model's required order
-        final_vector: List[float] = list()
+        final_vector: list[float] = list()
         try:
             for feature_name in self.model_expected_features:
@@ -1119,5 +1118,3 @@ class DragonGUIHandler:
         return np.array(final_vector, dtype=np.float32)
-def info():
-    _script_info(__all__)

ml_tools/{GUI_tools.py → GUI_tools/__init__.py} RENAMED Viewed

@@ -1,16 +1,18 @@
-from ._core._GUI_tools import (
+from ._GUI_tools import (
     DragonGUIConfig,
     DragonGUIFactory,
-    catch_exceptions,
     DragonFeatureMaster,
     DragonGUIHandler,
-    info
+    catch_exceptions,
 )
+from ._imprimir import info
 __all__ = [
     "DragonGUIConfig",
     "DragonGUIFactory",
-    "catch_exceptions",
     "DragonFeatureMaster",
-    "DragonGUIHandler"
+    "DragonGUIHandler",
+    "catch_exceptions",
 ]

ml_tools/GUI_tools/_imprimir.py ADDED Viewed

@@ -0,0 +1,12 @@
+from .._core import _imprimir_disponibles
+_GRUPOS = [
+    "DragonGUIConfig",
+    "DragonGUIFactory",
+    "DragonFeatureMaster",
+    "DragonGUIHandler",
+    "catch_exceptions"
+]
+def info():
+    _imprimir_disponibles(_GRUPOS)

dragon-ml-toolbox 19.14.0__py3-none-any.whl → 20.0.0__py3-none-any.whl

dragon-ml-toolbox 19.14.0__py3-none-any.whl → 20.0.0__py3-none-any.whl