dragon-ml-toolbox 14.3.1__py3-none-any.whl → 16.0.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (44)
  1. {dragon_ml_toolbox-14.3.1.dist-info → dragon_ml_toolbox-16.0.0.dist-info}/METADATA +10 -5
  2. dragon_ml_toolbox-16.0.0.dist-info/RECORD +51 -0
  3. ml_tools/ETL_cleaning.py +20 -20
  4. ml_tools/ETL_engineering.py +23 -25
  5. ml_tools/GUI_tools.py +20 -20
  6. ml_tools/MICE_imputation.py +3 -3
  7. ml_tools/ML_callbacks.py +43 -26
  8. ml_tools/ML_configuration.py +309 -0
  9. ml_tools/ML_datasetmaster.py +220 -260
  10. ml_tools/ML_evaluation.py +317 -81
  11. ml_tools/ML_evaluation_multi.py +127 -36
  12. ml_tools/ML_inference.py +249 -207
  13. ml_tools/ML_models.py +13 -102
  14. ml_tools/ML_models_advanced.py +1 -1
  15. ml_tools/ML_optimization.py +12 -12
  16. ml_tools/ML_scaler.py +11 -11
  17. ml_tools/ML_sequence_datasetmaster.py +341 -0
  18. ml_tools/ML_sequence_evaluation.py +215 -0
  19. ml_tools/ML_sequence_inference.py +391 -0
  20. ml_tools/ML_sequence_models.py +139 -0
  21. ml_tools/ML_trainer.py +1247 -338
  22. ml_tools/ML_utilities.py +51 -2
  23. ml_tools/ML_vision_datasetmaster.py +262 -118
  24. ml_tools/ML_vision_evaluation.py +26 -6
  25. ml_tools/ML_vision_inference.py +117 -140
  26. ml_tools/ML_vision_models.py +15 -1
  27. ml_tools/ML_vision_transformers.py +233 -7
  28. ml_tools/PSO_optimization.py +6 -6
  29. ml_tools/SQL.py +4 -4
  30. ml_tools/{keys.py → _keys.py} +45 -1
  31. ml_tools/_schema.py +1 -1
  32. ml_tools/ensemble_evaluation.py +54 -11
  33. ml_tools/ensemble_inference.py +7 -33
  34. ml_tools/ensemble_learning.py +1 -1
  35. ml_tools/optimization_tools.py +2 -2
  36. ml_tools/path_manager.py +5 -5
  37. ml_tools/utilities.py +1 -2
  38. dragon_ml_toolbox-14.3.1.dist-info/RECORD +0 -48
  39. ml_tools/RNN_forecast.py +0 -56
  40. ml_tools/_ML_vision_recipe.py +0 -88
  41. {dragon_ml_toolbox-14.3.1.dist-info → dragon_ml_toolbox-16.0.0.dist-info}/WHEEL +0 -0
  42. {dragon_ml_toolbox-14.3.1.dist-info → dragon_ml_toolbox-16.0.0.dist-info}/licenses/LICENSE +0 -0
  43. {dragon_ml_toolbox-14.3.1.dist-info → dragon_ml_toolbox-16.0.0.dist-info}/licenses/LICENSE-THIRD-PARTY.md +0 -0
  44. {dragon_ml_toolbox-14.3.1.dist-info → dragon_ml_toolbox-16.0.0.dist-info}/top_level.txt +0 -0
@@ -18,7 +18,8 @@ from torchmetrics.detection import MeanAveragePrecision
  from .path_manager import make_fullpath
  from ._logger import _LOGGER
  from ._script_info import _script_info
- from .keys import VisionKeys
+ from ._keys import VisionKeys
+ from .ML_configuration import SegmentationMetricsFormat


  __all__ = [
@@ -26,12 +27,15 @@ __all__ = [
  "object_detection_metrics"
  ]

+ DPI_value = 250
+

  def segmentation_metrics(
  y_true: np.ndarray,
  y_pred: np.ndarray,
  save_dir: Union[str, Path],
- class_names: Optional[List[str]] = None
+ class_names: Optional[List[str]] = None,
+ config: Optional[SegmentationMetricsFormat] = None # Add config object
  ):
  """
  Calculates and saves pixel-level metrics for segmentation tasks.
@@ -48,9 +52,18 @@ def segmentation_metrics(
  y_pred (np.ndarray): Predicted masks (e.g., shape [N, H, W]).
  save_dir (str | Path): Directory to save the metrics report and plots.
  class_names (List[str] | None): Names of the classes for the report.
+ config (SegmentationMetricsFormat, optional): Formatting configuration object.
  """
  save_dir_path = make_fullpath(save_dir, make=True, enforce="directory")

+ # --- Parse Config or use defaults ---
+ if config is None:
+ config = SegmentationMetricsFormat()
+
+ # --- Set Matplotlib font size ---
+ original_rc_params = plt.rcParams.copy()
+ plt.rcParams.update({'font.size': config.font_size})
+
  # Get all unique class labels present in either true or pred
  labels = np.unique(np.concatenate((np.unique(y_true), np.unique(y_pred)))).astype(int)

@@ -110,7 +123,7 @@
  report_lines.append(per_class_df.to_string(index=False, float_format="%.4f"))

  report_string = "\n".join(report_lines)
- print(report_string)
+ # print(report_string) # <-- I removed the print(report_string)

  # Save text report
  save_filename = VisionKeys.SEGMENTATION_REPORT + ".txt"
@@ -120,11 +133,11 @@

  # --- 3. Save Per-Class Metrics Heatmap ---
  try:
- plt.figure(figsize=(max(8, len(labels) * 0.5), 6), dpi=100)
+ plt.figure(figsize=(max(8, len(labels) * 0.5), 6), dpi=DPI_value)
  sns.heatmap(
  per_class_df.set_index('Class').T,
  annot=True,
- cmap='viridis',
+ cmap=config.heatmap_cmap, # Use config cmap
  fmt='.3f',
  linewidths=0.5
  )
@@ -149,7 +162,11 @@
  confusion_matrix=cm,
  display_labels=display_names
  )
- disp.plot(cmap='Blues', ax=ax_cm, xticks_rotation=45)
+ disp.plot(cmap=config.cm_cmap, ax=ax_cm, xticks_rotation=45) # Use config cmap
+
+ # Manually update font size of cell texts
+ for text in disp.text_.flatten(): # type: ignore
+ text.set_fontsize(config.font_size)

  ax_cm.set_title("Pixel-Level Confusion Matrix")
  plt.tight_layout()
@@ -160,6 +177,9 @@
  plt.close(fig_cm)
  except Exception as e:
  _LOGGER.error(f"Could not generate confusion matrix: {e}")
+
+ # --- Restore RC params ---
+ plt.rcParams.update(original_rc_params)


  def object_detection_metrics(
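For orientation, here is a hedged usage sketch of the reworked segmentation_metrics signature. The parameter names and the config fields (font_size, heatmap_cmap, cm_cmap) come from the hunks above; the keyword-argument constructor of SegmentationMetricsFormat and the absolute ml_tools import paths are assumptions.

import numpy as np
from ml_tools.ML_configuration import SegmentationMetricsFormat
from ml_tools.ML_vision_evaluation import segmentation_metrics

# Dummy multiclass masks: 4 samples, 3 classes, 64x64 pixels
y_true = np.random.randint(0, 3, size=(4, 64, 64))
y_pred = np.random.randint(0, 3, size=(4, 64, 64))

# Assumed keyword constructor; library defaults are used when config is omitted
fmt = SegmentationMetricsFormat(font_size=12, heatmap_cmap="viridis", cm_cmap="Blues")

segmentation_metrics(
    y_true,
    y_pred,
    save_dir="segmentation_report",            # report, heatmap and confusion matrix are written here
    class_names=["background", "cat", "dog"],
    config=fmt,
)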
@@ -8,32 +8,29 @@ from torchvision import transforms

  from ._script_info import _script_info
  from ._logger import _LOGGER
- from .path_manager import make_fullpath
- from .keys import PyTorchInferenceKeys, PyTorchCheckpointKeys
- from ._ML_vision_recipe import load_recipe_and_build_transform
+ from ._keys import PyTorchInferenceKeys, MLTaskKeys
+ from .ML_vision_transformers import _load_recipe_and_build_transform
+ from .ML_inference import _BaseInferenceHandler


  __all__ = [
- "PyTorchVisionInferenceHandler"
+ "DragonVisionInferenceHandler"
  ]


- class PyTorchVisionInferenceHandler:
+ class DragonVisionInferenceHandler(_BaseInferenceHandler):
  """
  Handles loading a PyTorch vision model's state dictionary and performing inference.

  This class is specifically for vision models, which typically expect
  4D Tensors (B, C, H, W) or Lists of Tensors as input.
- It does NOT use a scaler, as preprocessing (e.g., normalization)
- is assumed to be part of the input transform pipeline.
  """
  def __init__(self,
  model: nn.Module,
  state_dict: Union[str, Path],
- task: Literal["image_classification", "image_segmentation", "object_detection"],
+ task: Literal["binary image classification", "multiclass image classification", "binary segmentation", "multiclass segmentation", "object detection"],
  device: str = 'cpu',
- transform_source: Optional[Union[str, Path, Callable]] = None,
- class_map: Optional[Dict[str, int]] = None):
+ transform_source: Optional[Union[str, Path, Callable]] = None):
  """
  Initializes the vision inference handler.

@@ -46,19 +43,17 @@ class PyTorchVisionInferenceHandler:
  - A path to a .json recipe file (str or Path).
  - A pre-built transformation pipeline (Callable).
  - None, in which case .set_transform() must be called explicitly to set transformations.
- idx_to_class (Dict[int, str] | None): Sets the class name mapping to translate predicted integer labels back into string names. (For image classification and object detection)
+
+ Note: class_map (Dict[int, str]) will be loaded from the model file, to set or override it use `.set_class_map()`.
  """
- self._model = model
- self._device = self._validate_device(device)
+ super().__init__(model, state_dict, device, None)
+
  self._transform: Optional[Callable] = None
  self._is_transformed: bool = False
- self._idx_to_class: Optional[Dict[int, str]] = None
- if class_map is not None:
- self.set_class_map(class_map)

- if task not in ["image_classification", "image_segmentation", "object_detection"]:
- _LOGGER.error(f"`task` must be 'image_classification', 'image_segmentation', or 'object_detection'. Got '{task}'.")
- raise ValueError("Invalid task type.")
+ if task not in [MLTaskKeys.BINARY_IMAGE_CLASSIFICATION, MLTaskKeys.MULTICLASS_IMAGE_CLASSIFICATION, MLTaskKeys.BINARY_SEGMENTATION, MLTaskKeys.MULTICLASS_SEGMENTATION, MLTaskKeys.OBJECT_DETECTION]:
+ _LOGGER.error(f"Unsupported task: '{task}'.")
+ raise ValueError()
  self.task = task

  self.expected_in_channels: int = 3 # Default to RGB
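A hedged construction sketch for the renamed handler follows. The class name, the new task literals, and the note about the class map are taken from the hunks above; the model, checkpoint path, and recipe path are placeholders.

from pathlib import Path
import torch.nn as nn
from ml_tools.ML_vision_inference import DragonVisionInferenceHandler

my_model: nn.Module = ...                                  # the trained vision model architecture (placeholder)

handler = DragonVisionInferenceHandler(
    model=my_model,
    state_dict=Path("checkpoints/vision_model.pth"),       # hypothetical checkpoint path
    task="multiclass image classification",                # one of the new task literals
    device="cuda",
    transform_source=Path("transform_recipe.json"),        # hypothetical .json recipe
)
# The class map is loaded from the model file; call handler.set_class_map(...) to override it.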
@@ -71,39 +66,6 @@ class PyTorchVisionInferenceHandler:
  if transform_source:
  self.set_transform(transform_source)
  self._is_transformed = True
-
- model_p = make_fullpath(state_dict, enforce="file")
-
- try:
- # Load whatever is in the file
- loaded_data = torch.load(model_p, map_location=self._device)
-
- # Check if it's a new checkpoint dictionary or an old weights-only file
- if isinstance(loaded_data, dict) and PyTorchCheckpointKeys.MODEL_STATE in loaded_data:
- # It's a new training checkpoint, extract the weights
- self._model.load_state_dict(loaded_data[PyTorchCheckpointKeys.MODEL_STATE])
- else:
- # It's an old-style file (or just a state_dict), load it directly
- self._model.load_state_dict(loaded_data)
-
- _LOGGER.info(f"Model state loaded from '{model_p.name}'.")
-
- self._model.to(self._device)
- self._model.eval() # Set the model to evaluation mode
- except Exception as e:
- _LOGGER.error(f"Failed to load model state from '{model_p}': {e}")
- raise
-
- def _validate_device(self, device: str) -> torch.device:
- """Validates the selected device and returns a torch.device object."""
- device_lower = device.lower()
- if "cuda" in device_lower and not torch.cuda.is_available():
- _LOGGER.warning("CUDA not available, switching to CPU.")
- device_lower = "cpu"
- elif device_lower == "mps" and not torch.backends.mps.is_available():
- _LOGGER.warning("Apple Metal Performance Shaders (MPS) not available, switching to CPU.")
- device_lower = "cpu"
- return torch.device(device_lower)

  def _preprocess_batch(self, inputs: Union[torch.Tensor, List[torch.Tensor]]) -> Union[torch.Tensor, List[torch.Tensor]]:
  """
@@ -111,23 +73,23 @@ class PyTorchVisionInferenceHandler:
  - For Classification/Segmentation: Expects 4D Tensor (B, C, H, W).
  - For Object Detection: Expects List[Tensor(C, H, W)].
  """
- if self.task == "object_detection":
+ if self.task == MLTaskKeys.OBJECT_DETECTION:
  if not isinstance(inputs, list) or not all(isinstance(t, torch.Tensor) for t in inputs):
  _LOGGER.error("Input for object_detection must be a List[torch.Tensor].")
  raise ValueError("Invalid input type for object detection.")
  # Move each tensor in the list to the device
- return [t.float().to(self._device) for t in inputs]
+ return [t.float().to(self.device) for t in inputs]

  else: # Classification or Segmentation
  if not isinstance(inputs, torch.Tensor):
  _LOGGER.error(f"Input for {self.task} must be a torch.Tensor.")
  raise ValueError(f"Invalid input type for {self.task}.")

- if inputs.ndim != 4:
- _LOGGER.error(f"Input tensor for {self.task} must be 4D (B, C, H, W). Got {inputs.ndim}D.")
+ if inputs.ndim != 4: # type: ignore
+ _LOGGER.error(f"Input tensor for {self.task} must be 4D (B, C, H, W). Got {inputs.ndim}D.") # type: ignore
  raise ValueError("Input tensor must be 4D.")

- return inputs.float().to(self._device)
+ return inputs.float().to(self.device)

  def set_transform(self, transform_source: Union[str, Path, Callable]):
  """
@@ -144,8 +106,8 @@
  if isinstance(transform_source, (str, Path)):
  _LOGGER.info(f"Loading transform from recipe file: '{transform_source}'")
  try:
- # Use the new loader function
- self._transform = load_recipe_and_build_transform(transform_source)
+ # Use the loader function
+ self._transform = _load_recipe_and_build_transform(transform_source)
  except Exception as e:
  _LOGGER.error(f"Failed to load transform from recipe '{transform_source}': {e}")
  raise
@@ -155,31 +117,15 @@
  else:
  _LOGGER.error(f"Invalid transform_source type: {type(transform_source)}. Must be str, Path, or Callable.")
  raise TypeError("transform_source must be a file path or a Callable.")
-
- def set_class_map(self, class_map: Dict[str, int]):
- """
- Sets the class name mapping to translate predicted integer labels
- back into string names.
-
- Args:
- class_map (Dict[str, int]): The class_to_idx dictionary
- (e.g., {'cat': 0, 'dog': 1}) from the VisionDatasetMaker.
- """
- if self._idx_to_class is not None:
- _LOGGER.warning("Class to index mapping was previously given. Setting new mapping...")
- # Invert the dictionary for fast lookup
- self._idx_to_class = {v: k for k, v in class_map.items()}
- _LOGGER.info("Class map set for label-to-name translation.")

  def predict_batch(self, inputs: Union[torch.Tensor, List[torch.Tensor]]) -> Dict[str, Any]:
  """
  Core batch prediction method for vision models.
- All preprocessing (resizing, normalization) should be done *before*
- calling this method.
+ All preprocessing (resizing, normalization) should be done *before* calling this method.

  Args:
  inputs (torch.Tensor | List[torch.Tensor]):
- - For 'image_classification' or 'image_segmentation',
+ - For binary/multiclass image classification or binary/multiclass image segmentation tasks,
  a 4D torch.Tensor (B, C, H, W).
  - For 'object_detection', a List of 3D torch.Tensors
  [(C, H, W), ...], each with its own size.
@@ -194,45 +140,55 @@
  processed_inputs = self._preprocess_batch(inputs)

  with torch.no_grad():
- if self.task == "image_classification":
- # --- Image Classification ---
- # 1. Predict
- output = self._model(processed_inputs) # (B, num_classes)
-
- # 2. Post-process
+ # get outputs
+ output = self.model(processed_inputs)
+ if self.task == MLTaskKeys.MULTICLASS_IMAGE_CLASSIFICATION:
+ # process
  probs = torch.softmax(output, dim=1)
  labels = torch.argmax(probs, dim=1)
  return {
  PyTorchInferenceKeys.LABELS: labels, # (B,)
  PyTorchInferenceKeys.PROBABILITIES: probs # (B, num_classes)
  }
-
- elif self.task == "image_segmentation":
- # --- Image Segmentation ---
- # 1. Predict
- output = self._model(processed_inputs) # (B, num_classes, H, W)
+
+ elif self.task == MLTaskKeys.BINARY_IMAGE_CLASSIFICATION:
+ # Assumes model output is [N, 1] (a single logit)
+ # Squeeze output from [N, 1] to [N] if necessary
+ if output.ndim == 2 and output.shape[1] == 1:
+ output = output.squeeze(1)
+
+ probs = torch.sigmoid(output) # Probability of positive class
+ labels = (probs >= self._classification_threshold).int()
+ return {
+ PyTorchInferenceKeys.LABELS: labels,
+ PyTorchInferenceKeys.PROBABILITIES: probs
+ }
+
+ elif self.task == MLTaskKeys.BINARY_SEGMENTATION:
+ # Assumes model output is [N, 1, H, W] (logits for positive class)
+ probs = torch.sigmoid(output) # Shape [N, 1, H, W]
+ labels = (probs >= self._classification_threshold).int() # Shape [N, 1, H, W]
+ return {
+ PyTorchInferenceKeys.LABELS: labels,
+ PyTorchInferenceKeys.PROBABILITIES: probs
+ }

- # 2. Post-process
- probs = torch.softmax(output, dim=1) # Probs across class channel
- labels = torch.argmax(probs, dim=1) # (B, H, W) segmentation map
+ elif self.task == MLTaskKeys.MULTICLASS_SEGMENTATION:
+ # output shape [N, C, H, W]
+ probs = torch.softmax(output, dim=1)
+ labels = torch.argmax(probs, dim=1) # shape [N, H, W]
  return {
- PyTorchInferenceKeys.LABELS: labels, # (B, H, W)
- PyTorchInferenceKeys.PROBABILITIES: probs # (B, num_classes, H, W)
+ PyTorchInferenceKeys.LABELS: labels, # (N, H, W)
+ PyTorchInferenceKeys.PROBABILITIES: probs # (N, num_classes, H, W)
  }

- elif self.task == "object_detection":
- # --- Object Detection ---
- # 1. Predict (model is in eval mode, expects only images)
- # Output is List[Dict[str, Tensor('boxes', 'labels', 'scores')]]
- predictions = self._model(processed_inputs)
-
- # 2. Post-process: Wrap in our standard key
+ elif self.task == MLTaskKeys.OBJECT_DETECTION:
  return {
- PyTorchInferenceKeys.PREDICTIONS: predictions
+ PyTorchInferenceKeys.PREDICTIONS: output
  }

  else:
- # This should be unreachable due to __init__ check
+ # This should be unreachable due to validation
  raise ValueError(f"Unknown task: {self.task}")

  def predict(self, single_input: torch.Tensor) -> Dict[str, Any]:
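The branch added for binary tasks thresholds a sigmoid probability instead of taking an argmax. A minimal sketch of batch inference under that branch, assuming the handler above was built with task="binary image classification" and that the inherited _classification_threshold defaults to 0.5 (an assumption; it is not shown in this diff):

import torch
from ml_tools._keys import PyTorchInferenceKeys      # assumed absolute import of the renamed _keys module

batch = torch.rand(8, 3, 224, 224)                   # (B, C, H, W), already resized and normalized
results = handler.predict_batch(batch)

labels = results[PyTorchInferenceKeys.LABELS]        # (B,) int tensor of 0/1 decisions
probs = results[PyTorchInferenceKeys.PROBABILITIES]  # (B,) sigmoid probabilities of the positive class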
@@ -248,24 +204,24 @@
  Returns:
  A dictionary containing the output tensors for a single sample.
  - Classification: {labels, probabilities} (label is 0-dim)
- - Segmentation: {labels, probabilities} (label is 2D mask)
+ - Segmentation: {labels, probabilities} (label is a 2D (multiclass) or 3D (binary) mask)
  - Object Detection: {boxes, labels, scores} (single dict)
  """
  if not isinstance(single_input, torch.Tensor) or single_input.ndim != 3:
  _LOGGER.error(f"Input for predict() must be a 3D tensor (C, H, W). Got {single_input.ndim}D.")
- raise ValueError("Input must be a 3D tensor.")
+ raise ValueError()

  # --- 1. Batch the input based on task ---
- if self.task == "object_detection":
+ if self.task == MLTaskKeys.OBJECT_DETECTION:
  batched_input = [single_input] # List of one tensor
  else:
- batched_input = single_input.unsqueeze(0) # (1, C, H, W)
+ batched_input = single_input.unsqueeze(0)

  # --- 2. Call batch prediction ---
  batch_results = self.predict_batch(batched_input)

  # --- 3. Un-batch the results ---
- if self.task == "object_detection":
+ if self.task == MLTaskKeys.OBJECT_DETECTION:
  # batch_results['predictions'] is a List[Dict]. We want the first (and only) Dict.
  return batch_results[PyTorchInferenceKeys.PREDICTIONS][0]
  else:
@@ -283,12 +239,12 @@
  Returns:
  Dict: A dictionary containing the outputs as NumPy arrays.
  - Obj. Detection: {predictions: List[Dict[str, np.ndarray]]}
- - Classification: {labels: int, label_names: str, probabilities: np.ndarray}
+ - Classification: {labels: np.ndarray, label_names: List[str], probabilities: np.ndarray}
  - Segmentation: {labels: np.ndarray, probabilities: np.ndarray}
  """
  tensor_results = self.predict_batch(inputs)

- if self.task == "object_detection":
+ if self.task == MLTaskKeys.OBJECT_DETECTION:
  # Output is List[Dict[str, Tensor]]
  # Convert each tensor inside each dict to numpy
  numpy_results = []
@@ -304,13 +260,19 @@
  ]
  numpy_results.append(np_dict)
  return {PyTorchInferenceKeys.PREDICTIONS: numpy_results}
+
  else:
- # Output is Dict[str, Tensor]
+ # Output is Dict[str, Tensor] (for Classification or Segmentation)
  numpy_results = {key: value.cpu().numpy() for key, value in tensor_results.items()}

  # Add string names for classification if map exists
- if self.task == "image_classification" and self._idx_to_class and PyTorchInferenceKeys.LABELS in numpy_results:
- int_labels = numpy_results[PyTorchInferenceKeys.LABELS]
+ is_image_classification = self.task in [
+ MLTaskKeys.BINARY_IMAGE_CLASSIFICATION,
+ MLTaskKeys.MULTICLASS_IMAGE_CLASSIFICATION
+ ]
+
+ if is_image_classification and self._idx_to_class and PyTorchInferenceKeys.LABELS in numpy_results:
+ int_labels = numpy_results[PyTorchInferenceKeys.LABELS] # This is a (B,) array
  numpy_results[PyTorchInferenceKeys.LABEL_NAMES] = [
  self._idx_to_class.get(label_id, "Unknown")
  for label_id in int_labels
@@ -324,13 +286,13 @@

  Returns:
  Dict: A dictionary containing the outputs as NumPy arrays/scalars.
- - Obj. Detection: {boxes: np.ndarray, labels: np.ndarray, scores: np.ndarray}
+ - Obj. Detection: {boxes: np.ndarray, labels: np.ndarray, scores: np.ndarray, label_names: List[str]}
  - Classification: {labels: int, label_names: str, probabilities: np.ndarray}
  - Segmentation: {labels: np.ndarray, probabilities: np.ndarray}
  """
  tensor_results = self.predict(single_input)

- if self.task == "object_detection":
+ if self.task == MLTaskKeys.OBJECT_DETECTION:
  # Output is Dict[str, Tensor]
  # Convert each tensor to numpy
  numpy_results = {
@@ -348,7 +310,7 @@

  return numpy_results

- elif self.task == "image_classification":
+ elif self.task in [MLTaskKeys.BINARY_IMAGE_CLASSIFICATION, MLTaskKeys.MULTICLASS_IMAGE_CLASSIFICATION]:
  # Output is Dict[str, Tensor(0-dim) or Tensor(1-dim)]
  int_label = tensor_results[PyTorchInferenceKeys.LABELS].item()
  label_name = "Unknown"
@@ -360,50 +322,32 @@
  PyTorchInferenceKeys.LABEL_NAMES: label_name,
  PyTorchInferenceKeys.PROBABILITIES: tensor_results[PyTorchInferenceKeys.PROBABILITIES].cpu().numpy()
  }
- else: # image_segmentation
+ else: # image_segmentation (binary or multiclass)
  # Output is Dict[str, Tensor(2D) or Tensor(3D)]
  return {
  PyTorchInferenceKeys.LABELS: tensor_results[PyTorchInferenceKeys.LABELS].cpu().numpy(),
  PyTorchInferenceKeys.PROBABILITIES: tensor_results[PyTorchInferenceKeys.PROBABILITIES].cpu().numpy()
  }

- def predict_from_file(self, image_path: Union[str, Path]) -> Dict[str, Any]:
+ def predict_from_pil(self, image: Image.Image) -> Dict[str, Any]:
  """
- Loads a single image from a file, applies the stored transform, and returns the prediction.
+ Applies the stored transform to a single PIL image and returns the prediction.

  Args:
- image_path (str | Path): The file path to the input image.
+ image (PIL.Image.Image): The input PIL image.

  Returns:
  Dict: A dictionary containing the prediction results. See `predict_numpy()` for task-specific output structures.
  """
  if self._transform is None:
- _LOGGER.error("Cannot predict from file: No transform has been set. Call .set_transform() or provide transform_source in __init__.")
+ _LOGGER.error("Cannot predict from PIL image: No transform has been set. Call .set_transform() or provide transform_source in __init__.")
  raise RuntimeError("Inference transform is not set.")
-
- try:
- # --- Use expected_in_channels to set PIL mode ---
- pil_mode: str
- if self.expected_in_channels == 1:
- pil_mode = "L" # Grayscale
- elif self.expected_in_channels == 4:
- pil_mode = "RGBA" # RGB + Alpha
- else:
- if self.expected_in_channels != 3: # 2, 5+ channels not supported by PIL convert
- _LOGGER.warning(f"Model expects {self.expected_in_channels} channels. PIL conversion is limited, defaulting to 3 channels (RGB). The transformations must convert it to the desired channel dimensions.")
- # Default to RGB. If 2-channels are needed, the transform recipe *must* be responsible for handling the conversion from a 3-channel PIL image.
- pil_mode = "RGB"
-
- image = Image.open(image_path).convert(pil_mode)
- except Exception as e:
- _LOGGER.error(f"Failed to load and convert image from '{image_path}': {e}")
- raise

  # Apply the transformation pipeline (e.g., resize, crop, ToTensor, normalize)
  try:
  transformed_image = self._transform(image)
  except Exception as e:
- _LOGGER.error(f"Error applying transform to image: {e}")
+ _LOGGER.error(f"Error applying transform to PIL image: {e}")
  raise

  # --- Validation ---
@@ -413,7 +357,7 @@

  if transformed_image.ndim != 3:
  _LOGGER.warning(f"Expected transform to output a 3D (C, H, W) tensor, but got {transformed_image.ndim}D. Attempting to proceed.")
- # .predict() which expects a 3D tensor
+ # .predict_numpy() -> .predict() which expects a 3D tensor
  if transformed_image.ndim == 4 and transformed_image.shape[0] == 1:
  transformed_image = transformed_image.squeeze(0) # Fix if user's transform adds a batch dim
  _LOGGER.warning("Removed an extra batch dimension.")
@@ -423,6 +367,39 @@
  # Use the existing single-item predict method
  return self.predict_numpy(transformed_image)

+ def predict_from_file(self, image_path: Union[str, Path]) -> Dict[str, Any]:
+ """
+ Loads a single image from a file, applies the stored transform, and returns the prediction.
+
+ This is a convenience wrapper that loads the image and calls `predict_from_pil()`.
+
+ Args:
+ image_path (str | Path): The file path to the input image.
+
+ Returns:
+ Dict: A dictionary containing the prediction results. See `predict_numpy()` for task-specific output structures.
+ """
+ try:
+ # --- Use expected_in_channels to set PIL mode ---
+ pil_mode: str
+ if self.expected_in_channels == 1:
+ pil_mode = "L" # Grayscale
+ elif self.expected_in_channels == 4:
+ pil_mode = "RGBA" # RGB + Alpha
+ else:
+ if self.expected_in_channels != 3: # 2, 5+ channels not supported by PIL convert
+ _LOGGER.warning(f"Model expects {self.expected_in_channels} channels. PIL conversion is limited, defaulting to 3 channels (RGB). The transformations must convert it to the desired channel dimensions.")
+ # Default to RGB. If 2-channels are needed, the transform recipe *must* be responsible for handling the conversion from a 3-channel PIL image.
+ pil_mode = "RGB"
+
+ image = Image.open(image_path).convert(pil_mode)
+ except Exception as e:
+ _LOGGER.error(f"Failed to load and convert image from '{image_path}': {e}")
+ raise
+
+ # Call the PIL-based prediction method
+ return self.predict_from_pil(image)
+

  def info():
  _script_info(__all__)
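predict_from_file() is now a thin wrapper around the new predict_from_pil(), so callers that already hold a decoded image can skip the disk read. A hedged usage sketch, with a placeholder image path:

from PIL import Image
from ml_tools._keys import PyTorchInferenceKeys

result = handler.predict_from_file("samples/cat_01.png")       # loads, converts and transforms the image
print(result[PyTorchInferenceKeys.LABEL_NAMES])                 # class name string, if a class map is set

pil_image = Image.open("samples/cat_01.png").convert("RGB")    # same image, decoded by the caller
result_pil = handler.predict_from_pil(pil_image)                # identical output, no file I/O inside the handler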
@@ -47,12 +47,17 @@ class _BaseVisionWrapper(nn.Module, _ArchitectureHandlerMixin, ABC):
  self.num_classes = num_classes
  self.in_channels = in_channels
  self.model_name = model_name
+ self._pretrained_default_transforms = None

  # --- 2. Instantiate the base model ---
  if init_with_pretrained:
  weights_enum = getattr(vision_models, weights_enum_name, None) if weights_enum_name else None
  weights = weights_enum.IMAGENET1K_V1 if weights_enum else None

+ # Save transformations for pretrained models
+ if weights:
+ self._pretrained_default_transforms = weights.transforms()
+
  if weights is None and init_with_pretrained:
  _LOGGER.warning(f"Could not find modern weights for {model_name}. Using 'pretrained=True' legacy fallback.")
  self.model = getattr(vision_models, model_name)(pretrained=True)
@@ -331,6 +336,7 @@ class _BaseSegmentationWrapper(nn.Module, _ArchitectureHandlerMixin, ABC):
  self.num_classes = num_classes
  self.in_channels = in_channels
  self.model_name = model_name
+ self._pretrained_default_transforms = None

  # --- 2. Instantiate the base model ---
  model_kwargs = {
@@ -343,6 +349,10 @@ class _BaseSegmentationWrapper(nn.Module, _ArchitectureHandlerMixin, ABC):
  weights_enum = getattr(vision_models.segmentation, weights_enum_name, None) if weights_enum_name else None
  weights = weights_enum.DEFAULT if weights_enum else None

+ # save pretrained model transformations
+ if weights:
+ self._pretrained_default_transforms = weights.transforms()
+
  if weights is None:
  _LOGGER.warning(f"Could not find modern weights for {model_name}. Using 'pretrained=True' legacy fallback.")
  # Legacy models used 'pretrained=True' and num_classes was separate
@@ -520,7 +530,7 @@ class DragonFastRCNN(nn.Module, _ArchitectureHandlerMixin):
  This wrapper allows for customizing the model backbone, input channels,
  and the number of output classes for transfer learning.

- NOTE: This model is NOT compatible with the MLTrainer class.
+ NOTE: Use an Object Detection compatible trainer.
  """
  def __init__(self,
  num_classes: int,
@@ -550,6 +560,7 @@ class DragonFastRCNN(nn.Module, _ArchitectureHandlerMixin):
  self.num_classes = num_classes
  self.in_channels = in_channels
  self.model_name = model_name
+ self._pretrained_default_transforms = None

  # --- 2. Instantiate the base model ---
  model_constructor = getattr(detection_models, model_name)
@@ -560,6 +571,9 @@ class DragonFastRCNN(nn.Module, _ArchitectureHandlerMixin):

  weights_enum = getattr(detection_models, weights_enum_name, None) if weights_enum_name else None
  weights = weights_enum.DEFAULT if weights_enum and init_with_pretrained else None
+
+ if weights:
+ self._pretrained_default_transforms = weights.transforms()

  self.model = model_constructor(weights=weights, weights_backbone=weights)
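The model wrappers now cache the preprocessing pipeline that ships with the pretrained torchvision weights in _pretrained_default_transforms (None when training from scratch). A hedged sketch of one way this could be reused at inference time; whether the toolbox exposes a public accessor for the attribute is not shown in this diff, so the private attribute is read directly here:

# `vision_model` stands for any wrapper built with init_with_pretrained=True (placeholder)
default_tf = getattr(vision_model, "_pretrained_default_transforms", None)

if default_tf is not None:
    # set_transform() accepts any Callable, per the handler docstring above
    handler.set_transform(default_tf)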