PyPI - rgb-to-segmentation - Versions diffs - 0.1.6__py3-none-any.whl - Mend

rgb-to-segmentation 0.1.6__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (15) hide show

rgb_to_segmentation/__init__.py +10 -0
rgb_to_segmentation/api.py +123 -0
rgb_to_segmentation/clean.py +315 -0
rgb_to_segmentation/cli.py +180 -0
rgb_to_segmentation/models/__init__.py +5 -0
rgb_to_segmentation/models/base_classifier.py +77 -0
rgb_to_segmentation/models/cnn_decoder.py +103 -0
rgb_to_segmentation/models/pixelwise_classifier.py +31 -0
rgb_to_segmentation/nn.py +164 -0
rgb_to_segmentation/train.py +212 -0
rgb_to_segmentation/utils.py +40 -0
rgb_to_segmentation-0.1.6.dist-info/METADATA +213 -0
rgb_to_segmentation-0.1.6.dist-info/RECORD +15 -0
rgb_to_segmentation-0.1.6.dist-info/WHEEL +4 -0
rgb_to_segmentation-0.1.6.dist-info/entry_points.txt +3 -0

rgb_to_segmentation/__init__.py ADDED Viewed

@@ -0,0 +1,10 @@
+from .api import clean_image
+from . import clean, nn, train, utils
+__all__ = [
+	"clean_image",
+	"clean",
+	"nn",
+	"train",
+	"utils",
+]

rgb_to_segmentation/api.py ADDED Viewed

@@ -0,0 +1,123 @@
+import numpy as np
+import torch
+from typing import Dict, Tuple, Optional, Union
+from .clean import clean_image_palette, clean_image_strict_palette
+from .nn import clean_image_nn
+ImageArray = Union[np.ndarray, torch.Tensor]
+def _to_numpy(image_array: ImageArray):
+    if isinstance(image_array, np.ndarray):
+        return image_array, False, None, None
+    if isinstance(image_array, torch.Tensor):
+        return (
+            image_array.detach().cpu().numpy(),
+            True,
+            image_array.dtype,
+            image_array.device,
+        )
+    raise TypeError("image_array must be a numpy.ndarray or torch.Tensor")
+def _to_original_type(
+    np_array: np.ndarray,
+    is_torch: bool,
+    dtype: Optional[torch.dtype],
+    device: Optional[torch.device],
+) -> ImageArray:
+    if not is_torch:
+        return np_array
+    tensor = torch.from_numpy(np_array)
+    if dtype is not None and tensor.dtype != dtype:
+        tensor = tensor.to(dtype=dtype)
+    if device is not None and tensor.device != device:
+        tensor = tensor.to(device=device)
+    return tensor
+def clean_image(
+    image_array: ImageArray,
+    method: str,
+    colour_map: Dict[int, Tuple[int, int, int]],
+    *,
+    model: Optional[object] = None,
+    morph_kernel_size: int = 0,
+    output_type: str = "rgb",
+) -> ImageArray:
+    """
+    Clean a single image (numpy array or torch tensor) using the specified method.
+    Args:
+        image_array: Array/Tensor of shape (H, W, 3), dtype uint8.
+        method: "palette", "strict_palette", "pixel_decoder", or "cnn_decoder" to choose cleaning approach.
+        model: Required when method="pixel_decoder" or "cnn_decoder". A trained model with forward(batch) returning class probabilities.
+        colour_map: Required for all methods. Dict mapping class index -> (r,g,b).
+        morph_kernel_size: Optional morphological clean kernel size (palette method only).
+        output_type: "rgb" to return colour image, "index" to return integer mask.
+    Returns:
+        Cleaned image with the same container type as the input (np.ndarray or torch.Tensor):
+        (H,W,3) uint8 when output_type="rgb", otherwise (H,W) uint8.
+    """
+    np_image, is_torch, orig_dtype, orig_device = _to_numpy(image_array)
+    if np_image.ndim != 3 or np_image.shape[2] != 3:
+        raise ValueError("image_array must have shape (H, W, 3)")
+    if output_type not in ("rgb", "index"):
+        raise ValueError("output_type must be 'rgb' or 'index'")
+    if method == "palette":
+        # Build palette ndarray from colour_map in index order and delegate to core function
+        keys = sorted(colour_map.keys())
+        palette = np.asarray([colour_map[k] for k in keys], dtype=np.uint8)
+        cleaned = clean_image_palette(
+            np_image,
+            palette=palette,
+            morph_kernel_size=morph_kernel_size,
+            output_type=output_type,
+        )
+    elif method == "strict_palette":
+        cleaned = clean_image_strict_palette(
+            np_image,
+            colour_map=colour_map,
+            output_type=output_type,
+        )
+    elif method == "pixel_decoder":
+        if model is None:
+            raise ValueError("model must be provided for method='pixel_decoder'")
+        cleaned = clean_image_nn(
+            np_image,
+            model=model,
+            colour_map=colour_map,
+            output_type=output_type,
+        )
+    elif method == "cnn_decoder":
+        if model is None:
+            raise ValueError("model must be provided for method='cnn_decoder'")
+        cleaned = clean_image_nn(
+            np_image,
+            model=model,
+            colour_map=colour_map,
+            output_type=output_type,
+        )
+    else:
+        raise ValueError(
+            "method must be 'palette', 'strict_palette', 'pixel_decoder', or 'cnn_decoder'"
+        )
+    return _to_original_type(cleaned, is_torch, orig_dtype, orig_device)

rgb_to_segmentation/clean.py ADDED Viewed

@@ -0,0 +1,315 @@
+import os
+from typing import List
+import numpy as np
+from PIL import Image
+from scipy import ndimage
+import torch
+def clean_image_palette(
+    image_array: np.ndarray,
+    palette: np.ndarray,
+    morph_kernel_size: int = 0,
+    output_type: str = "rgb",
+) -> np.ndarray:
+    """
+    Clean a single RGB image using palette-based nearest-colour mapping.
+    Args:
+        image_array: (H, W, 3) uint8
+        palette: (K, 3) uint8
+        morph_kernel_size: kernel size for morphological cleaning (0 disables)
+        output_type: 'rgb' to return colour image; 'index' to return integer mask
+    Returns:
+        np.ndarray: (H,W,3) uint8 if output_type='rgb'; else (H,W) uint8
+    """
+    if output_type not in ("rgb", "index"):
+        raise ValueError("output_type must be 'rgb' or 'index'")
+    # Reduce palette to colours present in the image for efficiency
+    reduced_palette = get_palette_for_image(image_array, palette)
+    # Map to nearest colours
+    cleaned_rgb = nearest_palette_image(image_array, reduced_palette)
+    # Optional morphological clean
+    if morph_kernel_size > 0:
+        cleaned_rgb = apply_morphological_clean(cleaned_rgb, morph_kernel_size)
+    if output_type == "rgb":
+        return cleaned_rgb
+    else:
+        return rgb_image_to_index(cleaned_rgb, reduced_palette).astype(np.uint8)
+def clean_image_strict_palette(
+    image_array: np.ndarray,
+    colour_map: dict,
+    output_type: str = "rgb",
+) -> np.ndarray:
+    """
+    Strictly map RGB values to indices based on colour_map.
+    Raises an error if any RGB value is not found in the colour_map.
+    Args:
+        image_array: (H, W, 3) uint8 numpy array
+        colour_map: Dict mapping class index -> (r,g,b)
+        output_type: 'rgb' to return colour image; 'index' to return integer mask
+    Returns:
+        np.ndarray: (H,W,3) uint8 if output_type='rgb'; else (H,W) uint8
+    """
+    if output_type not in ("rgb", "index"):
+        raise ValueError("output_type must be 'rgb' or 'index'")
+    h, w, _ = image_array.shape
+    flat_img = image_array.reshape(-1, 3)
+    # Build reverse lookup: RGB tuple -> class index
+    rgb_to_idx = {tuple(map(int, rgb)): idx for idx, rgb in colour_map.items()}
+    # Find all unique RGB values in the image
+    unique_colours = np.unique(flat_img, axis=0)
+    # Check if all colours are in the colour_map
+    unmapped_colours = []
+    for colour in unique_colours:
+        colour_tuple = tuple(map(int, colour))
+        if colour_tuple not in rgb_to_idx:
+            unmapped_colours.append(colour_tuple)
+    if unmapped_colours:
+        # Format error message with unmapped colours
+        colour_strs = [f"RGB{c}" for c in unmapped_colours[:10]]  # Show first 10
+        if len(unmapped_colours) > 10:
+            colour_strs.append(f"... and {len(unmapped_colours) - 10} more")
+        raise ValueError(
+            f"Image contains {len(unmapped_colours)} RGB value(s) not in colour_map: "
+            f"{', '.join(colour_strs)}. All pixel values must exactly match a colour in the map."
+        )
+    # Map each pixel to its class index
+    flat_indices = np.array(
+        [rgb_to_idx[tuple(map(int, px))] for px in flat_img], dtype=np.uint16
+    )
+    index_image = flat_indices.reshape(h, w).astype(np.uint8)
+    if output_type == "index":
+        return index_image
+    else:
+        # Convert back to RGB using colour_map
+        rgb_output = np.zeros((h, w, 3), dtype=np.uint8)
+        for idx, rgb in colour_map.items():
+            mask = index_image == idx
+            rgb_output[mask] = rgb
+        return rgb_output
+def nearest_palette_image(image_array: np.ndarray, palette: np.ndarray) -> np.ndarray:
+    """
+    Assign each pixel in `image_array` (H,W,3 uint8) to the nearest colour in `palette` (K,3 uint8).
+    Returns recoloured image array with same shape and dtype uint8.
+    """
+    if image_array.ndim != 3 or image_array.shape[2] != 3:
+        raise ValueError("image_array must have shape (H, W, 3)")
+    h, w, _ = image_array.shape
+    flat = image_array.reshape(-1, 3).astype(np.int64)
+    pal = palette.astype(np.int64)
+    # Compute squared distances between each pixel and each palette colour.
+    # distances shape: (N_pixels, K)
+    d = np.sum((flat[:, None, :] - pal[None, :, :]) ** 2, axis=2)
+    idx = np.argmin(d, axis=1)
+    new_flat = pal[idx]
+    new = new_flat.reshape(h, w, 3).astype(np.uint8)
+    return new
+def get_palette_for_image(
+    image_array: np.ndarray, full_palette: np.ndarray
+) -> np.ndarray:
+    """
+    Identify which colours from the full palette are present in the image,
+    and return only those colours.
+    """
+    h, w, _ = image_array.shape
+    flat_img = image_array.reshape(-1, 3).astype(np.int16)
+    pal = full_palette.astype(np.int16)
+    # For each pixel, find the nearest palette colour
+    d = np.sum((flat_img[:, None, :] - pal[None, :, :]) ** 2, axis=2)
+    idx = np.argmin(d, axis=1)
+    # Get unique indices that are actually used
+    unique_idx = np.unique(idx)
+    # Return only the palette colours that are used
+    return full_palette[unique_idx]
+def apply_morphological_clean(image_array: np.ndarray, kernel_size: int) -> np.ndarray:
+    """
+    Apply morphological closing (erosion followed by dilation) per class to clean up
+    class boundaries and remove noise.
+    """
+    if kernel_size <= 0:
+        return image_array
+    # Create morphological kernel
+    kernel = ndimage.generate_binary_structure(2, 2)
+    # Get unique colours that actually appear in the image
+    h, w, _ = image_array.shape
+    flat_img = image_array.reshape(-1, 3)
+    unique_colours = np.unique(flat_img, axis=0)
+    # Process each class separately to avoid blending
+    result = np.zeros_like(image_array)
+    for colour in unique_colours:
+        # Create binary mask for this class
+        mask = np.all(image_array == colour, axis=-1)
+        # Apply closing: erosion then dilation
+        for _ in range(kernel_size):
+            mask = ndimage.binary_erosion(mask, structure=kernel)
+        for _ in range(kernel_size):
+            mask = ndimage.binary_dilation(mask, structure=kernel)
+        # Assign pixels back
+        result[mask] = colour
+    # Fill any remaining pixels (from eroded areas) with nearest colour from result
+    unfilled = ~np.any(result != 0, axis=-1)
+    if np.any(unfilled):
+        # For unfilled pixels, use nearest palette colour again or copy from nearby
+        result[unfilled] = image_array[unfilled]
+    return result
+def rgb_image_to_index(image_array: np.ndarray, palette: np.ndarray) -> np.ndarray:
+    """
+    Map each RGB pixel in `image_array` to the index of the matching colour in `palette`.
+    Assumes pixels take values from `palette`.
+    """
+    h, w, _ = image_array.shape
+    palette_list = [tuple(map(int, c)) for c in palette.tolist()]
+    lookup = {c: i for i, c in enumerate(palette_list)}
+    flat = image_array.reshape(-1, 3)
+    idx = np.array([lookup[tuple(map(int, px))] for px in flat], dtype=np.uint16)
+    return idx.reshape(h, w)
+def process_file(
+    input_path: str,
+    output_path: str,
+    palette: np.ndarray,
+    kernel_size: int,
+    output_type: str = "rgb",
+):
+    try:
+        img = Image.open(input_path).convert("RGB")
+    except Exception as e:
+        print(f"Skipping {input_path}: cannot open image ({e})")
+        return
+    arr = np.array(img, dtype=np.uint8)
+    # Clean image using core function
+    cleaned = clean_image_palette(
+        arr, palette=palette, morph_kernel_size=kernel_size, output_type=output_type
+    )
+    # Ensure output directory exists
+    os.makedirs(os.path.dirname(output_path) or ".", exist_ok=True)
+    if output_type == "rgb":
+        Image.fromarray(cleaned).save(output_path)
+    elif output_type == "index":
+        Image.fromarray(cleaned.astype(np.uint8), mode="L").save(output_path)
+    else:
+        raise ValueError("output_type must be 'rgb' or 'index'")
+def process_directory(
+    input_dir: str,
+    output_dir: str,
+    palette: np.ndarray,
+    exts: List[str],
+    inplace: bool,
+    name_filter: str = "",
+    kernel_size: int = 0,
+    output_type: str = "rgb",
+):
+    exts = [e.lower().strip() for e in exts]
+    for root, dirs, files in os.walk(input_dir):
+        # Determine the corresponding output root
+        rel = os.path.relpath(root, input_dir)
+        out_root = os.path.join(output_dir, rel) if not inplace else root
+        os.makedirs(out_root, exist_ok=True)
+        for fname in files:
+            if not any(fname.lower().endswith(e) for e in exts):
+                continue
+            if name_filter and name_filter not in fname:
+                continue
+            in_path = os.path.join(root, fname)
+            out_path = os.path.join(out_root, fname)
+            process_file(in_path, out_path, palette, kernel_size, output_type)
+def clean_segmentation(
+    input_dir: str,
+    output_dir: str = None,
+    inplace: bool = False,
+    palette: np.ndarray = None,
+    exts: str = ".png,.jpg,.jpeg,.tiff,.bmp,.gif",
+    name_filter: str = "",
+    morph_kernel_size: int = 3,
+    output_type: str = "rgb",
+):
+    """
+    Clean segmentation images using palette-based color mapping.
+    Args:
+        input_dir (str): Path to input directory containing segmentation images.
+        output_dir (str, optional): Directory where cleaned images will be written. Required if not inplace.
+        inplace (bool): Overwrite input images in place.
+        palette (np.ndarray): Array of RGB triples (K, 3) uint8.
+        exts (str): Comma-separated list of allowed image extensions.
+        name_filter (str): Only process files whose name contains this substring.
+        morph_kernel_size (int): Size of morphological kernel for boundary cleaning.
+    """
+    if not inplace and output_dir is None:
+        raise ValueError("Either output_dir must be provided or inplace must be True")
+    if palette is None:
+        raise ValueError("palette must be provided")
+    exts_list = [e if e.startswith(".") else "." + e for e in exts.split(",")]
+    out_dir = output_dir if not inplace else input_dir
+    if not inplace:
+        os.makedirs(out_dir, exist_ok=True)
+    print(
+        f"Processing: input={input_dir} -> output={out_dir}, colours={len(palette)}, morph_kernel={morph_kernel_size}, output_type={output_type}"
+    )
+    process_directory(
+        input_dir,
+        out_dir,
+        palette,
+        exts_list,
+        inplace,
+        name_filter,
+        morph_kernel_size,
+        output_type,
+    )
+    print("Done.")

rgb_to_segmentation/cli.py ADDED Viewed

@@ -0,0 +1,180 @@
+import argparse
+import numpy as np
+from . import clean, nn, train, utils
+def main_clean():
+    parser = argparse.ArgumentParser(
+        description="Clean segmentation images using various methods."
+    )
+    parser.add_argument(
+        "--method",
+        type=str,
+        required=True,
+        choices=["palette", "nn"],
+        help="Cleaning method to use: 'palette' for color palette mapping, 'nn' for neural network (pixel_decoder or CNN).",
+    )
+    parser.add_argument(
+        "--input_dir",
+        type=str,
+        required=True,
+        help="Path to input directory containing images.",
+    )
+    parser.add_argument(
+        "--output_dir",
+        type=str,
+        required=False,
+        help="Directory where cleaned images will be written. Required if not inplace.",
+    )
+    parser.add_argument(
+        "--inplace",
+        action="store_true",
+        help="Overwrite input images in place.",
+    )
+    parser.add_argument(
+        "--exts",
+        type=str,
+        default=".png,.jpg,.jpeg,.tiff,.bmp,.gif",
+        help="Comma-separated list of allowed image extensions.",
+    )
+    parser.add_argument(
+        "--name_filter",
+        type=str,
+        default="",
+        help="Only process files whose name contains this substring.",
+    )
+    parser.add_argument(
+        "--output_type",
+        type=str,
+        choices=["rgb", "index"],
+        default="rgb",
+        help="Output format: 'rgb' colour image or 'index' mask.",
+    )
+    group = parser.add_mutually_exclusive_group(required=True)
+    group.add_argument(
+        "--colour_map",
+        type=str,
+        help="Semicolon-separated list of RGB triples.",
+    )
+    group.add_argument(
+        "--colour_map_file",
+        type=str,
+        help="Path to a file listing RGB triples.",
+    )
+    # Palette-specific args
+    parser.add_argument(
+        "--morph_kernel_size",
+        type=int,
+        default=3,
+        help="Size of morphological kernel for palette method.",
+    )
+    # NN-specific args
+    parser.add_argument(
+        "--model_path",
+        type=str,
+        help="Path to trained model for nn method.",
+    )
+    args = parser.parse_args()
+    if args.colour_map_file:
+        colours = utils.parse_colours_from_file(args.colour_map_file)
+    else:
+        colours = utils.parse_colours_from_string(args.colour_map)
+    if args.method == "palette":
+        palette = np.asarray(colours, dtype=np.uint8)
+        clean.clean_segmentation(
+            input_dir=args.input_dir,
+            output_dir=args.output_dir,
+            inplace=args.inplace,
+            palette=palette,
+            exts=args.exts,
+            name_filter=args.name_filter,
+            morph_kernel_size=args.morph_kernel_size,
+            output_type=args.output_type,
+        )
+    elif args.method == "nn":
+        if not args.model_path:
+            parser.error("--model_path required for nn method")
+        colour_map = {i: rgb for i, rgb in enumerate(colours)}
+        nn.run_inference(
+            input_dir=args.input_dir,
+            output_dir=args.output_dir,
+            inplace=args.inplace,
+            model_path=args.model_path,
+            colour_map=colour_map,
+            exts=args.exts,
+            name_filter=args.name_filter,
+            output_type=args.output_type,
+        )
+def main_train():
+    parser = argparse.ArgumentParser(
+        description="Train a neural network model for segmentation cleaning."
+    )
+    parser.add_argument(
+        "--image_dir",
+        type=str,
+        required=True,
+        help="Path to directory containing noisy images.",
+    )
+    parser.add_argument(
+        "--label_dir",
+        type=str,
+        required=True,
+        help="Path to directory containing target RGB labels.",
+    )
+    parser.add_argument(
+        "--output_dir",
+        type=str,
+        required=True,
+        help="Directory where model weights will be saved.",
+    )
+    parser.add_argument(
+        "--model_type",
+        type=str,
+        choices=["pixel_decoder", "cnn_decoder"],
+        default="pixel_decoder",
+        help="The type of model to train: 'pixel_decoder' for MLP or 'cnn_decoder' for CNN-based decoder.",
+    )
+    group = parser.add_mutually_exclusive_group(required=True)
+    group.add_argument(
+        "--colour_map",
+        type=str,
+        help="Semicolon-separated list of RGB triples.",
+    )
+    group.add_argument(
+        "--colour_map_file",
+        type=str,
+        help="Path to a file listing RGB triples.",
+    )
+    args = parser.parse_args()
+    if args.colour_map_file:
+        colours = utils.parse_colours_from_file(args.colour_map_file)
+    else:
+        colours = utils.parse_colours_from_string(args.colour_map)
+    colour_map = {i: rgb for i, rgb in enumerate(colours)}
+    train.train_model(
+        image_dir=args.image_dir,
+        label_dir=args.label_dir,
+        output_dir=args.output_dir,
+        colour_map=colour_map,
+        model_type=args.model_type,
+    )

rgb_to_segmentation/models/__init__.py ADDED Viewed

@@ -0,0 +1,5 @@
+from .base_classifier import PixelClassifier
+from .pixelwise_classifier import PixelwiseClassifier
+from .cnn_decoder import CNNDecoder
+__all__ = ["PixelClassifier", "PixelwiseClassifier", "CNNDecoder"]