PyPI - figrecipe - Versions diffs - 0.5.0__py3-none-any.whl - Mend

figrecipe 0.5.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (26)

figrecipe/__init__.py +1090 -0
figrecipe/_recorder.py +435 -0
figrecipe/_reproducer.py +358 -0
figrecipe/_seaborn.py +305 -0
figrecipe/_serializer.py +227 -0
figrecipe/_signatures/__init__.py +7 -0
figrecipe/_signatures/_loader.py +186 -0
figrecipe/_utils/__init__.py +32 -0
figrecipe/_utils/_crop.py +261 -0
figrecipe/_utils/_diff.py +98 -0
figrecipe/_utils/_image_diff.py +204 -0
figrecipe/_utils/_numpy_io.py +204 -0
figrecipe/_utils/_units.py +200 -0
figrecipe/_validator.py +186 -0
figrecipe/_wrappers/__init__.py +8 -0
figrecipe/_wrappers/_axes.py +327 -0
figrecipe/_wrappers/_figure.py +227 -0
figrecipe/plt.py +12 -0
figrecipe/pyplot.py +264 -0
figrecipe/styles/__init__.py +50 -0
figrecipe/styles/_style_applier.py +412 -0
figrecipe/styles/_style_loader.py +450 -0
figrecipe-0.5.0.dist-info/METADATA +336 -0
figrecipe-0.5.0.dist-info/RECORD +26 -0
figrecipe-0.5.0.dist-info/WHEEL +4 -0
figrecipe-0.5.0.dist-info/licenses/LICENSE +661 -0

figrecipe/_validator.py ADDED Viewed

@@ -0,0 +1,186 @@
+#!/usr/bin/env python3
+# -*- coding: utf-8 -*-
+"""Reproducibility validation for figrecipe recipes."""
+import tempfile
+from dataclasses import dataclass
+from pathlib import Path
+from typing import Optional, Union
+import numpy as np
+@dataclass
+class ValidationResult:
+    """Outcome of comparing an original figure with its reproduction.
+    Attributes
+    ----------
+    valid : bool
+        Whether the reproduction was accepted.
+    mse : float
+        Mean squared error between the original and reproduced images.
+    psnr : float
+        Peak signal-to-noise ratio; an infinite value is reported by
+        ``summary`` as "identical".
+    max_diff : float
+        Largest per-pixel difference (0-255 scale).
+    size_original : tuple
+        (height, width) of the original image.
+    size_reproduced : tuple
+        (height, width) of the reproduced image.
+    same_size : bool
+        Whether both images have exactly the same dimensions.
+    file_size_diff : int
+        Difference between the two file sizes, in bytes.
+    message : str
+        Human-readable explanation of the outcome.
+    """
+    valid: bool
+    mse: float
+    psnr: float
+    max_diff: float
+    size_original: tuple
+    size_reproduced: tuple
+    same_size: bool
+    file_size_diff: int
+    message: str
+    def __repr__(self) -> str:
+        """Return a one-line digest: verdict, MSE and whether sizes match."""
+        verdict = "VALID" if self.valid else "INVALID"
+        size_state = "match" if self.same_size else "differ"
+        return f"ValidationResult({verdict}, mse={self.mse:.2f}, size={size_state})"
+    def summary(self) -> str:
+        """Return a multi-line report of every metric.
+        The ``message`` is appended as a trailing note only when the
+        result is not valid.
+        """
+        outcome = "PASSED" if self.valid else "FAILED"
+        dims_state = "match" if self.same_size else "DIFFER"
+        report = [f"Reproducibility Validation: {outcome}"]
+        report.append(
+            f"  Dimensions: {self.size_original} vs {self.size_reproduced} ({dims_state})"
+        )
+        report.append(f"  Pixel MSE: {self.mse:.2f}")
+        report.append(f"  Max pixel diff: {self.max_diff:.1f}")
+        # An infinite PSNR cannot be usefully formatted in dB, so it is spelled out.
+        if np.isinf(self.psnr):
+            report.append("  PSNR: inf (identical)")
+        else:
+            report.append(f"  PSNR: {self.psnr:.1f} dB")
+        report.append(f"  File size diff: {self.file_size_diff:+d} bytes")
+        if not self.valid:
+            report.append(f"  Note: {self.message}")
+        return "\n".join(report)
+def validate_recipe(
+    fig,
+    recipe_path: Union[str, Path],
+    mse_threshold: float = 100.0,
+    dpi: int = 150,
+) -> ValidationResult:
+    """Validate that a recipe can faithfully reproduce the original figure.
+    Both the original figure and the figure rebuilt from the recipe are
+    rendered to PNG files in a temporary directory at the same DPI and
+    then compared with ``compare_images``.
+    Parameters
+    ----------
+    fig : RecordingFigure
+        The original figure (with matplotlib figure accessible via fig.fig).
+    recipe_path : str or Path
+        Path to the saved recipe file.
+    mse_threshold : float
+        Maximum acceptable MSE for validation to pass (default: 100).
+        Lower values require closer matches.
+    dpi : int
+        DPI for comparison images (default: 150).
+    Returns
+    -------
+    ValidationResult
+        Detailed comparison results. A NaN ``mse`` or ``max_diff`` coming
+        back from the comparison is reported as ``inf``.
+    """
+    import matplotlib.pyplot as plt
+    from ._reproducer import reproduce
+    from ._utils._image_diff import compare_images
+    recipe_path = Path(recipe_path)
+    with tempfile.TemporaryDirectory() as tmpdir:
+        tmpdir = Path(tmpdir)
+        # Save original figure to temp image
+        original_path = tmpdir / "original.png"
+        fig.fig.savefig(original_path, dpi=dpi)
+        # Reproduce from recipe
+        reproduced_fig, _ = reproduce(recipe_path)
+        reproduced_path = tmpdir / "reproduced.png"
+        try:
+            # Save reproduced figure
+            reproduced_fig.savefig(reproduced_path, dpi=dpi)
+        finally:
+            # Close the reproduced figure even when saving fails, so it is
+            # not left registered with pyplot; this also prevents double
+            # display in notebooks.
+            plt.close(reproduced_fig)
+        # Compare images
+        diff = compare_images(original_path, reproduced_path)
+        # Determine validity
+        mse = diff["mse"]
+        mse_is_nan = np.isnan(mse)
+        if mse_is_nan:
+            # A NaN MSE is treated as "different sizes" - invalid
+            valid = False
+            message = f"Image dimensions differ: {diff['size1']} vs {diff['size2']}"
+        elif mse > mse_threshold:
+            valid = False
+            message = f"MSE ({mse:.2f}) exceeds threshold ({mse_threshold})"
+        else:
+            valid = True
+            message = "Reproduction matches original within threshold"
+        max_diff = diff["max_diff"]
+        return ValidationResult(
+            valid=valid,
+            mse=float("inf") if mse_is_nan else mse,
+            # NOTE(review): psnr is passed through unchanged; if the
+            # comparison yields NaN here for mismatched sizes it will be
+            # shown as "nan dB" by ValidationResult.summary - confirm.
+            psnr=diff["psnr"],
+            max_diff=float("inf") if np.isnan(max_diff) else max_diff,
+            size_original=diff["size1"],
+            size_reproduced=diff["size2"],
+            same_size=diff["same_size"],
+            file_size_diff=diff["file_size2"] - diff["file_size1"],
+            message=message,
+        )
+def validate_on_save(
+    fig,
+    recipe_path: Union[str, Path],
+    mse_threshold: float = 100.0,
+    dpi: int = 150,
+    raise_on_failure: bool = False,
+) -> Optional[ValidationResult]:
+    """Run ``validate_recipe`` right after a recipe has been written.
+    Parameters
+    ----------
+    fig : RecordingFigure
+        The original figure.
+    recipe_path : str or Path
+        Location of the recipe that was just saved.
+    mse_threshold : float
+        Largest MSE that still counts as a pass.
+    dpi : int
+        DPI used when rendering the comparison images.
+    raise_on_failure : bool
+        When True, a failed validation raises instead of being returned.
+    Returns
+    -------
+    ValidationResult
+        The validation outcome (returned for both passing results and,
+        when ``raise_on_failure`` is False, failing ones).
+    Raises
+    ------
+    ValueError
+        If raise_on_failure=True and validation fails.
+    """
+    outcome = validate_recipe(fig, recipe_path, mse_threshold, dpi)
+    # Guard clause: nothing to raise unless the caller asked for it AND
+    # the reproduction was rejected.
+    if not raise_on_failure or outcome.valid:
+        return outcome
+    raise ValueError(f"Recipe validation failed: {outcome.message}")

figrecipe/_wrappers/__init__.py ADDED Viewed

@@ -0,0 +1,8 @@
+#!/usr/bin/env python3
+# -*- coding: utf-8 -*-
+"""Matplotlib object wrappers for recording."""
+from ._axes import RecordingAxes
+from ._figure import RecordingFigure
+__all__ = ["RecordingAxes", "RecordingFigure"]

figrecipe/_wrappers/_axes.py ADDED Viewed

@@ -0,0 +1,327 @@
+#!/usr/bin/env python3
+# -*- coding: utf-8 -*-
+"""Wrapped Axes that records all plotting calls."""
+from typing import Any, Dict, List, Optional, Tuple, TYPE_CHECKING
+import numpy as np
+import matplotlib.pyplot as plt
+from matplotlib.axes import Axes
+if TYPE_CHECKING:
+    from .._recorder import Recorder
+class RecordingAxes:
+    """Wrapper around matplotlib Axes that records all calls.
+    Attribute access is forwarded to the wrapped axes. Callables whose
+    name is listed in the recorder's ``PLOTTING_METHODS`` or
+    ``DECORATION_METHODS`` are handed back wrapped, so that every
+    invocation is also logged through ``recorder.record_call`` for later
+    reproduction.
+    Parameters
+    ----------
+    ax : matplotlib.axes.Axes
+        The underlying matplotlib axes.
+    recorder : Recorder
+        The recorder instance to log calls to.
+    position : tuple
+        (row, col) position in the figure grid.
+    Examples
+    --------
+    >>> import figrecipe as ps
+    >>> fig, ax = ps.subplots()
+    >>> ax.plot([1, 2, 3], [4, 5, 6], color='red', id='my_line')
+    >>> # The call is recorded automatically
+    """
+    # Instance attributes owned by the wrapper itself. __getattr__ must
+    # never try to resolve these through the wrapped axes.
+    _OWN_ATTRS = ("_ax", "_recorder", "_position", "_track")
+    def __init__(
+        self,
+        ax: Axes,
+        recorder: "Recorder",
+        position: Tuple[int, int] = (0, 0),
+    ):
+        self._ax = ax
+        self._recorder = recorder
+        self._position = position
+        # Per-axes switch; toggled off temporarily by no_record().
+        self._track = True
+    @property
+    def ax(self) -> Axes:
+        """Get the underlying matplotlib axes."""
+        return self._ax
+    @property
+    def position(self) -> Tuple[int, int]:
+        """Get axes position in grid."""
+        return self._position
+    def __getattr__(self, name: str) -> Any:
+        """Intercept attribute access to wrap methods.
+        This is the core mechanism for recording calls. It is only
+        invoked when normal attribute lookup on the wrapper fails.
+        Raises
+        ------
+        AttributeError
+            If ``name`` is one of the wrapper's own attributes and it has
+            not been set, or if the wrapped axes has no such attribute.
+        """
+        # If one of our own attributes is missing (e.g. on an instance
+        # created without __init__ while being copied or unpickled),
+        # reading self._ax below would re-enter __getattr__ without end.
+        # Fail fast with the conventional error instead.
+        if name in self._OWN_ATTRS:
+            raise AttributeError(
+                f"{type(self).__name__!r} object has no attribute {name!r}"
+            )
+        attr = getattr(self._ax, name)
+        # If it's a plotting or decoration method, wrap it
+        if callable(attr) and (
+            name in self._recorder.PLOTTING_METHODS
+            or name in self._recorder.DECORATION_METHODS
+        ):
+            return self._create_recording_wrapper(name, attr)
+        # For other methods/attributes, return as-is
+        return attr
+    def _create_recording_wrapper(self, method_name: str, method: callable):
+        """Create a wrapper function that records the call.
+        Parameters
+        ----------
+        method_name : str
+            Name of the method.
+        method : callable
+            The original method.
+        Returns
+        -------
+        callable
+            Wrapped method that records calls. It accepts two extra
+            keyword arguments that are not forwarded to ``method``:
+            ``id`` (custom call ID) and ``track`` (set False to skip
+            recording this one call).
+        """
+        def wrapper(*args, id: Optional[str] = None, track: bool = True, **kwargs):
+            # Call the original method first (without our custom kwargs)
+            result = method(*args, **kwargs)
+            # Nothing to record when tracking is off for the axes or for
+            # this particular call.
+            if not (self._track and track):
+                return result
+            # Capture actual colors from result for plotting methods
+            # that use matplotlib's color cycle
+            recorded_kwargs = kwargs.copy()
+            uses_color_cycle = method_name in (
+                'plot', 'scatter', 'bar', 'barh', 'step', 'fill_between'
+            )
+            if (
+                uses_color_cycle
+                and 'color' not in recorded_kwargs
+                and 'c' not in recorded_kwargs
+            ):
+                actual_color = self._extract_color_from_result(method_name, result)
+                if actual_color is not None:
+                    recorded_kwargs['color'] = actual_color
+            self._recorder.record_call(
+                ax_position=self._position,
+                method_name=method_name,
+                args=args,
+                kwargs=recorded_kwargs,
+                call_id=id,
+            )
+            return result
+        return wrapper
+    def _extract_color_from_result(self, method_name: str, result) -> Optional[str]:
+        """Extract actual color used from plot result.
+        Parameters
+        ----------
+        method_name : str
+            Name of the plotting method.
+        result : Any
+            Return value from the plotting method.
+        Returns
+        -------
+        str or None
+            The color used, or None if not extractable (unknown method,
+            empty result, or any error while inspecting the result).
+        """
+        try:
+            if method_name in ('plot', 'step'):
+                # plot()/step() return a list of Line2D
+                if result and hasattr(result[0], 'get_color'):
+                    return result[0].get_color()
+            elif method_name in ('scatter', 'fill_between'):
+                # scatter() returns PathCollection, fill_between() returns
+                # PolyCollection; both expose an array of face colors.
+                if hasattr(result, 'get_facecolor'):
+                    fc = result.get_facecolor()
+                    if len(fc) > 0:
+                        # Convert RGBA to hex
+                        import matplotlib.colors as mcolors
+                        return mcolors.to_hex(fc[0])
+            elif method_name in ('bar', 'barh'):
+                # bar() returns BarContainer
+                if hasattr(result, 'patches') and result.patches:
+                    fc = result.patches[0].get_facecolor()
+                    import matplotlib.colors as mcolors
+                    return mcolors.to_hex(fc)
+        except Exception:
+            # Deliberately best-effort: failing to detect the color must
+            # never break the user's plotting call; the call is then
+            # recorded without an explicit color.
+            pass
+        return None
+    def no_record(self):
+        """Context manager to temporarily disable recording.
+        Examples
+        --------
+        >>> with ax.no_record():
+        ...     ax.plot([1, 2, 3], [4, 5, 6])  # Not recorded
+        """
+        return _NoRecordContext(self)
+    @staticmethod
+    def _is_array_marker(value: Any) -> bool:
+        """Return True only for the literal ``"__ARRAY__"`` placeholder.
+        The isinstance check comes first so that array-like values are
+        never compared with ``==`` (which would be element-wise and has
+        no single truth value).
+        """
+        return isinstance(value, str) and value == "__ARRAY__"
+    def record_seaborn_call(
+        self,
+        func_name: str,
+        args: tuple,
+        kwargs: Dict[str, Any],
+        data_arrays: Dict[str, np.ndarray],
+        call_id: Optional[str] = None,
+    ) -> None:
+        """Record a seaborn plotting call.
+        Does nothing while recording is disabled on this axes.
+        Parameters
+        ----------
+        func_name : str
+            Name of the seaborn function (e.g., 'scatterplot').
+        args : tuple
+            Processed positional arguments. An entry equal to
+            ``"__ARRAY__"`` is a placeholder for ``data_arrays["_arg_<i>"]``.
+        kwargs : dict
+            Processed keyword arguments. A value equal to ``"__ARRAY__"``
+            is a placeholder for ``data_arrays["_kwarg_<name>"]``.
+        data_arrays : dict
+            Dictionary of array data extracted from DataFrame/arrays.
+            Keys read here: ``_arg_<i>``, ``_kwarg_<name>``,
+            ``_col_<param>`` and the optional ``_colname_<param>``.
+        call_id : str, optional
+            Custom ID for this call.
+        """
+        if not self._track:
+            return
+        from .._utils._numpy_io import should_store_inline, to_serializable
+        def array_entry(arr, **header):
+            # Build one serialized-argument entry. Small arrays are
+            # embedded; others are marked "__FILE__" and carry the raw
+            # array under "_array".
+            entry = dict(header)
+            if should_store_inline(arr):
+                entry["data"] = to_serializable(arr)
+                entry["dtype"] = str(arr.dtype)
+            else:
+                entry["data"] = "__FILE__"
+                entry["dtype"] = str(arr.dtype)
+                entry["_array"] = arr
+            return entry
+        # Generate call ID if not provided
+        if call_id is None:
+            call_id = self._recorder._generate_call_id(f"sns_{func_name}")
+        # Process data arrays into args format
+        processed_args = []
+        for i, arg in enumerate(args):
+            if self._is_array_marker(arg):
+                key = f"_arg_{i}"
+                # NOTE(review): a placeholder without a matching array is
+                # dropped silently, exactly as before - confirm intended.
+                if key in data_arrays:
+                    processed_args.append(
+                        array_entry(data_arrays[key], name=f"arg{i}")
+                    )
+            else:
+                processed_args.append({
+                    "name": f"arg{i}",
+                    "data": arg,
+                })
+        # Process DataFrame column data
+        col_prefix = "_col_"
+        for key, arr in data_arrays.items():
+            if key.startswith(col_prefix):
+                param_name = key[len(col_prefix):]
+                col_name = data_arrays.get(f"_colname_{param_name}", param_name)
+                processed_args.append(
+                    array_entry(arr, name=col_name, param=param_name)
+                )
+        # Process kwarg arrays
+        processed_kwargs = dict(kwargs)
+        for key, value in kwargs.items():
+            if not self._is_array_marker(value):
+                continue
+            arr_key = f"_kwarg_{key}"
+            if arr_key in data_arrays:
+                arr = data_arrays[arr_key]
+                if should_store_inline(arr):
+                    processed_kwargs[key] = to_serializable(arr)
+                else:
+                    # Mark for file storage
+                    processed_kwargs[key] = "__FILE__"
+                    processed_kwargs[f"_array_{key}"] = arr
+        # Create call record
+        from .._recorder import CallRecord
+        record = CallRecord(
+            id=call_id,
+            function=f"sns.{func_name}",
+            args=processed_args,
+            kwargs=processed_kwargs,
+            ax_position=self._position,
+        )
+        # Add to axes record
+        ax_record = self._recorder.figure_record.get_or_create_axes(*self._position)
+        ax_record.add_call(record)
+    # Expose common properties directly
+    @property
+    def figure(self):
+        """Figure that the wrapped axes belongs to."""
+        return self._ax.figure
+    @property
+    def xaxis(self):
+        """The wrapped axes' ``xaxis`` attribute."""
+        return self._ax.xaxis
+    @property
+    def yaxis(self):
+        """The wrapped axes' ``yaxis`` attribute."""
+        return self._ax.yaxis
+    # Methods that should not be recorded
+    def get_xlim(self):
+        """Forward to the wrapped axes' ``get_xlim`` without recording."""
+        return self._ax.get_xlim()
+    def get_ylim(self):
+        """Forward to the wrapped axes' ``get_ylim`` without recording."""
+        return self._ax.get_ylim()
+    def get_xlabel(self):
+        """Forward to the wrapped axes' ``get_xlabel`` without recording."""
+        return self._ax.get_xlabel()
+    def get_ylabel(self):
+        """Forward to the wrapped axes' ``get_ylabel`` without recording."""
+        return self._ax.get_ylabel()
+    def get_title(self):
+        """Forward to the wrapped axes' ``get_title`` without recording."""
+        return self._ax.get_title()
+class _NoRecordContext:
+    """Context manager to temporarily disable recording.
+    On entry the axes' ``_track`` flag is remembered and set to False;
+    on exit the remembered value is put back. Exceptions raised inside
+    the ``with`` body are not suppressed.
+    Parameters
+    ----------
+    axes : RecordingAxes
+        The wrapper whose ``_track`` flag is toggled.
+    """
+    def __init__(self, axes: "RecordingAxes"):
+        self._axes = axes
+        # Initial value only; the authoritative snapshot is taken in
+        # __enter__ so a context created early (or reused) never restores
+        # a stale state.
+        self._original_track = axes._track
+    def __enter__(self):
+        # Snapshot at entry time, then switch recording off.
+        self._original_track = self._axes._track
+        self._axes._track = False
+        return self
+    def __exit__(self, exc_type, exc_val, exc_tb):
+        self._axes._track = self._original_track
+        # Returning False lets any exception from the body propagate.
+        return False