PyPI - figrecipe - Versions diffs - 0.5.0__py3-none-any.whl - Mend

figrecipe 0.5.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (26) hide show

figrecipe/__init__.py +1090 -0
figrecipe/_recorder.py +435 -0
figrecipe/_reproducer.py +358 -0
figrecipe/_seaborn.py +305 -0
figrecipe/_serializer.py +227 -0
figrecipe/_signatures/__init__.py +7 -0
figrecipe/_signatures/_loader.py +186 -0
figrecipe/_utils/__init__.py +32 -0
figrecipe/_utils/_crop.py +261 -0
figrecipe/_utils/_diff.py +98 -0
figrecipe/_utils/_image_diff.py +204 -0
figrecipe/_utils/_numpy_io.py +204 -0
figrecipe/_utils/_units.py +200 -0
figrecipe/_validator.py +186 -0
figrecipe/_wrappers/__init__.py +8 -0
figrecipe/_wrappers/_axes.py +327 -0
figrecipe/_wrappers/_figure.py +227 -0
figrecipe/plt.py +12 -0
figrecipe/pyplot.py +264 -0
figrecipe/styles/__init__.py +50 -0
figrecipe/styles/_style_applier.py +412 -0
figrecipe/styles/_style_loader.py +450 -0
figrecipe-0.5.0.dist-info/METADATA +336 -0
figrecipe-0.5.0.dist-info/RECORD +26 -0
figrecipe-0.5.0.dist-info/WHEEL +4 -0
figrecipe-0.5.0.dist-info/licenses/LICENSE +661 -0

figrecipe/_reproducer.py ADDED Viewed

@@ -0,0 +1,358 @@
+#!/usr/bin/env python3
+# -*- coding: utf-8 -*-
+"""Reproduce figures from recipe files."""
+from pathlib import Path
+from typing import Any, Dict, List, Optional, Tuple, Union
+import matplotlib.pyplot as plt
+import numpy as np
+from matplotlib.axes import Axes
+from matplotlib.figure import Figure
+from ._recorder import FigureRecord, CallRecord
+from ._serializer import load_recipe
+def reproduce(
+    path: Union[str, Path],
+    calls: Optional[List[str]] = None,
+    skip_decorations: bool = False,
+) -> Tuple[Figure, Union[Axes, List[Axes]]]:
+    """Load a recipe file and rebuild the figure it describes.
+    Parameters
+    ----------
+    path : str or Path
+        Location of the .yaml recipe file.
+    calls : list of str, optional
+        When given, only calls whose ID appears in this list are replayed.
+    skip_decorations : bool
+        When True, decoration calls (labels, legends, etc.) are not replayed.
+    Returns
+    -------
+    fig : matplotlib.figure.Figure
+        The rebuilt figure.
+    axes : Axes or list of Axes
+        The rebuilt axes (a single Axes for a 1x1 grid, otherwise a list).
+    Examples
+    --------
+    >>> import figrecipe as ps
+    >>> fig, ax = ps.reproduce("experiment_001.yaml")
+    >>> plt.show()
+    """
+    # Loading and replaying are separate steps; this function only chains them.
+    replay_options = {"calls": calls, "skip_decorations": skip_decorations}
+    return reproduce_from_record(load_recipe(path), **replay_options)
+def _axes_grid_position(ax_key: str) -> Tuple[int, int]:
+    """Return the (row, col) grid position encoded in an axes key.
+    The key is split on "_" and its second and third fields are read as the
+    row and column indices; keys with fewer than three fields map to (0, 0).
+    """
+    parts = ax_key.split("_")
+    if len(parts) >= 3:
+        return int(parts[1]), int(parts[2])
+    return 0, 0
+def reproduce_from_record(
+    record: FigureRecord,
+    calls: Optional[List[str]] = None,
+    skip_decorations: bool = False,
+) -> Tuple[Figure, Union[Axes, List[Axes]]]:
+    """Reproduce a figure from a FigureRecord.
+    The subplot grid is sized from the largest row/column index found in the
+    keys of ``record.axes``. The recorded layout and style are applied first,
+    then each axes' plotting calls are replayed, followed by its decorations.
+    Parameters
+    ----------
+    record : FigureRecord
+        The figure record to reproduce.
+    calls : list of str, optional
+        If provided, only reproduce these specific call IDs.
+    skip_decorations : bool
+        If True, skip decoration calls.
+    Returns
+    -------
+    fig : matplotlib.figure.Figure
+        Reproduced figure.
+    axes : Axes or list of Axes
+        A single Axes for a 1x1 grid, a flat list for a single row or a
+        single column, and a nested list (one list per row) otherwise.
+    """
+    # Parse every axes key once; the result drives both grid sizing and replay.
+    positions = {ax_key: _axes_grid_position(ax_key) for ax_key in record.axes}
+    nrows = max((row for row, _ in positions.values()), default=0) + 1
+    ncols = max((col for _, col in positions.values()), default=0) + 1
+    # squeeze=False always yields an (nrows, ncols) array of Axes, so no
+    # special-casing of 1x1 / 1xN / Nx1 grids is needed for indexing.
+    fig, axes_2d = plt.subplots(
+        nrows,
+        ncols,
+        figsize=record.figsize,
+        dpi=record.dpi,
+        constrained_layout=record.constrained_layout,
+        squeeze=False,
+    )
+    # Apply layout if recorded
+    if record.layout is not None:
+        fig.subplots_adjust(**record.layout)
+    # Apply style BEFORE replaying calls (to match original order:
+    # style is applied during subplots(), then user creates plots/decorations)
+    if record.style is not None:
+        from .styles import apply_style_mm
+        # .flat walks the grid row by row
+        for grid_ax in axes_2d.flat:
+            apply_style_mm(grid_ax, record.style)
+    # Build the ID filter once instead of scanning the list for every call.
+    wanted_ids = None if calls is None else set(calls)
+    for ax_key, ax_record in record.axes.items():
+        row, col = positions[ax_key]
+        ax = axes_2d[row, col]
+        # Replay plotting calls
+        for call in ax_record.calls:
+            if wanted_ids is None or call.id in wanted_ids:
+                _replay_call(ax, call)
+        # Replay decorations
+        if skip_decorations:
+            continue
+        for call in ax_record.decorations:
+            if wanted_ids is None or call.id in wanted_ids:
+                _replay_call(ax, call)
+    # Return in appropriate format
+    if nrows == 1 and ncols == 1:
+        return fig, axes_2d[0, 0]
+    if nrows == 1:
+        return fig, list(axes_2d[0])
+    if ncols == 1:
+        return fig, list(axes_2d[:, 0])
+    return fig, axes_2d.tolist()
+def _replay_call(ax: Axes, call: CallRecord) -> Any:
+    """Replay a single recorded call on an axes.
+    Calls whose function name starts with "sns." are delegated to
+    ``_replay_seaborn_call``; any other name is looked up as an attribute of
+    ``ax`` and invoked with the reconstructed positional arguments and a copy
+    of the recorded keyword arguments. Replay is best-effort: a missing
+    method or a failing call emits a warning and yields None.
+    Parameters
+    ----------
+    ax : Axes
+        The matplotlib axes.
+    call : CallRecord
+        The call to replay.
+    Returns
+    -------
+    Any
+        Result of the matplotlib call, or None when the call was skipped
+        or failed.
+    """
+    import warnings
+    method_name = call.function
+    # Check if it's a seaborn call
+    if method_name.startswith("sns."):
+        return _replay_seaborn_call(ax, call)
+    method = getattr(ax, method_name, None)
+    if method is None:
+        # Warn, as the seaborn replay path does for unknown functions, so a
+        # dropped call does not silently change the reproduced figure.
+        warnings.warn(f"Axes method {method_name} not found; call skipped")
+        return None
+    # Reconstruct args
+    args = [_reconstruct_value(arg_data) for arg_data in call.args]
+    # Copy so the recorded kwargs are never mutated by the callee
+    kwargs = call.kwargs.copy()
+    try:
+        return method(*args, **kwargs)
+    except Exception as e:
+        # Deliberate best-effort: report the failure and keep replaying
+        warnings.warn(f"Failed to replay {method_name}: {e}")
+        return None
+def _replay_seaborn_call(ax: Axes, call: CallRecord) -> Any:
+    """Replay a recorded seaborn call on an axes.
+    Recorded args that carry a "param" field are gathered into a DataFrame
+    that is passed as ``data``; the matching column-name kwargs are pointed
+    at those columns. Failures are reported as warnings, not raised.
+    Parameters
+    ----------
+    ax : Axes
+        The matplotlib axes.
+    call : CallRecord
+        The seaborn call to replay.
+    Returns
+    -------
+    Any
+        Result of the seaborn call, or None when seaborn/pandas is missing,
+        the function is unknown, or the call raised.
+    """
+    import warnings
+    try:
+        import seaborn as sns
+        import pandas as pd
+    except ImportError:
+        warnings.warn("seaborn/pandas required to replay seaborn calls")
+        return None
+    # Recorded names look like "sns.<function>"; drop the 4-character prefix
+    func_name = call.function[4:]
+    func = getattr(sns, func_name, None)
+    if func is None:
+        warnings.warn(f"Seaborn function {func_name} not found")
+        return None
+    # Collect DataFrame columns: each arg tagged with "param" is one column
+    columns = {}
+    column_for_param = {}
+    for entry in call.args:
+        column_values = _reconstruct_value(entry)
+        role = entry.get("param")
+        if role is None:
+            continue
+        # Fall back to the parameter name when no column name was recorded
+        label = entry.get("name") or role
+        columns[label] = column_values
+        column_for_param[role] = label
+    # Start from a copy of the recorded kwargs, minus underscore-prefixed keys
+    kwargs = call.kwargs.copy()
+    for private_key in [key for key in kwargs if key.startswith("_")]:
+        del kwargs[private_key]
+    if columns:
+        kwargs["data"] = pd.DataFrame(columns)
+        # Point the column-name parameters at the rebuilt columns
+        rebindable = ("x", "y", "hue", "size", "style", "row", "col")
+        for role, label in column_for_param.items():
+            if role in rebindable:
+                kwargs[role] = label
+    kwargs["ax"] = ax
+    # YAML serializes tuples as lists; 'sizes' is handed back as a tuple
+    sizes = kwargs.get("sizes")
+    if isinstance(sizes, list):
+        kwargs["sizes"] = tuple(sizes)
+    try:
+        return func(**kwargs)
+    except Exception as e:
+        warnings.warn(f"Failed to replay sns.{func_name}: {e}")
+        return None
+def _reconstruct_value(arg_data: Dict[str, Any]) -> Any:
+    """Turn one serialized argument entry back into a Python value.
+    Parameters
+    ----------
+    arg_data : dict
+        Serialized argument data.
+    Returns
+    -------
+    Any
+        The "_loaded_array" entry when present; otherwise the "data" entry,
+        converted to a numpy array when it is a list (using the recorded
+        "dtype" if numpy accepts it) and returned unchanged otherwise.
+    """
+    # A pre-loaded array always wins over inline data
+    if "_loaded_array" in arg_data:
+        return arg_data["_loaded_array"]
+    payload = arg_data.get("data")
+    if not isinstance(payload, list):
+        return payload
+    # A missing or empty dtype lets numpy infer one
+    requested_dtype = arg_data.get("dtype") or None
+    try:
+        return np.array(payload, dtype=requested_dtype)
+    except (TypeError, ValueError):
+        # The recorded dtype does not fit the data; retry with inference
+        return np.array(payload)
+def get_recipe_info(path: Union[str, Path]) -> Dict[str, Any]:
+    """Summarize a recipe file without rebuilding its figure.
+    Parameters
+    ----------
+    path : str or Path
+        Path to .yaml recipe file.
+    Returns
+    -------
+    dict
+        Recipe information including:
+        - id: Figure ID
+        - created: Creation timestamp
+        - matplotlib_version: Version used
+        - figsize: Figure size
+        - dpi: Figure DPI
+        - n_axes: Number of axes
+        - calls: One summary dict per call; plotting calls carry the
+          argument count and kwarg names, decorations carry
+          ``"type": "decoration"``
+    """
+    record = load_recipe(path)
+    summaries = []
+    for ax_record in record.axes.values():
+        # Plotting calls first, then decorations, for each axes in turn
+        summaries.extend(
+            {
+                "id": plot_call.id,
+                "function": plot_call.function,
+                "n_args": len(plot_call.args),
+                "kwargs": list(plot_call.kwargs.keys()),
+            }
+            for plot_call in ax_record.calls
+        )
+        summaries.extend(
+            {
+                "id": decoration.id,
+                "function": decoration.function,
+                "type": "decoration",
+            }
+            for decoration in ax_record.decorations
+        )
+    info = {
+        "id": record.id,
+        "created": record.created,
+        "matplotlib_version": record.matplotlib_version,
+        "figsize": record.figsize,
+        "dpi": record.dpi,
+        "n_axes": len(record.axes),
+        "calls": summaries,
+    }
+    return info

figrecipe/_seaborn.py ADDED Viewed

@@ -0,0 +1,305 @@
+#!/usr/bin/env python3
+# -*- coding: utf-8 -*-
+"""Seaborn wrapper for figrecipe recording."""
+from functools import wraps
+from typing import Any, Callable, Dict, List, Optional, TYPE_CHECKING
+import numpy as np
+try:
+    import seaborn as sns
+    import pandas as pd
+    HAS_SEABORN = True
+except ImportError:
+    HAS_SEABORN = False
+    sns = None
+    pd = None
+if TYPE_CHECKING:
+    from ._wrappers._axes import RecordingAxes
+# Seaborn axes-level plotting functions to wrap
+# SeabornRecorder.__getattr__ wraps only the names listed here for recording;
+# every other seaborn attribute is handed back unwrapped.
+# NOTE(review): seaborn documents "clustermap" as a figure-level function that
+# builds its own grid - confirm it belongs in this axes-level set.
+SEABORN_PLOT_FUNCTIONS = {
+    # Relational
+    "scatterplot",
+    "lineplot",
+    # Distribution
+    "histplot",
+    "kdeplot",
+    "ecdfplot",
+    "rugplot",
+    # Categorical
+    "stripplot",
+    "swarmplot",
+    "boxplot",
+    "violinplot",
+    "boxenplot",
+    "pointplot",
+    "barplot",
+    "countplot",
+    # Regression
+    "regplot",
+    "residplot",
+    # Matrix
+    "heatmap",
+    "clustermap",
+}
+def _check_seaborn():
+    """Raise ImportError when the optional seaborn import did not succeed."""
+    if HAS_SEABORN:
+        return
+    raise ImportError(
+        "seaborn is required for this functionality. "
+        "Install it with: pip install seaborn"
+    )
+def _extract_data_from_dataframe(
+    data: Optional["pd.DataFrame"],
+    x: Optional[str] = None,
+    y: Optional[str] = None,
+    hue: Optional[str] = None,
+    size: Optional[str] = None,
+    style: Optional[str] = None,
+    row: Optional[str] = None,
+    col: Optional[str] = None,
+    weight: Optional[str] = None,
+    weights: Optional[str] = None,
+) -> Dict[str, Any]:
+    """Pull the columns referenced by plot parameters out of a DataFrame.
+    Parameters
+    ----------
+    data : DataFrame or None
+        The data source.
+    x, y, hue, size, style, row, col, weight, weights : str or None
+        Column names to extract. Values that are not strings, or that do
+        not name a column of ``data``, are ignored.
+    Returns
+    -------
+    dict
+        For each extracted parameter ``p``, ``"_col_p"`` holds the column
+        values and ``"_colname_p"`` the column name. Empty when ``data``
+        is None.
+    """
+    if data is None:
+        return {}
+    # Parameter name -> requested column, in the order results are emitted
+    requested = {
+        "x": x,
+        "y": y,
+        "hue": hue,
+        "size": size,
+        "style": style,
+        "row": row,
+        "col": col,
+        "weight": weight,
+        "weights": weights,
+    }
+    extracted = {}
+    for param_name, col_name in requested.items():
+        # Only string references to existing columns are extracted
+        if not isinstance(col_name, str) or col_name not in data.columns:
+            continue
+        extracted[f"_col_{param_name}"] = data[col_name].values
+        extracted[f"_colname_{param_name}"] = col_name
+    return extracted
+def _has_array_values(value: Any) -> bool:
+    """Tell whether ``value`` exposes array data through a ``values`` attribute.
+    pandas objects expose ``values`` as a plain (non-callable) attribute,
+    whereas ``dict.values`` is a method. Requiring a non-callable attribute
+    keeps plain dicts (for example ``palette={...}``) out of the array path.
+    """
+    values = getattr(value, "values", None)
+    return values is not None and not callable(values)
+def _serialize_seaborn_args(
+    func_name: str,
+    args: tuple,
+    kwargs: Dict[str, Any],
+) -> tuple:
+    """Serialize seaborn function arguments.
+    Array-like values are moved into ``data_arrays`` and replaced by the
+    placeholder ``"__ARRAY__"``; directly serializable values are kept as
+    they are; anything else is stored as its ``str()`` form.
+    Parameters
+    ----------
+    func_name : str
+        Name of seaborn function (not used by the serialization itself).
+    args : tuple
+        Positional arguments.
+    kwargs : dict
+        Keyword arguments. ``data`` is handled through column extraction
+        and ``ax`` is skipped.
+    Returns
+    -------
+    tuple
+        (processed_args, processed_kwargs, data_arrays)
+    """
+    processed_kwargs = {}
+    data_arrays = {}
+    # Handle 'data' parameter (DataFrame)
+    data = kwargs.get("data")
+    if data is not None and hasattr(data, "columns"):
+        # Only the columns referenced by the plot parameters are kept
+        extracted = _extract_data_from_dataframe(
+            data,
+            x=kwargs.get("x"),
+            y=kwargs.get("y"),
+            hue=kwargs.get("hue"),
+            size=kwargs.get("size"),
+            style=kwargs.get("style"),
+            row=kwargs.get("row"),
+            col=kwargs.get("col"),
+            weight=kwargs.get("weight"),
+            weights=kwargs.get("weights"),
+        )
+        data_arrays.update(extracted)
+        # Flag that a DataFrame was supplied (the DataFrame itself is not stored)
+        processed_kwargs["_has_dataframe"] = True
+    # Process other kwargs
+    for key, value in kwargs.items():
+        if key in ("data", "ax"):
+            continue  # 'data' handled above, 'ax' handled by the caller
+        if isinstance(value, np.ndarray):
+            data_arrays[f"_kwarg_{key}"] = value
+            processed_kwargs[key] = "__ARRAY__"
+        elif _has_array_values(value):  # pandas Series and similar
+            data_arrays[f"_kwarg_{key}"] = np.asarray(value)
+            processed_kwargs[key] = "__ARRAY__"
+        elif _is_serializable(value):
+            # Plain dicts (palette, *_kws) now reach this branch
+            processed_kwargs[key] = value
+        else:
+            try:
+                processed_kwargs[key] = str(value)
+            except Exception:
+                # Best-effort: a value that cannot even be stringified is
+                # left out of the record rather than aborting the recording
+                pass
+    # Process positional args (less common for seaborn)
+    processed_args = []
+    for i, arg in enumerate(args):
+        if isinstance(arg, np.ndarray):
+            data_arrays[f"_arg_{i}"] = arg
+            processed_args.append("__ARRAY__")
+        elif _has_array_values(arg):
+            data_arrays[f"_arg_{i}"] = np.asarray(arg)
+            processed_args.append("__ARRAY__")
+        elif _is_serializable(arg):
+            processed_args.append(arg)
+        else:
+            processed_args.append(str(arg))
+    return tuple(processed_args), processed_kwargs, data_arrays
+def _is_serializable(value: Any) -> bool:
+    """Report whether ``value`` can be stored as-is.
+    Accepted are None, bool, int, float and str, lists/tuples whose items
+    are all accepted, and dicts with str keys whose values are all accepted.
+    """
+    if value is None or isinstance(value, (bool, int, float, str)):
+        return True
+    if isinstance(value, (list, tuple)):
+        for item in value:
+            if not _is_serializable(item):
+                return False
+        return True
+    if isinstance(value, dict):
+        for key, item in value.items():
+            if not isinstance(key, str) or not _is_serializable(item):
+                return False
+        return True
+    return False
+class SeabornRecorder:
+    """Proxy for the seaborn module that records its plotting calls."""
+    def __init__(self):
+        # Fail early when seaborn is not installed
+        _check_seaborn()
+    def __getattr__(self, name: str) -> Callable:
+        """Look up ``name`` on seaborn, wrapping it when it is a plot function.
+        Names starting with "_" and names seaborn does not have raise
+        AttributeError. Names outside SEABORN_PLOT_FUNCTIONS are returned
+        unwrapped.
+        """
+        if name.startswith("_"):
+            raise AttributeError(name)
+        if not hasattr(sns, name):
+            raise AttributeError(f"seaborn has no attribute '{name}'")
+        target = getattr(sns, name)
+        if name in SEABORN_PLOT_FUNCTIONS:
+            @wraps(target)
+            def recording_proxy(*args, **kwargs):
+                return self._record_and_call(name, target, args, kwargs)
+            return recording_proxy
+        # Not a plotting function: hand back the seaborn attribute itself
+        return target
+    def _record_and_call(
+        self,
+        func_name: str,
+        func: Callable,
+        args: tuple,
+        kwargs: Dict[str, Any],
+    ) -> Any:
+        """Run a seaborn function and record it when drawing on a RecordingAxes.
+        Parameters
+        ----------
+        func_name : str
+            Name of the seaborn function.
+        func : callable
+            The actual seaborn function.
+        args : tuple
+            Positional arguments.
+        kwargs : dict
+            Keyword arguments. An ``id`` entry is removed and used as the
+            call ID of the record; it is never forwarded to seaborn.
+        Returns
+        -------
+        Any
+            Result from the seaborn function.
+        """
+        from ._wrappers._axes import RecordingAxes
+        # Take the custom ID out before seaborn sees the kwargs
+        call_id = kwargs.pop("id", None)
+        ax = kwargs.get("ax")
+        if not isinstance(ax, RecordingAxes):
+            # Nothing to record on: plain pass-through
+            return func(*args, **kwargs)
+        # Recording is switched off while seaborn runs so the matplotlib
+        # calls it makes internally (e.g., scatter) are not recorded too;
+        # only the seaborn call itself should end up in the record.
+        with ax.no_record():
+            result = func(*args, **kwargs)
+        proc_args, proc_kwargs, data_arrays = _serialize_seaborn_args(
+            func_name, args, kwargs
+        )
+        # Recorded after leaving the no_record context
+        ax.record_seaborn_call(
+            func_name=func_name,
+            args=proc_args,
+            kwargs=proc_kwargs,
+            data_arrays=data_arrays,
+            call_id=call_id,
+        )
+        return result
+# Shared recorder, created lazily on the first get_seaborn_recorder() call
+_recorder: Optional[SeabornRecorder] = None
+def get_seaborn_recorder() -> SeabornRecorder:
+    """Return the module-wide SeabornRecorder, creating it on first use."""
+    global _recorder
+    if _recorder is not None:
+        return _recorder
+    _recorder = SeabornRecorder()
+    return _recorder