PyPI - pylocuszoom - Versions diffs - 0.1.0__py3-none-any.whl → 0.3.0__py3-none-any.whl - Mend

pylocuszoom: 0.1.0 (py3-none-any.whl) → 0.3.0 (py3-none-any.whl)

This diff compares the contents of two publicly available versions of a package, as released to one of the supported registries. It is provided for informational purposes only and reflects the changes between those versions as they appear in their respective public registries.

Files changed (20)

pylocuszoom/__init__.py +39 -20
pylocuszoom/backends/__init__.py +1 -5
pylocuszoom/backends/base.py +3 -1
pylocuszoom/backends/bokeh_backend.py +220 -51
pylocuszoom/backends/matplotlib_backend.py +35 -8
pylocuszoom/backends/plotly_backend.py +273 -32
pylocuszoom/colors.py +132 -0
pylocuszoom/eqtl.py +3 -2
pylocuszoom/finemapping.py +223 -0
pylocuszoom/gene_track.py +259 -38
pylocuszoom/labels.py +32 -33
pylocuszoom/ld.py +8 -7
pylocuszoom/plotter.py +615 -162
pylocuszoom/recombination.py +14 -14
pylocuszoom/utils.py +3 -1
{pylocuszoom-0.1.0.dist-info → pylocuszoom-0.3.0.dist-info}/METADATA +36 -27
pylocuszoom-0.3.0.dist-info/RECORD +21 -0
pylocuszoom-0.1.0.dist-info/RECORD +0 -20
{pylocuszoom-0.1.0.dist-info → pylocuszoom-0.3.0.dist-info}/WHEEL +0 -0
{pylocuszoom-0.1.0.dist-info → pylocuszoom-0.3.0.dist-info}/licenses/LICENSE.md +0 -0

pylocuszoom/plotter.py (changed)

@@ -10,7 +10,7 @@ Supports multiple backends:
 """
 from pathlib import Path
-from typing import Any, List, Optional, Tuple, Union
+from typing import Any, List, Optional, Tuple
 import matplotlib.pyplot as plt
 import numpy as np
@@ -19,30 +19,43 @@ from matplotlib.axes import Axes
 from matplotlib.figure import Figure
 from matplotlib.lines import Line2D
 from matplotlib.patches import Patch
-from matplotlib.ticker import FuncFormatter, MaxNLocator
-from .backends import BackendType, PlotBackend, get_backend
+from .backends import BackendType, get_backend
 from .colors import (
+    EQTL_NEGATIVE_BINS,
+    EQTL_POSITIVE_BINS,
     LD_BINS,
     LEAD_SNP_COLOR,
+    PIP_LINE_COLOR,
+    get_credible_set_color,
+    get_eqtl_color,
     get_ld_bin,
     get_ld_color_palette,
 )
-from .gene_track import assign_gene_positions, plot_gene_track
+from .eqtl import validate_eqtl_df
+from .finemapping import (
+    get_credible_sets,
+    prepare_finemapping_for_plotting,
+)
+from .gene_track import (
+    assign_gene_positions,
+    plot_gene_track,
+    plot_gene_track_generic,
+)
 from .labels import add_snp_labels
 from .ld import calculate_ld, find_plink
 from .logging import enable_logging, logger
 from .recombination import (
+    RECOMB_COLOR,
     add_recombination_overlay,
-    download_dog_recombination_maps,
+    download_canine_recombination_maps,
     get_default_data_dir,
     get_recombination_rate_for_region,
 )
 from .utils import normalize_chrom, validate_genes_df, validate_gwas_df
-# Default significance threshold: 5e-8 for human, 5e-7 for dog
-DEFAULT_GENOMEWIDE_THRESHOLD = 5e-7
+# Default significance threshold: 5e-8 (genome-wide significance)
+DEFAULT_GENOMEWIDE_THRESHOLD = 5e-8
 DEFAULT_GENOMEWIDE_LINE = -np.log10(DEFAULT_GENOMEWIDE_THRESHOLD)
@@ -52,7 +65,7 @@ class LocusZoomPlotter:
     Creates LocusZoom-style regional plots with:
     - LD coloring based on R² with lead variant
     - Gene and exon tracks
-    - Recombination rate overlays (dog built-in, or user-provided)
+    - Recombination rate overlays (canine built-in, or user-provided)
     - Automatic SNP labeling
     Supports multiple rendering backends:
@@ -61,9 +74,9 @@ class LocusZoomPlotter:
     - bokeh: Interactive HTML for dashboards
     Args:
-        species: Species name ('dog', 'cat', or None for custom).
-            Dog has built-in recombination maps.
-        genome_build: Genome build for coordinate system. For dog:
+        species: Species name ('canine', 'feline', or None for custom).
+            Canine has built-in recombination maps.
+        genome_build: Genome build for coordinate system. For canine:
             "canfam3.1" (default) or "canfam4". If "canfam4", recombination
             maps are automatically lifted over from CanFam3.1.
         backend: Plotting backend ('matplotlib', 'plotly', or 'bokeh').
@@ -78,10 +91,10 @@ class LocusZoomPlotter:
     Example:
         >>> # Static plot (default)
-        >>> plotter = LocusZoomPlotter(species="dog")
+        >>> plotter = LocusZoomPlotter(species="canine")
         >>>
         >>> # Interactive plot with plotly
-        >>> plotter = LocusZoomPlotter(species="dog", backend="plotly")
+        >>> plotter = LocusZoomPlotter(species="canine", backend="plotly")
         >>>
         >>> fig = plotter.plot(
         ...     gwas_df,
@@ -96,7 +109,7 @@ class LocusZoomPlotter:
     def __init__(
         self,
-        species: str = "dog",
+        species: str = "canine",
         genome_build: Optional[str] = None,
         backend: BackendType = "matplotlib",
         plink_path: Optional[str] = None,
@@ -126,9 +139,9 @@ class LocusZoomPlotter:
     @staticmethod
     def _default_build(species: str) -> Optional[str]:
         """Get default genome build for species."""
-        if species == "dog":
+        if species == "canine":
             return "canfam3.1"
-        if species == "cat":
+        if species == "feline":
             return "felCat9"
         return None
@@ -137,7 +150,7 @@ class LocusZoomPlotter:
         Returns path to recombination map directory, or None if not available.
         """
-        if self.species == "dog":
+        if self.species == "canine":
             if self.recomb_data_dir:
                 return Path(self.recomb_data_dir)
             # Check if already downloaded
@@ -149,7 +162,7 @@ class LocusZoomPlotter:
                 return default_dir
             # Download
             try:
-                return download_dog_recombination_maps()
+                return download_canine_recombination_maps()
             except Exception as e:
                 logger.warning(f"Could not download recombination maps: {e}")
                 return None
@@ -249,20 +262,27 @@ class LocusZoomPlotter:
         # Calculate LD if reference file provided
         if ld_reference_file and lead_pos and ld_col is None:
-            lead_snp_row = df[df[pos_col] == lead_pos]
-            if not lead_snp_row.empty:
-                lead_snp_id = lead_snp_row[rs_col].iloc[0]
-                logger.debug(f"Calculating LD for lead SNP {lead_snp_id}")
-                ld_df = calculate_ld(
-                    bfile_path=ld_reference_file,
-                    lead_snp=lead_snp_id,
-                    window_kb=max((end - start) // 1000, 500),
-                    plink_path=self.plink_path,
-                    species=self.species,
+            # Check if rs_col exists before attempting LD calculation
+            if rs_col not in df.columns:
+                logger.warning(
+                    f"Cannot calculate LD: column '{rs_col}' not found in GWAS data. "
+                    f"Provide rs_col parameter or add SNP IDs to DataFrame."
                 )
-                if not ld_df.empty:
-                    df = df.merge(ld_df, left_on=rs_col, right_on="SNP", how="left")
-                    ld_col = "R2"
+            else:
+                lead_snp_row = df[df[pos_col] == lead_pos]
+                if not lead_snp_row.empty:
+                    lead_snp_id = lead_snp_row[rs_col].iloc[0]
+                    logger.debug(f"Calculating LD for lead SNP {lead_snp_id}")
+                    ld_df = calculate_ld(
+                        bfile_path=ld_reference_file,
+                        lead_snp=lead_snp_id,
+                        window_kb=max((end - start) // 1000, 500),
+                        plink_path=self.plink_path,
+                        species=self.species,
+                    )
+                    if not ld_df.empty:
+                        df = df.merge(ld_df, left_on=rs_col, right_on="SNP", how="left")
+                        ld_col = "R2"
         # Load recombination data if needed
         if show_recombination and recomb_df is None:
@@ -272,61 +292,70 @@ class LocusZoomPlotter:
         fig, ax, gene_ax = self._create_figure(genes_df, chrom, start, end, figsize)
         # Plot association data
-        self._plot_association(ax, df, pos_col, ld_col, lead_pos)
+        self._plot_association(ax, df, pos_col, ld_col, lead_pos, rs_col, p_col)
         # Add significance line
-        ax.axhline(
+        self._backend.axhline(
+            ax,
             y=self._genomewide_line,
-            color="grey",
+            color="red",
             linestyle="--",
             linewidth=1,
+            alpha=0.65,
             zorder=1,
         )
-        # Add SNP labels
+        # Add SNP labels (matplotlib only - interactive backends use hover tooltips)
         if snp_labels and rs_col in df.columns and label_top_n > 0 and not df.empty:
-            add_snp_labels(
-                ax,
-                df,
-                pos_col=pos_col,
-                neglog10p_col="neglog10p",
-                rs_col=rs_col,
-                label_top_n=label_top_n,
-                genes_df=genes_df,
-                chrom=chrom,
-            )
+            if self.backend_name == "matplotlib":
+                add_snp_labels(
+                    ax,
+                    df,
+                    pos_col=pos_col,
+                    neglog10p_col="neglog10p",
+                    rs_col=rs_col,
+                    label_top_n=label_top_n,
+                    genes_df=genes_df,
+                    chrom=chrom,
+                )
-        # Add recombination overlay
+        # Add recombination overlay (all backends)
         if recomb_df is not None and not recomb_df.empty:
-            add_recombination_overlay(ax, recomb_df, start, end)
+            if self.backend_name == "matplotlib":
+                add_recombination_overlay(ax, recomb_df, start, end)
+            else:
+                self._add_recombination_overlay_generic(ax, recomb_df, start, end)
         # Format axes
-        ax.set_ylabel(r"$-\log_{10}$ P")
-        ax.set_xlim(start, end)
-        ax.spines["top"].set_visible(False)
-        ax.spines["right"].set_visible(False)
+        self._backend.set_ylabel(ax, r"$-\log_{10}$ P")
+        self._backend.set_xlim(ax, start, end)
+        self._backend.hide_spines(ax, ["top", "right"])
-        # Add LD legend
+        # Add LD legend (all backends)
         if ld_col is not None and ld_col in df.columns:
-            self._add_ld_legend(ax)
+            if self.backend_name == "matplotlib":
+                self._add_ld_legend(ax)
+            else:
+                self._backend.add_ld_legend(ax, LD_BINS, LEAD_SNP_COLOR)
-        # Plot gene track
+        # Plot gene track (all backends)
         if genes_df is not None and gene_ax is not None:
-            plot_gene_track(gene_ax, genes_df, chrom, start, end, exons_df)
-            gene_ax.set_xlabel(f"Chromosome {chrom} (Mb)")
-            gene_ax.spines["top"].set_visible(False)
-            gene_ax.spines["right"].set_visible(False)
-            gene_ax.spines["left"].set_visible(False)
+            if self.backend_name == "matplotlib":
+                plot_gene_track(gene_ax, genes_df, chrom, start, end, exons_df)
+            else:
+                plot_gene_track_generic(
+                    gene_ax, self._backend, genes_df, chrom, start, end, exons_df
+                )
+            self._backend.set_xlabel(gene_ax, f"Chromosome {chrom} (Mb)")
+            self._backend.hide_spines(gene_ax, ["top", "right", "left"])
         else:
-            ax.set_xlabel(f"Chromosome {chrom} (Mb)")
+            self._backend.set_xlabel(ax, f"Chromosome {chrom} (Mb)")
         # Format x-axis with Mb labels
-        ax.xaxis.set_major_formatter(FuncFormatter(lambda x, _: f"{x / 1e6:.2f}"))
-        ax.xaxis.set_major_locator(MaxNLocator(nbins=6))
+        self._backend.format_xaxis_mb(ax)
         # Adjust layout
-        fig.subplots_adjust(left=0.08, right=0.95, top=0.95, bottom=0.1, hspace=0.08)
-        plt.ion()
+        self._backend.finalize_layout(fig, hspace=0.1)
         return fig
@@ -364,18 +393,20 @@ class LocusZoomPlotter:
             assoc_height = figsize[1] * 0.6
             total_height = assoc_height + gene_track_height
-            fig, axes = plt.subplots(
-                2,
-                1,
-                figsize=(figsize[0], total_height),
+            fig, axes = self._backend.create_figure(
+                n_panels=2,
                 height_ratios=[assoc_height, gene_track_height],
+                figsize=(figsize[0], total_height),
                 sharex=True,
-                gridspec_kw={"hspace": 0},
             )
             return fig, axes[0], axes[1]
         else:
-            fig, ax = plt.subplots(figsize=(figsize[0], figsize[1] * 0.75))
-            return fig, ax, None
+            fig, axes = self._backend.create_figure(
+                n_panels=1,
+                height_ratios=[1.0],
+                figsize=(figsize[0], figsize[1] * 0.75),
+            )
+            return fig, axes[0], None
     def _plot_association(
         self,
@@ -384,8 +415,28 @@ class LocusZoomPlotter:
         pos_col: str,
         ld_col: Optional[str],
         lead_pos: Optional[int],
+        rs_col: Optional[str] = None,
+        p_col: Optional[str] = None,
     ) -> None:
         """Plot association scatter with LD coloring."""
+        def _build_hover_data(subset_df: pd.DataFrame) -> Optional[pd.DataFrame]:
+            """Build hover data for interactive backends."""
+            hover_cols = {}
+            # RS ID first (will be bold in hover)
+            if rs_col and rs_col in subset_df.columns:
+                hover_cols["SNP"] = subset_df[rs_col].values
+            # Position
+            if pos_col in subset_df.columns:
+                hover_cols["Position"] = subset_df[pos_col].values
+            # P-value
+            if p_col and p_col in subset_df.columns:
+                hover_cols["P-value"] = subset_df[p_col].values
+            # LD
+            if ld_col and ld_col in subset_df.columns:
+                hover_cols["R²"] = subset_df[ld_col].values
+            return pd.DataFrame(hover_cols) if hover_cols else None
         # LD-based coloring
         if ld_col is not None and ld_col in df.columns:
             df["ld_bin"] = df[ld_col].apply(get_ld_bin)
@@ -394,40 +445,46 @@ class LocusZoomPlotter:
             palette = get_ld_color_palette()
             for bin_label in df["ld_bin"].unique():
                 bin_data = df[df["ld_bin"] == bin_label]
-                ax.scatter(
+                self._backend.scatter(
+                    ax,
                     bin_data[pos_col],
                     bin_data["neglog10p"],
-                    c=palette.get(bin_label, "#BEBEBE"),
-                    s=60,
+                    colors=palette.get(bin_label, "#BEBEBE"),
+                    sizes=60,
                     edgecolor="black",
                     linewidth=0.5,
                     zorder=2,
+                    hover_data=_build_hover_data(bin_data),
                 )
         else:
             # Default: grey points
-            ax.scatter(
+            self._backend.scatter(
+                ax,
                 df[pos_col],
                 df["neglog10p"],
-                c="#BEBEBE",
-                s=60,
+                colors="#BEBEBE",
+                sizes=60,
                 edgecolor="black",
                 linewidth=0.5,
                 zorder=2,
+                hover_data=_build_hover_data(df),
             )
-        # Highlight lead SNP
+        # Highlight lead SNP with larger, more prominent marker
         if lead_pos is not None:
             lead_snp = df[df[pos_col] == lead_pos]
             if not lead_snp.empty:
-                ax.scatter(
+                self._backend.scatter(
+                    ax,
                     lead_snp[pos_col],
                     lead_snp["neglog10p"],
-                    c=LEAD_SNP_COLOR,
-                    s=120,
+                    colors=LEAD_SNP_COLOR,
+                    sizes=120,  # Larger than regular points for visibility
                     marker="D",
-                    edgecolors="black",
-                    linewidths=1,
+                    edgecolor="black",
+                    linewidth=1.5,
                     zorder=10,
+                    hover_data=_build_hover_data(lead_snp),
                 )
     def _add_ld_legend(self, ax: Axes) -> None:
@@ -441,8 +498,8 @@ class LocusZoomPlotter:
                 color="w",
                 markerfacecolor=LEAD_SNP_COLOR,
                 markeredgecolor="black",
-                markersize=8,
-                label="Index SNP",
+                markersize=6,
+                label="Lead SNP",
             ),
         ]
@@ -457,7 +514,7 @@ class LocusZoomPlotter:
         ax.legend(
             handles=legend_elements,
-            loc="upper left",
+            loc="upper right",
             fontsize=9,
             frameon=True,
             framealpha=0.9,
@@ -468,6 +525,249 @@ class LocusZoomPlotter:
             labelspacing=0.4,
         )
+    def _add_recombination_overlay_generic(
+        self,
+        ax: Any,
+        recomb_df: pd.DataFrame,
+        start: int,
+        end: int,
+    ) -> None:
+        """Add recombination overlay for interactive backends (plotly/bokeh).
+        Creates a secondary y-axis with recombination rate line and fill.
+        """
+        # Filter to region
+        region_recomb = recomb_df[
+            (recomb_df["pos"] >= start) & (recomb_df["pos"] <= end)
+        ].copy()
+        if region_recomb.empty:
+            return
+        # Create secondary y-axis
+        yaxis_name = self._backend.create_twin_axis(ax)
+        # For plotly, yaxis_name is a tuple (fig, row, secondary_y)
+        # For bokeh, yaxis_name is just a string
+        if isinstance(yaxis_name, tuple):
+            _, _, secondary_y = yaxis_name
+        else:
+            secondary_y = yaxis_name
+        # Plot fill under curve
+        self._backend.fill_between_secondary(
+            ax,
+            region_recomb["pos"],
+            0,
+            region_recomb["rate"],
+            color=RECOMB_COLOR,
+            alpha=0.15,
+            yaxis_name=secondary_y,
+        )
+        # Plot recombination rate line
+        self._backend.line_secondary(
+            ax,
+            region_recomb["pos"],
+            region_recomb["rate"],
+            color=RECOMB_COLOR,
+            linewidth=1.5,
+            alpha=0.7,
+            yaxis_name=secondary_y,
+        )
+        # Set y-axis limits and label
+        max_rate = region_recomb["rate"].max()
+        self._backend.set_secondary_ylim(
+            ax, 0, max(max_rate * 1.2, 20), yaxis_name=secondary_y
+        )
+        self._backend.set_secondary_ylabel(
+            ax,
+            "Recombination rate (cM/Mb)",
+            color=RECOMB_COLOR,
+            fontsize=9,
+            yaxis_name=secondary_y,
+        )
+    def _add_eqtl_legend(self, ax: Axes) -> None:
+        """Add eQTL effect size legend to plot."""
+        legend_elements = []
+        # Positive effects (upward triangles)
+        for _, _, label, color in EQTL_POSITIVE_BINS:
+            legend_elements.append(
+                Line2D(
+                    [0],
+                    [0],
+                    marker="^",
+                    color="w",
+                    markerfacecolor=color,
+                    markeredgecolor="black",
+                    markersize=7,
+                    label=label,
+                )
+            )
+        # Negative effects (downward triangles)
+        for _, _, label, color in EQTL_NEGATIVE_BINS:
+            legend_elements.append(
+                Line2D(
+                    [0],
+                    [0],
+                    marker="v",
+                    color="w",
+                    markerfacecolor=color,
+                    markeredgecolor="black",
+                    markersize=7,
+                    label=label,
+                )
+            )
+        ax.legend(
+            handles=legend_elements,
+            loc="upper right",
+            fontsize=8,
+            frameon=True,
+            framealpha=0.9,
+            title="eQTL effect",
+            title_fontsize=9,
+            handlelength=1.2,
+            handleheight=1.0,
+            labelspacing=0.3,
+        )
+    def _plot_finemapping(
+        self,
+        ax: Axes,
+        df: pd.DataFrame,
+        pos_col: str = "pos",
+        pip_col: str = "pip",
+        cs_col: Optional[str] = "cs",
+        show_credible_sets: bool = True,
+        pip_threshold: float = 0.0,
+    ) -> None:
+        """Plot fine-mapping results (PIP line with credible set coloring).
+        Args:
+            ax: Matplotlib axes object.
+            df: Fine-mapping DataFrame with pos and pip columns.
+            pos_col: Column name for position.
+            pip_col: Column name for posterior inclusion probability.
+            cs_col: Column name for credible set assignment (optional).
+            show_credible_sets: Whether to color points by credible set.
+            pip_threshold: Minimum PIP to display as scatter point.
+        """
+        # Sort by position for line plotting
+        df = df.sort_values(pos_col)
+        # Plot PIP as line
+        self._backend.line(
+            ax,
+            df[pos_col],
+            df[pip_col],
+            color=PIP_LINE_COLOR,
+            linewidth=1.5,
+            alpha=0.8,
+            zorder=1,
+        )
+        # Check if credible sets are available
+        has_cs = cs_col is not None and cs_col in df.columns and show_credible_sets
+        credible_sets = get_credible_sets(df, cs_col) if has_cs else []
+        if credible_sets:
+            # Plot points colored by credible set
+            for cs_id in credible_sets:
+                cs_data = df[df[cs_col] == cs_id]
+                color = get_credible_set_color(cs_id)
+                self._backend.scatter(
+                    ax,
+                    cs_data[pos_col],
+                    cs_data[pip_col],
+                    colors=color,
+                    sizes=50,
+                    marker="o",
+                    edgecolor="black",
+                    linewidth=0.5,
+                    zorder=3,
+                    label=f"CS{cs_id}",
+                )
+            # Plot variants not in any credible set
+            non_cs_data = df[(df[cs_col].isna()) | (df[cs_col] == 0)]
+            if not non_cs_data.empty and pip_threshold > 0:
+                non_cs_data = non_cs_data[non_cs_data[pip_col] >= pip_threshold]
+                if not non_cs_data.empty:
+                    self._backend.scatter(
+                        ax,
+                        non_cs_data[pos_col],
+                        non_cs_data[pip_col],
+                        colors="#BEBEBE",
+                        sizes=30,
+                        marker="o",
+                        edgecolor="black",
+                        linewidth=0.3,
+                        zorder=2,
+                    )
+        else:
+            # No credible sets - show all points above threshold
+            if pip_threshold > 0:
+                high_pip = df[df[pip_col] >= pip_threshold]
+                if not high_pip.empty:
+                    self._backend.scatter(
+                        ax,
+                        high_pip[pos_col],
+                        high_pip[pip_col],
+                        colors=PIP_LINE_COLOR,
+                        sizes=50,
+                        marker="o",
+                        edgecolor="black",
+                        linewidth=0.5,
+                        zorder=3,
+                    )
+    def _add_finemapping_legend(
+        self,
+        ax: Axes,
+        credible_sets: List[int],
+    ) -> None:
+        """Add fine-mapping legend showing credible sets.
+        Args:
+            ax: Matplotlib axes object.
+            credible_sets: List of credible set IDs to include.
+        """
+        if not credible_sets:
+            return
+        legend_elements = []
+        for cs_id in credible_sets:
+            color = get_credible_set_color(cs_id)
+            legend_elements.append(
+                Line2D(
+                    [0],
+                    [0],
+                    marker="o",
+                    color="w",
+                    markerfacecolor=color,
+                    markeredgecolor="black",
+                    markersize=7,
+                    label=f"CS{cs_id}",
+                )
+            )
+        ax.legend(
+            handles=legend_elements,
+            loc="upper right",
+            fontsize=8,
+            frameon=True,
+            framealpha=0.9,
+            title="Credible sets",
+            title_fontsize=9,
+            handlelength=1.2,
+            handleheight=1.0,
+            labelspacing=0.3,
+        )
     def plot_stacked(
         self,
         gwas_dfs: List[pd.DataFrame],
@@ -478,10 +778,13 @@ class LocusZoomPlotter:
         panel_labels: Optional[List[str]] = None,
         ld_reference_file: Optional[str] = None,
         ld_reference_files: Optional[List[str]] = None,
+        ld_col: Optional[str] = None,
         genes_df: Optional[pd.DataFrame] = None,
         exons_df: Optional[pd.DataFrame] = None,
         eqtl_df: Optional[pd.DataFrame] = None,
         eqtl_gene: Optional[str] = None,
+        finemapping_df: Optional[pd.DataFrame] = None,
+        finemapping_cs_col: Optional[str] = "cs",
         recomb_df: Optional[pd.DataFrame] = None,
         show_recombination: bool = True,
         snp_labels: bool = True,
@@ -506,10 +809,15 @@ class LocusZoomPlotter:
             panel_labels: Labels for each panel (e.g., phenotype names).
             ld_reference_file: Single PLINK fileset for all panels.
             ld_reference_files: List of PLINK filesets (one per panel).
+            ld_col: Column name for pre-computed LD (R²) values in each DataFrame.
+                Use this if LD was calculated externally.
             genes_df: Gene annotations for bottom track.
             exons_df: Exon annotations for gene track.
             eqtl_df: eQTL data to display as additional panel.
             eqtl_gene: Filter eQTL data to this target gene.
+            finemapping_df: Fine-mapping/SuSiE results with pos and pip columns.
+                Displayed as PIP line with optional credible set coloring.
+            finemapping_cs_col: Column name for credible set assignment in finemapping_df.
             recomb_df: Pre-loaded recombination rate data.
             show_recombination: Whether to show recombination overlay.
             snp_labels: Whether to label top SNPs.
@@ -534,11 +842,30 @@ class LocusZoomPlotter:
         if n_gwas == 0:
             raise ValueError("At least one GWAS DataFrame required")
+        # Validate list lengths match
+        if lead_positions is not None and len(lead_positions) != n_gwas:
+            raise ValueError(
+                f"lead_positions length ({len(lead_positions)}) must match "
+                f"number of GWAS DataFrames ({n_gwas})"
+            )
+        if panel_labels is not None and len(panel_labels) != n_gwas:
+            raise ValueError(
+                f"panel_labels length ({len(panel_labels)}) must match "
+                f"number of GWAS DataFrames ({n_gwas})"
+            )
+        if ld_reference_files is not None and len(ld_reference_files) != n_gwas:
+            raise ValueError(
+                f"ld_reference_files length ({len(ld_reference_files)}) must match "
+                f"number of GWAS DataFrames ({n_gwas})"
+            )
         # Validate inputs
         for i, df in enumerate(gwas_dfs):
             validate_gwas_df(df, pos_col=pos_col, p_col=p_col)
         if genes_df is not None:
             validate_genes_df(genes_df)
+        if eqtl_df is not None:
+            validate_eqtl_df(eqtl_df)
         # Handle lead positions
         if lead_positions is None:
@@ -558,12 +885,16 @@ class LocusZoomPlotter:
         # Calculate panel layout
         panel_height = 2.5  # inches per GWAS panel
         eqtl_height = 2.0 if eqtl_df is not None else 0
+        finemapping_height = 1.5 if finemapping_df is not None else 0
         # Gene track height
         if genes_df is not None:
             chrom_str = normalize_chrom(chrom)
             region_genes = genes_df[
-                (genes_df["chr"].astype(str).str.replace("chr", "", regex=False) == chrom_str)
+                (
+                    genes_df["chr"].astype(str).str.replace("chr", "", regex=False)
+                    == chrom_str
+                )
                 & (genes_df["end"] >= start)
                 & (genes_df["start"] <= end)
             ]
@@ -579,8 +910,15 @@ class LocusZoomPlotter:
             gene_track_height = 0
         # Calculate total panels and heights
-        n_panels = n_gwas + (1 if eqtl_df is not None else 0) + (1 if genes_df is not None else 0)
+        n_panels = (
+            n_gwas
+            + (1 if finemapping_df is not None else 0)
+            + (1 if eqtl_df is not None else 0)
+            + (1 if genes_df is not None else 0)
+        )
         height_ratios = [panel_height] * n_gwas
+        if finemapping_df is not None:
+            height_ratios.append(finemapping_height)
         if eqtl_df is not None:
             height_ratios.append(eqtl_height)
         if genes_df is not None:
@@ -590,26 +928,21 @@ class LocusZoomPlotter:
         total_height = figsize[1] if figsize[1] else sum(height_ratios)
         actual_figsize = (figsize[0], total_height)
-        logger.debug(f"Creating stacked plot with {n_panels} panels for chr{chrom}:{start}-{end}")
-        # Prevent auto-display in interactive environments
-        plt.ioff()
+        logger.debug(
+            f"Creating stacked plot with {n_panels} panels for chr{chrom}:{start}-{end}"
+        )
         # Load recombination data if needed
         if show_recombination and recomb_df is None:
             recomb_df = self._get_recomb_for_region(chrom, start, end)
-        # Create figure
-        fig, axes = plt.subplots(
-            n_panels,
-            1,
-            figsize=actual_figsize,
+        # Create figure using backend
+        fig, axes = self._backend.create_figure(
+            n_panels=n_panels,
             height_ratios=height_ratios,
+            figsize=actual_figsize,
             sharex=True,
-            gridspec_kw={"hspace": 0.05},
         )
-        if n_panels == 1:
-            axes = [axes]
         # Plot each GWAS panel
         for i, (gwas_df, lead_pos) in enumerate(zip(gwas_dfs, lead_positions)):
@@ -617,9 +950,9 @@ class LocusZoomPlotter:
             df = gwas_df.copy()
             df["neglog10p"] = -np.log10(df[p_col].clip(lower=1e-300))
-            # Calculate LD if reference provided
-            ld_col = None
-            if ld_reference_files and ld_reference_files[i] and lead_pos:
+            # Use pre-computed LD or calculate from reference
+            panel_ld_col = ld_col
+            if ld_reference_files and ld_reference_files[i] and lead_pos and not ld_col:
                 lead_snp_row = df[df[pos_col] == lead_pos]
                 if not lead_snp_row.empty and rs_col in df.columns:
                     lead_snp_id = lead_snp_row[rs_col].iloc[0]
@@ -632,51 +965,135 @@ class LocusZoomPlotter:
                     )
                     if not ld_df.empty:
                         df = df.merge(ld_df, left_on=rs_col, right_on="SNP", how="left")
-                        ld_col = "R2"
+                        panel_ld_col = "R2"
             # Plot association
-            self._plot_association(ax, df, pos_col, ld_col, lead_pos)
+            self._plot_association(ax, df, pos_col, panel_ld_col, lead_pos, rs_col, p_col)
             # Add significance line
-            ax.axhline(y=self._genomewide_line, color="grey", linestyle="--", linewidth=1, zorder=1)
+            self._backend.axhline(
+                ax,
+                y=self._genomewide_line,
+                color="red",
+                linestyle="--",
+                linewidth=1,
+                alpha=0.65,
+                zorder=1,
+            )
-            # Add SNP labels
+            # Add SNP labels (matplotlib only - interactive backends use hover tooltips)
             if snp_labels and rs_col in df.columns and label_top_n > 0 and not df.empty:
-                add_snp_labels(
-                    ax, df, pos_col=pos_col, neglog10p_col="neglog10p",
-                    rs_col=rs_col, label_top_n=label_top_n, genes_df=genes_df, chrom=chrom,
-                )
+                if self.backend_name == "matplotlib":
+                    add_snp_labels(
+                        ax,
+                        df,
+                        pos_col=pos_col,
+                        neglog10p_col="neglog10p",
+                        rs_col=rs_col,
+                        label_top_n=label_top_n,
+                        genes_df=genes_df,
+                        chrom=chrom,
+                    )
-            # Add recombination overlay (only on first panel)
+            # Add recombination overlay (only on first panel, all backends)
             if i == 0 and recomb_df is not None and not recomb_df.empty:
-                add_recombination_overlay(ax, recomb_df, start, end)
+                if self.backend_name == "matplotlib":
+                    add_recombination_overlay(ax, recomb_df, start, end)
+                else:
+                    self._add_recombination_overlay_generic(ax, recomb_df, start, end)
             # Format axes
-            ax.set_ylabel(r"$-\log_{10}$ P")
-            ax.set_xlim(start, end)
-            ax.spines["top"].set_visible(False)
-            ax.spines["right"].set_visible(False)
+            self._backend.set_ylabel(ax, r"$-\log_{10}$ P")
+            self._backend.set_xlim(ax, start, end)
+            self._backend.hide_spines(ax, ["top", "right"])
             # Add panel label
             if panel_labels and i < len(panel_labels):
-                ax.annotate(
-                    panel_labels[i],
-                    xy=(0.02, 0.95),
-                    xycoords="axes fraction",
-                    fontsize=11,
-                    fontweight="bold",
-                    va="top",
-                    ha="left",
+                if self.backend_name == "matplotlib":
+                    ax.annotate(
+                        panel_labels[i],
+                        xy=(0.02, 0.95),
+                        xycoords="axes fraction",
+                        fontsize=11,
+                        fontweight="bold",
+                        va="top",
+                        ha="left",
+                    )
+                elif self.backend_name == "plotly":
+                    fig, row = ax
+                    fig.add_annotation(
+                        text=f"<b>{panel_labels[i]}</b>",
+                        xref=f"x{row} domain" if row > 1 else "x domain",
+                        yref=f"y{row} domain" if row > 1 else "y domain",
+                        x=0.02,
+                        y=0.95,
+                        showarrow=False,
+                        font=dict(size=11),
+                        xanchor="left",
+                        yanchor="top",
+                    )
+                elif self.backend_name == "bokeh":
+                    from bokeh.models import Label
+                    # Get y-axis range for positioning
+                    y_max = ax.y_range.end if ax.y_range.end else 10
+                    x_min = ax.x_range.start if ax.x_range.start else start
+                    label = Label(
+                        x=x_min + (end - start) * 0.02,
+                        y=y_max * 0.95,
+                        text=panel_labels[i],
+                        text_font_size="11pt",
+                        text_font_style="bold",
+                    )
+                    ax.add_layout(label)
+            # Add LD legend (only on first panel, all backends)
+            if i == 0 and panel_ld_col is not None and panel_ld_col in df.columns:
+                if self.backend_name == "matplotlib":
+                    self._add_ld_legend(ax)
+                else:
+                    self._backend.add_ld_legend(ax, LD_BINS, LEAD_SNP_COLOR)
+        # Track current panel index
+        panel_idx = n_gwas
+        # Plot fine-mapping panel if provided
+        if finemapping_df is not None:
+            ax = axes[panel_idx]
+            fm_data = prepare_finemapping_for_plotting(
+                finemapping_df,
+                pos_col="pos",
+                pip_col="pip",
+                chrom=chrom,
+                start=start,
+                end=end,
+            )
+            if not fm_data.empty:
+                self._plot_finemapping(
+                    ax,
+                    fm_data,
+                    pos_col="pos",
+                    pip_col="pip",
+                    cs_col=finemapping_cs_col,
+                    show_credible_sets=True,
+                    pip_threshold=0.01,
                 )
-            # Add LD legend (only on first panel)
-            if i == 0 and ld_col is not None and ld_col in df.columns:
-                self._add_ld_legend(ax)
+                # Add legend for credible sets
+                credible_sets = get_credible_sets(fm_data, finemapping_cs_col)
+                if credible_sets:
+                    self._add_finemapping_legend(ax, credible_sets)
+            self._backend.set_ylabel(ax, "PIP")
+            self._backend.set_ylim(ax, -0.05, 1.05)
+            self._backend.hide_spines(ax, ["top", "right"])
+            panel_idx += 1
         # Plot eQTL panel if provided
-        panel_idx = n_gwas
+        eqtl_panel_idx = panel_idx
         if eqtl_df is not None:
-            ax = axes[panel_idx]
+            ax = axes[eqtl_panel_idx]
             eqtl_data = eqtl_df.copy()
             # Filter by gene if specified
@@ -685,49 +1102,85 @@ class LocusZoomPlotter:
             # Filter by region
             if "pos" in eqtl_data.columns:
-                eqtl_data = eqtl_data[(eqtl_data["pos"] >= start) & (eqtl_data["pos"] <= end)]
+                eqtl_data = eqtl_data[
+                    (eqtl_data["pos"] >= start) & (eqtl_data["pos"] <= end)
+                ]
             if not eqtl_data.empty:
-                eqtl_data["neglog10p"] = -np.log10(eqtl_data["p_value"].clip(lower=1e-300))
-                # Plot as diamonds (different from GWAS circles)
-                ax.scatter(
-                    eqtl_data["pos"],
-                    eqtl_data["neglog10p"],
-                    c="#FF6B6B",
-                    s=60,
-                    marker="D",
-                    edgecolor="black",
-                    linewidth=0.5,
-                    zorder=2,
-                    label=f"eQTL ({eqtl_gene})" if eqtl_gene else "eQTL",
+                eqtl_data["neglog10p"] = -np.log10(
+                    eqtl_data["p_value"].clip(lower=1e-300)
                 )
-                ax.legend(loc="upper left", fontsize=9)
-            ax.set_ylabel(r"$-\log_{10}$ P (eQTL)")
-            ax.axhline(y=self._genomewide_line, color="grey", linestyle="--", linewidth=1)
-            ax.spines["top"].set_visible(False)
-            ax.spines["right"].set_visible(False)
+                # Check if effect_size column exists for directional coloring
+                has_effect = "effect_size" in eqtl_data.columns
+                if has_effect:
+                    # Plot triangles by effect direction with color by magnitude
+                    for _, row in eqtl_data.iterrows():
+                        effect = row["effect_size"]
+                        color = get_eqtl_color(effect)
+                        marker = "^" if effect >= 0 else "v"
+                        self._backend.scatter(
+                            ax,
+                            pd.Series([row["pos"]]),
+                            pd.Series([row["neglog10p"]]),
+                            colors=color,
+                            sizes=50,
+                            marker=marker,
+                            edgecolor="black",
+                            linewidth=0.5,
+                            zorder=2,
+                        )
+                    # Add eQTL effect legend
+                    self._add_eqtl_legend(ax)
+                else:
+                    # No effect sizes - plot as diamonds
+                    self._backend.scatter(
+                        ax,
+                        eqtl_data["pos"],
+                        eqtl_data["neglog10p"],
+                        colors="#FF6B6B",
+                        sizes=60,
+                        marker="D",
+                        edgecolor="black",
+                        linewidth=0.5,
+                        zorder=2,
+                        label=f"eQTL ({eqtl_gene})" if eqtl_gene else "eQTL",
+                    )
+                    ax.legend(loc="upper right", fontsize=9)
+            self._backend.set_ylabel(ax, r"$-\log_{10}$ P (eQTL)")
+            self._backend.axhline(
+                ax,
+                y=self._genomewide_line,
+                color="red",
+                linestyle="--",
+                linewidth=1,
+                alpha=0.65,
+            )
+            self._backend.hide_spines(ax, ["top", "right"])
             panel_idx += 1
-        # Plot gene track
+        # Plot gene track (all backends)
         if genes_df is not None:
             gene_ax = axes[panel_idx]
-            plot_gene_track(gene_ax, genes_df, chrom, start, end, exons_df)
-            gene_ax.set_xlabel(f"Chromosome {chrom} (Mb)")
-            gene_ax.spines["top"].set_visible(False)
-            gene_ax.spines["right"].set_visible(False)
-            gene_ax.spines["left"].set_visible(False)
+            if self.backend_name == "matplotlib":
+                plot_gene_track(gene_ax, genes_df, chrom, start, end, exons_df)
+            else:
+                plot_gene_track_generic(
+                    gene_ax, self._backend, genes_df, chrom, start, end, exons_df
+                )
+            self._backend.set_xlabel(gene_ax, f"Chromosome {chrom} (Mb)")
+            self._backend.hide_spines(gene_ax, ["top", "right", "left"])
         else:
             # Set x-label on bottom panel
-            axes[-1].set_xlabel(f"Chromosome {chrom} (Mb)")
+            self._backend.set_xlabel(axes[-1], f"Chromosome {chrom} (Mb)")
-        # Format x-axis
-        axes[0].xaxis.set_major_formatter(FuncFormatter(lambda x, _: f"{x / 1e6:.2f}"))
-        axes[0].xaxis.set_major_locator(MaxNLocator(nbins=6))
+        # Format x-axis (call for all axes - Plotly needs each subplot formatted)
+        for ax in axes:
+            self._backend.format_xaxis_mb(ax)
         # Adjust layout
-        fig.subplots_adjust(left=0.08, right=0.95, top=0.95, bottom=0.08, hspace=0.05)
-        plt.ion()
+        self._backend.finalize_layout(fig, hspace=0.1)
         return fig

pylocuszoom 0.1.0__py3-none-any.whl → 0.3.0__py3-none-any.whl

pylocuszoom 0.1.0__py3-none-any.whl → 0.3.0__py3-none-any.whl