PyPI - pylocuszoom - Versions diffs - 0.1.0__py3-none-any.whl → 0.3.0__py3-none-any.whl - Mend

pylocuszoom 0.1.0__py3-none-any.whl → 0.3.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (20) hide show

pylocuszoom/__init__.py +39 -20
pylocuszoom/backends/__init__.py +1 -5
pylocuszoom/backends/base.py +3 -1
pylocuszoom/backends/bokeh_backend.py +220 -51
pylocuszoom/backends/matplotlib_backend.py +35 -8
pylocuszoom/backends/plotly_backend.py +273 -32
pylocuszoom/colors.py +132 -0
pylocuszoom/eqtl.py +3 -2
pylocuszoom/finemapping.py +223 -0
pylocuszoom/gene_track.py +259 -38
pylocuszoom/labels.py +32 -33
pylocuszoom/ld.py +8 -7
pylocuszoom/plotter.py +615 -162
pylocuszoom/recombination.py +14 -14
pylocuszoom/utils.py +3 -1
{pylocuszoom-0.1.0.dist-info → pylocuszoom-0.3.0.dist-info}/METADATA +36 -27
pylocuszoom-0.3.0.dist-info/RECORD +21 -0
pylocuszoom-0.1.0.dist-info/RECORD +0 -20
{pylocuszoom-0.1.0.dist-info → pylocuszoom-0.3.0.dist-info}/WHEEL +0 -0
{pylocuszoom-0.1.0.dist-info → pylocuszoom-0.3.0.dist-info}/licenses/LICENSE.md +0 -0

pylocuszoom/labels.py CHANGED Viewed

@@ -2,18 +2,15 @@
 Provides automatic labeling of top significant SNPs with:
 - SNP ID (rs number)
-- Nearest gene name (if gene annotations provided)
 - Automatic overlap avoidance (if adjustText installed)
 """
-from typing import List, Optional, Union
+from typing import Any, List, Optional, Union
 import pandas as pd
 from matplotlib.axes import Axes
 from matplotlib.text import Annotation
-from .gene_track import get_nearest_gene
 def add_snp_labels(
     ax: Axes,
@@ -25,11 +22,11 @@ def add_snp_labels(
     genes_df: Optional[pd.DataFrame] = None,
     chrom: Optional[Union[int, str]] = None,
     max_label_length: int = 15,
+    **kwargs: Any,
 ) -> List[Annotation]:
     """Add text labels to top SNPs in the regional plot.
-    Labels the most significant SNPs with either their SNP ID
-    or the nearest gene name (if genes_df provided).
+    Labels the most significant SNPs with their SNP ID (rs number).
     Args:
         ax: Matplotlib axes object.
@@ -39,10 +36,8 @@ def add_snp_labels(
         neglog10p_col: Column name for -log10(p-value).
         rs_col: Column name for SNP ID.
         label_top_n: Number of top SNPs to label.
-        genes_df: Optional gene annotations for gene-based labels.
-            If provided with chrom, labels will show nearest gene name
-            instead of SNP ID.
-        chrom: Chromosome number. Required if genes_df is provided.
+        genes_df: Unused, kept for backward compatibility.
+        chrom: Unused, kept for backward compatibility.
         max_label_length: Maximum label length before truncation.
     Returns:
@@ -53,6 +48,8 @@ def add_snp_labels(
         >>> # ... plot your data ...
         >>> texts = add_snp_labels(ax, df, label_top_n=5)
     """
+    # genes_df and chrom are unused but kept for backward compatibility
+    del genes_df, chrom, kwargs
     if neglog10p_col not in df.columns:
         raise ValueError(
             f"Column '{neglog10p_col}' not found in DataFrame. "
@@ -63,33 +60,34 @@ def add_snp_labels(
     top_snps = df.nlargest(label_top_n, neglog10p_col)
     texts = []
+    used_labels = set()  # Track used labels to avoid duplicates
     for _, snp in top_snps.iterrows():
         x = snp[pos_col]
         y = snp[neglog10p_col]
-        # Determine label text
+        # Use SNP ID as label
         label = str(snp[rs_col])
-        # Try to get gene name if genes_df provided
-        if genes_df is not None and chrom is not None:
-            nearest_gene = get_nearest_gene(genes_df, chrom, int(x))
-            if nearest_gene:
-                label = nearest_gene
+        # Skip duplicate labels
+        if label in used_labels:
+            continue
+        used_labels.add(label)
         # Truncate long labels
         if len(label) > max_label_length:
             label = label[: max_label_length - 3] + "..."
-        # Add text annotation with offset
+        # Add text annotation centered above marker
         text = ax.annotate(
             label,
             xy=(x, y),
-            xytext=(5, 5),
+            xytext=(0, 7),
             textcoords="offset points",
-            fontsize=8,
+            fontsize=6,
             fontweight="bold",
             color="#333333",
-            ha="left",
+            ha="center",
             va="bottom",
             zorder=15,
             bbox=dict(
@@ -101,18 +99,19 @@ def add_snp_labels(
         )
         texts.append(text)
-    # Try to adjust text positions to avoid overlap
-    try:
-        from adjustText import adjust_text
-        adjust_text(
-            texts,
-            ax=ax,
-            arrowprops=dict(arrowstyle="-", color="gray", lw=0.5),
-            expand_points=(1.5, 1.5),
-        )
-    except ImportError:
-        # adjustText not installed, labels may overlap
-        pass
+    # Only use adjustText when there are multiple labels to avoid overlap
+    if len(texts) > 1:
+        try:
+            from adjustText import adjust_text
+            adjust_text(
+                texts,
+                ax=ax,
+                arrowprops=dict(arrowstyle="-", color="gray", lw=0.5),
+                expand_points=(1.5, 1.5),
+            )
+        except ImportError:
+            # adjustText not installed, labels may overlap
+            pass
     return texts

pylocuszoom/ld.py CHANGED Viewed

@@ -38,7 +38,7 @@ def build_ld_command(
     output_path: str,
     window_kb: int = 500,
     ld_window_r2: float = 0.0,
-    species: str = "dog",
+    species: str = "canine",
     threads: Optional[int] = None,
 ) -> list:
     """Build PLINK command for LD calculation.
@@ -50,7 +50,7 @@ def build_ld_command(
         output_path: Output prefix (creates .ld file).
         window_kb: Window size in kilobases.
         ld_window_r2: Minimum R² to report (0.0 reports all).
-        species: Species flag for PLINK ('dog', 'cat', or None for human).
+        species: Species flag for PLINK ('canine', 'feline', or None for human).
         threads: Number of threads (auto-detect if None).
     Returns:
@@ -58,10 +58,10 @@ def build_ld_command(
     """
     cmd = [plink_path]
-    # Species flag
-    if species == "dog":
+    # Species flag (maps to PLINK's --dog flag)
+    if species == "canine":
         cmd.append("--dog")
-    elif species == "cat":
+    elif species == "feline":
         # PLINK doesn't have --cat, use --chr-set for 18 autosomes + X
         cmd.extend(["--chr-set", "18"])
@@ -119,7 +119,7 @@ def calculate_ld(
     window_kb: int = 500,
     plink_path: Optional[str] = None,
     working_dir: Optional[str] = None,
-    species: str = "dog",
+    species: str = "canine",
     threads: Optional[int] = None,
 ) -> pd.DataFrame:
     """Calculate LD (R²) between a lead SNP and all SNPs in a region.
@@ -133,7 +133,7 @@ def calculate_ld(
         window_kb: Window size in kilobases around lead SNP.
         plink_path: Path to PLINK executable. Auto-detects if None.
         working_dir: Directory for PLINK output files. Uses temp dir if None.
-        species: Species flag ('dog', 'cat', or None for human).
+        species: Species flag ('canine', 'feline', or None for human).
         threads: Number of threads for PLINK.
     Returns:
@@ -142,6 +142,7 @@ def calculate_ld(
     Raises:
         FileNotFoundError: If PLINK executable not found.
+        ValidationError: If PLINK binary files (.bed/.bim/.fam) are missing.
     Example:
         >>> ld_df = calculate_ld(

pylocuszoom 0.1.0__py3-none-any.whl → 0.3.0__py3-none-any.whl

pylocuszoom 0.1.0__py3-none-any.whl → 0.3.0__py3-none-any.whl