PyPI - biopipen - Versions diffs - 0.31.3__py3-none-any.whl → 0.31.5__py3-none-any.whl - Mend

biopipen 0.31.3__py3-none-any.whl → 0.31.5__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of biopipen might be problematic. Click here for more details.

Files changed (17) hide show

biopipen/__init__.py +1 -1
biopipen/ns/bam.py +41 -0
biopipen/ns/plot.py +1 -1
biopipen/ns/protein.py +84 -0
biopipen/ns/vcf.py +1 -1
biopipen/reports/protein/ProdigySummary.svelte +16 -0
biopipen/scripts/bam/BamMerge.py +10 -14
biopipen/scripts/bam/BamSampling.py +90 -0
biopipen/scripts/plot/VennDiagram.R +1 -5
biopipen/scripts/protein/Prodigy.py +119 -0
biopipen/scripts/protein/ProdigySummary.R +133 -0
biopipen/scripts/scrna/SeuratMap2Ref.R +3 -3
biopipen/utils/plot.R +1 -1
{biopipen-0.31.3.dist-info → biopipen-0.31.5.dist-info}/METADATA +2 -2
{biopipen-0.31.3.dist-info → biopipen-0.31.5.dist-info}/RECORD +17 -12
{biopipen-0.31.3.dist-info → biopipen-0.31.5.dist-info}/entry_points.txt +1 -0
{biopipen-0.31.3.dist-info → biopipen-0.31.5.dist-info}/WHEEL +0 -0

biopipen/__init__.py CHANGED Viewed

	@@ -1 +1 @@
1	- __version__ = "0.31.3"
1	+ __version__ = "0.31.5"

biopipen/ns/bam.py CHANGED Viewed

@@ -260,3 +260,44 @@ class BamMerge(Proc):
         "sort_args": [],
     }
     script = "file://../scripts/bam/BamMerge.py"
+class BamSampling(Proc):
+    """Keeping only a fraction of read pairs from a bam file
+    Input:
+        bamfile: The bam file
+    Output:
+        outfile: The output bam file
+    Envs:
+        ncores: Number of cores to use
+        samtools: Path to samtools executable
+        tool: The tool to use, currently only "samtools" is supported
+        fraction (type=float): The fraction of reads to keep.
+            If `0 < fraction <= 1`, it's the fraction of reads to keep.
+            If `fraction > 1`, it's the number of reads to keep.
+            Note that when fraction > 1, you may not get the exact number
+            of reads specified but a close number.
+        seed: The seed for random number generator
+        index: Whether to index the output bam file
+        sort: Whether to sort the output bam file
+        sort_args: The arguments for sorting bam file using `samtools sort`.
+            These keys are not allowed: `-o`, `-@`,
+            and `--threads`, as they are managed by the script.
+    """
+    input = "bamfile:file"
+    output = "outfile:file:{{in.bamfile | stem}}.sampled{{envs.fraction}}.bam"
+    lang = config.lang.python
+    envs = {
+        "ncores": config.misc.ncores,
+        "samtools": config.exe.samtools,
+        "tool": "samtools",
+        "fraction": None,
+        "seed": 8525,
+        "index": True,
+        "sort": True,
+        "sort_args": [],
+    }
+    script = "file://../scripts/bam/BamSampling.py"

biopipen/ns/plot.py CHANGED Viewed

@@ -35,7 +35,7 @@ class VennDiagram(Proc):
     envs = {
         "inopts": {"row.names": -1, "header": False},
         "intype": "raw",
-        "devpars": {"res": 100, "width": 1000, "height": 1000},
+        "devpars": {"res": 100, "width": 800, "height": 600},
         "args": {},
         "ggs": None,
     }

biopipen/ns/protein.py ADDED Viewed

@@ -0,0 +1,84 @@
+"""Protein-related processes."""
+from ..core.proc import Proc
+from ..core.config import config
+class Prodigy(Proc):
+    """Prediction of binding affinity of protein-protein complexes based on
+    intermolecular contacts using Prodigy.
+    See <https://rascar.science.uu.nl/prodigy/> and
+    <https://github.com/haddocking/prodigy>.
+    `prodigy-prot` must be installed under the given python of `proc.lang`.
+    Input:
+        infile: The structure file in PDB or mmCIF format.
+    Output:
+        outfile: The output file generated by Prodigy.
+        outdir: The output directory containing all output files.
+    Envs:
+        distance_cutoff (type=float): The distance cutoff to calculate intermolecular
+            contacts.
+        acc_threshold (type=float): The accessibility threshold for BSA analysis.
+        temperature (type=float): The temperature (C) for Kd prediction.
+        contact_list (flag): Whether to generate contact list.
+        pymol_selection (flag): Whether to output a script to highlight the interface
+            residues in PyMOL.
+        selection (list): The selection of the chains to analyze.
+            `['A', 'B']` will analyze chains A and B.
+            `['A,B', 'C']` will analyze chain A and C; and B and C.
+            `['A', 'B', 'C']` will analyze all combinations of A, B, and C.
+        outtype (choice): Set the format of the output file (`out.outfile`).
+            All three files will be generated. This option only determines which
+            is assigned to `out.outfile`.
+            - raw: The raw output file from prodigy.
+            - json: The output file in JSON format.
+            - tsv: The output file in TSV (tab-separated) format.
+    """
+    input = "infile:file"
+    output = [
+        "outfile:file:{{in.infile | stem}}_prodigy/"
+        "{{in.infile | stem}}.{{envs.outtype if envs.outtype != 'raw' else 'out'}}",
+        "outdir:dir:{{in.infile | stem}}_prodigy",
+    ]
+    lang = config.lang.python
+    envs = {
+        "distance_cutoff": 5.5,
+        "acc_threshold": 0.05,
+        "temperature": 25.0,
+        "contact_list": True,
+        "pymol_selection": True,
+        "selection": None,
+        "outtype": "json",
+    }
+    script = "file://../scripts/protein/Prodigy.py"
+class ProdigySummary(Proc):
+    """Summary of the output from `Prodigy`.
+    Input:
+        infiles: The `_prodigy.tsv` files generated by `Prodigy`.
+    Output:
+        outdir: The directory of summary files generated by `ProdigySummary`.
+    Envs:
+        group (type=auto): The group of the samples for boxplots.
+            If `None`, don't do boxplots.
+            It can be a dict of group names and sample names, e.g.
+            `{"group1": ["sample1", "sample2"], "group2": ["sample3"]}`
+            or a file containing the group information, with the first column
+            being the sample names and the second column being the group names.
+            The file should be tab-delimited with no header.
+    """
+    input = "infiles:files"
+    input_data = lambda ch: [[f"{odir}/_prodigy.tsv" for odir in ch.outdir]]
+    output = "outdir:dir:prodigy_summary"
+    lang = config.lang.rscript
+    envs = {"group": None}
+    script = "file://../scripts/protein/ProdigySummary.R"
+    plugin_opts = {"report": "file://../reports/protein/ProdigySummary.svelte"}

biopipen/ns/vcf.py CHANGED Viewed

@@ -463,7 +463,7 @@ class BcftoolsAnnotate(Proc):
         columns (auto): Comma-separated or list of columns or tags to carry over from
             the annotation file. Overrides `-c, --columns`
         remove (auto): Remove the specified columns from the input file
-        header (type=list): Headers to be added
+        header (list): Headers to be added
         gz (flag): Whether to gzip the output file
         index (flag): Whether to index the output file (tbi) (`envs.gz` forced to True)
         <more>: Other arguments for `bcftools annotate`

biopipen/reports/protein/ProdigySummary.svelte ADDED Viewed

@@ -0,0 +1,16 @@
+{% from "utils/misc.liq" import report_jobs -%}
+<script>
+    import { Image, DataTable, Descr } from "$libs";
+</script>
+{%- macro report_job(job, h=1) -%}
+    {{ job | render_job: h=h }}
+{%- endmacro -%}
+{%- macro head_job(job) -%}
+    <h1>{{job.out.outdir | stem | escape}}</h1>
+{%- endmacro -%}
+{{ report_jobs(jobs, head_job, report_job) }}

biopipen/scripts/bam/BamMerge.py CHANGED Viewed

@@ -1,7 +1,7 @@
 from pathlib import Path
-from biopipen.utils.misc import run_command
+from biopipen.utils.misc import run_command, logger
-bamfiles = {{in.bamfiles | repr}}  # pyright: ignore
+bamfiles = {{in.bamfiles | repr}}  # pyright: ignore # noqa
 outfile = Path({{out.outfile | repr}})  # pyright: ignore
 ncores = {{envs.ncores | int}}  # pyright: ignore
 tool = {{envs.tool | quote}}  # pyright: ignore
@@ -18,7 +18,7 @@ if should_index and not should_sort:
 def use_samtools():
     """Use samtools to merge bam files"""
-    print("Using samtools")
+    logger.info("Using samtools ...")
     ofile = (
         outfile
         if not should_sort
@@ -43,11 +43,11 @@ def use_samtools():
         *merge_args,
         *bamfiles,
     ]
-    print("- Merging")
+    logger.info("- Merging the bam files ...")
     run_command(cmd)
     if should_sort:
-        print("- Sorting")
+        logger.info("- Sorting the merged bam file ...")
         for key in ["-o", "-@", "--threads"]:
             if key in sort_args:
                 raise ValueError(
@@ -67,16 +67,14 @@ def use_samtools():
         run_command(cmd)
     if should_index:
-        print("- Indexing")
+        logger.info("- Indexing the output bam file ...")
         cmd = [samtools, "index", "-@", ncores, outfile]
         run_command(cmd)
-    print("Done")
 def use_sambamba():
     """Use sambamba to merge bam files"""
-    print("Using sambamba")
+    logger.info("Using sambamba ...")
     ofile = (
         outfile
         if not should_sort
@@ -90,11 +88,11 @@ def use_sambamba():
             )
     cmd = [sambamba, "merge", "-t", ncores, *merge_args, ofile, *bamfiles]
-    print("- Merging")
+    logger.info("- Merging the bam files ...")
     run_command(cmd)
     if should_sort:
-        print("- Sorting")
+        logger.info("- Sorting the merged bam file ...")
         for key in ["-t", "--nthreads", "-o", "--out"]:
             if key in sort_args:
                 raise ValueError(
@@ -115,12 +113,10 @@ def use_sambamba():
         run_command(cmd)
     if should_index:
-        print("- Indexing")
+        logger.info("- Indexing the output bam file ...")
         cmd = [sambamba, "index", "-t", ncores, outfile]
         run_command(cmd)
-    print("Done")
 if __name__ == "__main__":
     if tool == "samtools":

biopipen/scripts/bam/BamSampling.py ADDED Viewed

@@ -0,0 +1,90 @@
+from pathlib import Path
+from biopipen.utils.misc import run_command, logger
+# using:
+# samtools view --subsample 0.1 --subsample-seed 1234 --threads 4 -b -o out.bam in.bam
+bamfile = {{ in.bamfile | repr }} # pyright: ignore # noqa
+outfile = Path({{ out.outfile | repr }}) # pyright: ignore
+ncores = {{ envs.ncores | int }} # pyright: ignore
+samtools = {{ envs.samtools | repr }} # pyright: ignore
+tool = {{ envs.tool | repr }} # pyright: ignore
+fraction = {{ envs.fraction | repr }} # pyright: ignore
+seed = {{ envs.seed | int }} # pyright: ignore
+should_index = {{ envs.index | repr }} # pyright: ignore
+should_sort = {{ envs.sort | repr }} # pyright: ignore
+sort_args = {{ envs.sort_args | repr }} # pyright: ignore
+if should_index and not should_sort:
+    raise ValueError("Indexing requires sorting")
+if fraction is None:
+    raise ValueError("'envs.fraction' must be provided.")
+if tool != "samtools":
+    raise ValueError(
+        f"Tool {tool} is not supported. "
+        "Currently only samtools is supported."
+    )
+if fraction > 1:
+    # calculate the fraction based on the number of reads
+    logger.info("Converting fraction > 1 to a fraction of reads.")
+    cmd = [
+        samtools,
+        "view",
+        "--threads",
+        ncores,
+        "-c",
+        bamfile
+    ]
+    nreads = run_command(cmd, stdout="return").strip()
+    fraction = fraction / float(int(nreads))
+ofile = (
+    outfile
+    if not should_sort
+    else outfile.with_stem(f"{outfile.stem}.unsorted")
+)
+cmd = [
+    samtools,
+    "view",
+    "--subsample",
+    fraction,
+    "--subsample-seed",
+    seed,
+    "--threads",
+    ncores,
+    "-b",
+    "-o",
+    ofile,
+    bamfile
+]
+run_command(cmd, fg=True)
+if should_sort:
+    logger.info("Sorting the output bam file.")
+    for key in ["-o", "-@", "--threads"]:
+        if key in sort_args:
+            raise ValueError(
+                f"envs.sort_args cannot contain {key}, "
+                "which is managed by the script"
+            )
+    cmd = [
+        samtools,
+        "sort",
+        "-@",
+        ncores,
+        *sort_args,
+        "-o",
+        outfile,
+        ofile
+    ]
+    run_command(cmd, fg=True)
+if should_index:
+    logger.info("Indexing the output bam file.")
+    cmd = [samtools, "index", "-@", ncores, outfile]
+    run_command(cmd, fg=True)

biopipen/scripts/plot/VennDiagram.R CHANGED Viewed

@@ -1,8 +1,6 @@
 {{ biopipen_dir | joinpaths: "utils", "io.R" | source_r }}
 {{ biopipen_dir | joinpaths: "utils", "plot.R" | source_r }}
-library(dplyr)
 infile = {{in.infile | quote}}
 outfile = {{out.outfile | quote}}
 inopts = {{envs.inopts | r}}
@@ -18,9 +16,7 @@ if (intype == "raw") {
     indata = lapply(indata, function(x) unlist(strsplit(x, ",", fixed=TRUE)))
 } else { # computed
     elems = rownames(indata)
-    indata = indata %>%
-        mutate(across(everything(), function(x) elems[as.logical(x)])) %>%
-        as.list()
+    indata = apply(indata, 2, function(x) elems[as.logical(x)])
 }
 plotVenn(

biopipen/scripts/protein/Prodigy.py ADDED Viewed

@@ -0,0 +1,119 @@
+import json
+import logging
+import sys
+from pathlib import Path
+from prodigy_prot.predict_IC import (
+    Prodigy,
+    check_path,
+    parse_structure,
+)
+infile = {{in.infile | repr}}  # pyright: ignore # noqa
+outfile = {{out.outfile | repr}}  # pyright: ignore
+outdir = {{out.outdir | repr}}  # pyright: ignore
+distance_cutoff = {{envs.distance_cutoff | float}}  # pyright: ignore
+acc_threshold = {{envs.acc_threshold | float}}  # pyright: ignore
+temperature = {{envs.temperature | float}}  # pyright: ignore
+contact_list = {{envs.contact_list | repr}}  # pyright: ignore
+pymol_selection = {{envs.pymol_selection | repr}}  # pyright: ignore
+selection = {{envs.selection | repr}}  # pyright: ignore
+outtype = {{envs.outtype | repr}}  # pyright: ignore
+raw_outfile = Path(outdir) / "_prodigy_raw.txt"
+json_outfile = Path(outdir) / "_prodigy.json"
+tsv_outfile = Path(outdir) / "_prodigy.tsv"
+# log to stdout (the raw output file is written by `print_prediction` below)
+logging.basicConfig(level=logging.INFO, stream=sys.stdout, format="%(message)s")
+logger = logging.getLogger("Prodigy")
+if isinstance(selection, str):
+    selection = [selection]
+struct_path = check_path(infile)
+# parse structure
+structure, n_chains, n_res = parse_structure(struct_path)
+logger.info(
+    "[+] Parsed structure file {0} ({1} chains, {2} residues)".format(
+        structure.id, n_chains, n_res
+    )
+)
+prodigy = Prodigy(structure, selection, temperature)
+prodigy.predict(distance_cutoff=distance_cutoff, acc_threshold=acc_threshold)
+prodigy.print_prediction(outfile=raw_outfile, quiet=False)
+# Print out interaction network
+if contact_list:
+    prodigy.print_contacts(f"{outdir}/prodigy.ic")
+# Print out the PyMOL script to highlight the interface residues
+if pymol_selection:
+    prodigy.print_pymol_script(f"{outdir}/prodigy.pml")
+# [+] Reading structure file: <path/to/structure.cif>
+# [+] Parsed structure file <structure> (4 chains, 411 residues)
+# [+] No. of intermolecular contacts: 191
+# [+] No. of charged-charged contacts: 17
+# [+] No. of charged-polar contacts: 18
+# [+] No. of charged-apolar contacts: 60
+# [+] No. of polar-polar contacts: 5
+# [+] No. of apolar-polar contacts: 41
+# [+] No. of apolar-apolar contacts: 50
+# [+] Percentage of apolar NIS residues: 33.90
+# [+] Percentage of charged NIS residues: 30.48
+# [++] Predicted binding affinity (kcal.mol-1):    -21.3
+# [++] Predicted dissociation constant (M) at 25.0˚C:  2.3e-16
+output = {}
+with open(raw_outfile, "r") as f:
+    for line in f:
+        if line.startswith("[+"):
+            line = line.lstrip("[").lstrip("+").lstrip("]").lstrip()
+            if line.startswith("Reading structure file"):
+                continue
+            if line.startswith("Parsed structure file"):
+                continue
+            key, value = line.split(":", 1)
+            key = key.strip()
+            value = value.strip()
+            if key == "No. of intermolecular contacts":
+                output["nIC"] = int(value)
+            elif key == "No. of charged-charged contacts":
+                output["nCCC"] = int(value)
+            elif key == "No. of charged-polar contacts":
+                output["nCPC"] = int(value)
+            elif key == "No. of charged-apolar contacts":
+                output["nCAPC"] = int(value)
+            elif key == "No. of polar-polar contacts":
+                output["nPPC"] = int(value)
+            elif key == "No. of apolar-polar contacts":
+                output["nAPPC"] = int(value)
+            elif key == "No. of apolar-apolar contacts":
+                output["nAPAPC"] = int(value)
+            elif key.startswith("Percentage of apolar NIS residues"):
+                output["pANISR"] = float(value)
+            elif key.startswith("Percentage of charged NIS residues"):
+                output["pCNISR"] = float(value)
+            elif key.startswith("Predicted binding affinity"):
+                output["BindingAffinity"] = float(value)
+            elif key.startswith("Predicted dissociation constant"):
+                output["DissociationConstant"] = float(value)
+with open(json_outfile, "w") as f:
+    json.dump(output, f, indent=2)
+with open(tsv_outfile, "w") as f:
+    f.write("\t".join(output.keys()) + "\n")
+    f.write("\t".join(map(str, output.values())) + "\n")
+if outtype == "json":
+    json_outfile.rename(outfile)
+    json_outfile.symlink_to(outfile)
+elif outtype == "tsv":
+    tsv_outfile.rename(outfile)
+    tsv_outfile.symlink_to(outfile)
+else:
+    raw_outfile.rename(outfile)
+    raw_outfile.symlink_to(outfile)

biopipen/scripts/protein/ProdigySummary.R ADDED Viewed

@@ -0,0 +1,133 @@
+{{ biopipen_dir | joinpaths: "utils", "misc.R" | source_r }}
+library(rlang)
+library(dplyr)
+library(ggplot2)
+library(ggprism)
+theme_set(theme_prism())
+infiles <- {{in.infiles | r}}
+outdir <- {{out.outdir | r}}
+joboutdir <- {{job.outdir | r}}
+group <- {{envs.group | r}}
+if (is.character(group)) {
+    group <- read.csv(group, header = FALSE, row.names = NULL)
+    colnames(group) <- c("Sample", "Group")
+} else if (is.list(group)) {
+    group <- do_call(
+        rbind,
+        lapply(names(group), function(n) data.frame(Sample = group[[n]], Group = n))
+    )
+} else if (!is.null(group)) {
+    stop(paste0("Invalid group: ", paste0(group, collapse = ", ")))
+}
+log_info("Reading and merging metrics for each sample ...")
+metrics <- NULL
+for (infile in infiles) {
+    sample <- sub("_prodigy$", "", basename(dirname(infile)))
+    log_debug("- Reading metrics from {sample}")
+    metric <- read.table(
+        infile,
+        header = TRUE,
+        sep = "\t",
+        stringsAsFactors = FALSE,
+        check.names = FALSE,
+        row.names = NULL)
+    metric$Sample <- sample
+    metric <- metric %>% select(Sample, everything())
+    if (is.null(metrics)) {
+        metrics <- metric
+    } else {
+        metrics <- rbind(metrics, metric)
+    }
+}
+# Save metrics
+write.table(
+    metrics,
+    file.path(outdir, "metrics.txt"),
+    sep = "\t",
+    quote = FALSE,
+    row.names = FALSE
+)
+add_report(
+    list(kind = "descr", content = "Metrics for all samples"),
+    list(kind = "table", src = file.path(outdir, "metrics.txt")),
+    h1 = "Metrics of all samples"
+)
+METRIC_DESCR = list(
+    nIC = "No. of intermolecular contacts",
+    nCCC = "No. of charged-charged contacts",
+    nCPC = "No. of charged-polar contacts",
+    nCAPC = "No. of charged-apolar contacts",
+    nPPC = "No. of polar-polar contacts",
+    nAPPC = "No. of apolar-polar contacts",
+    nAPAPC = "No. of apolar-apolar contacts",
+    pANISR = "Percentage of apolar NIS residues",
+    pCNISR = "Percentage of charged NIS residues",
+    BindingAffinity = "Predicted binding affinity (kcal.mol^-1)",
+    DissociationConstant = "Predicted dissociation constant (M)"
+)
+if (!is.null(group)) {
+    log_info("Merging group information ...")
+    metrics <- group %>%
+        left_join(metrics, by = "Sample") %>%
+        mutate(Group = factor(Group, levels = unique(Group)))
+}
+log_info("Plotting Prodigy metrics ...")
+for (metric in names(METRIC_DESCR)) {
+    log_info("- {metric}: {METRIC_DESCR[[metric]]}")
+    add_report(
+        list(
+            kind = "descr",
+            content = METRIC_DESCR[[metric]] %||% paste0("Metric: ", metric)
+        ),
+        h1 = metric
+    )
+    # barplot
+    p <- ggplot(metrics, aes(x = Sample, y = !!sym(metric))) +
+        geom_bar(stat = "identity", fill = "steelblue") +
+        labs(x = "Sample", y = metric) +
+        theme(axis.text.x = element_text(angle = 90, hjust = 1))
+    figfile <- file.path(outdir, paste0(slugify(metric), ".barplot.png"))
+    png(figfile, height = 600, res = 100, width = nrow(metrics) * 30 + 200)
+    print(p)
+    dev.off()
+    add_report(
+        list(src = figfile, name = "By Sample"),
+        ui = "table_of_images",
+        h1 = metric
+    )
+    if (is.null(group)) { next }
+    # group: Sample, Group
+    p <- ggplot(metrics, aes(x = Group, y = !!sym(metric))) +
+        geom_boxplot(fill = "steelblue") +
+        labs(x = "Group", y = metric) +
+        theme(axis.text.x = element_text(angle = 90, hjust = 1))
+    figfile <- file.path(outdir, paste0(slugify(metric), ".boxplot.png"))
+    png(figfile, height = 600, res = 100, width = length(unique(metrics$Group)) * 30 + 200)
+    print(p)
+    dev.off()
+    add_report(
+        list(src = figfile, name = "By Group"),
+        ui = "table_of_images",
+        h1 = metric
+    )
+}
+save_report(joboutdir)

biopipen/scripts/scrna/SeuratMap2Ref.R CHANGED Viewed

@@ -90,8 +90,8 @@ for (rname in names(mapquery_args$refdata)) {
     }
 }
-if (refnorm == "auto" && .is_sct(reference)) {
-    refnorm = "SCTransform"
+if (refnorm == "auto") {
+    refnorm = ifelse (.is_sct(reference), "SCTransform", "NormalizeData")
 }
 if (refnorm == "SCTransform") {
     # Check if the reference is SCTransform'ed
@@ -110,7 +110,7 @@ if (refnorm == "SCTransform") {
 } else if (refnorm == "NormalizeData") {
     findtransferanchors_args$normalization.method = "LogNormalize"
 } else {
-    stop("Unknown normalization method: {refnorm}")
+    stop(paste0("Unknown normalization method: ", refnorm))
 }
 # Load Seurat object

biopipen/utils/plot.R CHANGED Viewed

@@ -10,7 +10,7 @@ plotVenn = function(
     # Extra ggplot components in string
     ggs = NULL,
     # Parameters for device (res, width, height) for `png()`
-    devpars = list(res=100, width=1000, height=1000),
+    devpars = list(res=100, width=800, height=600),
     # The output file. If NULL, will return the plot object
     outfile = NULL
 ) {

{biopipen-0.31.3.dist-info → biopipen-0.31.5.dist-info}/METADATA RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.1
 Name: biopipen
-Version: 0.31.3
+Version: 0.31.5
 Summary: Bioinformatics processes/pipelines that can be run from `pipen run`
 License: MIT
 Author: pwwang
@@ -18,5 +18,5 @@ Requires-Dist: pipen-board[report] (>=0.16,<0.17)
 Requires-Dist: pipen-cli-run (>=0.14,<0.15)
 Requires-Dist: pipen-filters (>=0.14,<0.15)
 Requires-Dist: pipen-poplog (>=0.2.0,<0.3.0)
-Requires-Dist: pipen-runinfo (>=0.7,<0.8) ; extra == "runinfo"
+Requires-Dist: pipen-runinfo (>=0.8,<0.9) ; extra == "runinfo"
 Requires-Dist: pipen-verbose (>=0.12,<0.13)

{biopipen-0.31.3.dist-info → biopipen-0.31.5.dist-info}/RECORD RENAMED Viewed

@@ -1,4 +1,4 @@
-biopipen/__init__.py,sha256=KeJnUdf2sotD3eMjgcCRocii5SSlhH5-B6DNBS_0gO8,23
+biopipen/__init__.py,sha256=VSx4_WLVLq_7UtX4GtNLbObe0lMQRa5JR9eh0ofSz4A,23
 biopipen/core/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
 biopipen/core/config.py,sha256=edK5xnDhM8j27srDzsxubi934NMrglLoKrdcC8qsEPk,1069
 biopipen/core/config.toml,sha256=7IXvviRicZ2D1h6x3BVgbLJ96nsh-ikvZ0sVlQepqFE,1944
@@ -7,7 +7,7 @@ biopipen/core/filters.py,sha256=5bZsbpdW7DCxqiteRdb2gelmXvfqWPmPsFxrpHdWsoE,1298
 biopipen/core/proc.py,sha256=60lUP3PcUAaKbDETo9N5PEIoeOYrLgcSmuytmrhcx8g,912
 biopipen/core/testing.py,sha256=lZ_R5ZbYPO2NPuLHdbzg6HbD_f4j8paVVbyeUqwg6FE,3411
 biopipen/ns/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
-biopipen/ns/bam.py,sha256=jLhIztPiKsGfMpDgbcEpsybFskKkquIx9OKyTOc_L7Q,9172
+biopipen/ns/bam.py,sha256=-xVagotsURyOtwKzv72L-2f9P7467OVzgvP96syfHZc,10628
 biopipen/ns/bed.py,sha256=HsTCJge7XNfCZyCBJ4iifNKQ5we4VZSpRx8XL8--y5A,6689
 biopipen/ns/cellranger.py,sha256=yPBoNzVSY74J7uyVucaob5lqZKKru5-hYSM4f4Nr2OY,5553
 biopipen/ns/cellranger_pipeline.py,sha256=EWkPJTujamNSMQoRnKfhUiIj6TkMfRmCSUbPfd8Tv8E,4011
@@ -18,7 +18,8 @@ biopipen/ns/delim.py,sha256=fejsh4KW1TG5oMZzAC238LvQhBz7brXkfl3BHfnLK5M,5612
 biopipen/ns/gene.py,sha256=rty-Bjcf87v2vyb9X4kRvfrQ6XQYXgN4f2ftFO0nWA8,3888
 biopipen/ns/gsea.py,sha256=EsNRAPYsagaV2KYgr4Jv0KCnZGqayM209v4yOGGTIOI,7423
 biopipen/ns/misc.py,sha256=qXcm0RdR6W-xpYGgQn3v7JBeYRWwVm5gtgSj2tdVxx4,2935
-biopipen/ns/plot.py,sha256=_dGLKpyHiJqLIIQu5tqCk8H5BkgGBh_qRUZHkjnOgtE,18080
+biopipen/ns/plot.py,sha256=XzLq0A8qCIQRbxhPEdWhEfbRZ8g3e4KriVz0RP8enNY,18078
+biopipen/ns/protein.py,sha256=33pzM-gvBTw0jH60mvfqnriM6uw2zj3katZ82nC9owI,3309
 biopipen/ns/regulatory.py,sha256=qvc9QrwgwCI_lg0DQ2QOZbAhC8BAD1qnQXSGtAGlVcY,11750
 biopipen/ns/rnaseq.py,sha256=bKAa6friFWof4yDTWZQahm1MS-lrdetO1GqDKdfxXYc,7708
 biopipen/ns/scrna.py,sha256=fXP_h7gchcuk_Jwos0IgY_P8ON6Q995OgKHgdrxfvAY,112868
@@ -27,7 +28,7 @@ biopipen/ns/snp.py,sha256=-Jx5Hsv_7KV7TqLU0nHCaPkMEN0CFdi4tNVlyq0rUZ4,27259
 biopipen/ns/stats.py,sha256=DlPyK5Vsg6ZEkV9SDS3aAw21eXzvOHgqeZDkXPhg7go,20509
 biopipen/ns/tcgamaf.py,sha256=AFbUJIxiMSvsVY3RcHgjRFuMnNh2DG3Mr5slLNEyz6o,1455
 biopipen/ns/tcr.py,sha256=0PCF8iPZ629z6P3RHoAWEpMWmuDslomTGcMopjqvXmE,88304
-biopipen/ns/vcf.py,sha256=0aKH_YSLy_-JzV-_VZb0EoScv7JKGrDU7BaeWHjDuRo,22699
+biopipen/ns/vcf.py,sha256=zidwskYZ3IIY1sAKYp6WXOiEOdrJjw438JQW1TC7l9s,22694
 biopipen/ns/web.py,sha256=4itJzaju8VBARIyZjDeh5rsVKpafFq_whixnvL8sXes,5368
 biopipen/reports/bam/CNAClinic.svelte,sha256=D4IxQcgDCPQZMbXog-aZP5iJEQTK2N4i0C60e_iXyfs,213
 biopipen/reports/bam/CNVpytor.svelte,sha256=s03SlhbEPd8-_44Dy_cqE8FSErhUdqStLK39te5o7ZE,1364
@@ -44,6 +45,7 @@ biopipen/reports/cnvkit/CNVkitScatter.svelte,sha256=8QLihBVH8RaHtjOUTU7xh4CCmFyx
 biopipen/reports/delim/SampleInfo.svelte,sha256=Vpjrdd3AXNDNhx2pzDaFA61xPMYAFKvvIoVCqUswiyo,365
 biopipen/reports/gsea/FGSEA.svelte,sha256=3gNbZovmRWK6QjtxfgZgmft6LUurVZfQyHBRqyGMosk,405
 biopipen/reports/gsea/GSEA.svelte,sha256=lYHf8h8RLx3i-jNCEGu_LM-dbYm9ZJDzyAEadsZXzmQ,417
+biopipen/reports/protein/ProdigySummary.svelte,sha256=WEYPwmcmgtSqpFpTvNPV40yZR-7ERa5LgZni2RXxUZQ,348
 biopipen/reports/scrna/CellsDistribution.svelte,sha256=Mg6P0tazpzOxsOAtc-0LGEim5KprPt5KIgoW3TzrxxA,413
 biopipen/reports/scrna/DimPlots.svelte,sha256=ZLbtN0ioevRyEky4jb_DkDGAcpy_jAhaHfFym5ELEPM,479
 biopipen/reports/scrna/MarkersFinder.svelte,sha256=77rD1psj0VJykPDhfwS-B8mubvaasREAE6RYR2atTN4,444
@@ -74,7 +76,8 @@ biopipen/reports/utils/gsea.liq,sha256=5uxNPyIr0xd7nrZePJlIsRyqCPx1uVWso7ehE1F-C
 biopipen/reports/utils/misc.liq,sha256=HLK3mkWtIMQqBtM2IIRFUdKKTcY8cvBtyHJB9DbWBdw,1653
 biopipen/reports/vcf/TruvariBenchSummary.svelte,sha256=yew8HRN-YahBzX504Micah5BTnoL_PQzQfN_87TiuOA,577
 biopipen/reports/vcf/TruvariConsistency.svelte,sha256=BBvtxi1EPmGH7j5M5zMOcLEhKWZOlKoXp1lrQGAmz_0,647
-biopipen/scripts/bam/BamMerge.py,sha256=jyaJI0-TulAxaCzvrYjC8PujH_ECNInevnPbh2_XQtU,3477
+biopipen/scripts/bam/BamMerge.py,sha256=Gd5P8V-CSsTAA8ZrUxetR-I49GjJ3VJNjrqu7-EZwXQ,3642
+biopipen/scripts/bam/BamSampling.py,sha256=Pi6CXAbBFVRGh8-0WrkB-3v3oxinfahQk11H0IdBNmQ,2312
 biopipen/scripts/bam/BamSplitChroms.py,sha256=b7GS2I4X0dLOhlPg_r9-buoIHTWlq6zHI3Rox94LXR8,4893
 biopipen/scripts/bam/CNAClinic.R,sha256=mQXwtShL54HZXGCPqgPKPrU74_6K_8PqtOtG0mgA-F0,5062
 biopipen/scripts/bam/CNVpytor.py,sha256=hOUli9BDMOoth0or-tjUYC1AP3yNOuxUS6G3Rhcg99s,18000
@@ -120,7 +123,9 @@ biopipen/scripts/plot/Manhattan.R,sha256=7lJwCX1d0zUpJVhVcmQ35ZtQELzkaDNnBTNHHc3
 biopipen/scripts/plot/QQPlot.R,sha256=Xil19FJ7jbsxo1yU7dBhhZo2_95Gz6gpTyuv9F0RDNM,4115
 biopipen/scripts/plot/ROC.R,sha256=cjmmYRQycYisqRmlkZE9nbmwfo-04wdJKVmlOsiEFAM,2451
 biopipen/scripts/plot/Scatter.R,sha256=fg4H5rgdr6IePTMAIysiElnZme0vCh1T0wrwH2Q9xkM,2840
-biopipen/scripts/plot/VennDiagram.R,sha256=IQG4OLXdORbmKMWca7dtSDX_RdH8FCrpDfi3eMae7G8,773
+biopipen/scripts/plot/VennDiagram.R,sha256=Am9umSGr2QxZc2MIMGMBhpoEqta3qt_ItF-9_Y53SXE,704
+biopipen/scripts/protein/Prodigy.py,sha256=W56e51SkaWqthrkCSr2HUqhE9NfJQWZj4y0HXIqaYRA,4459
+biopipen/scripts/protein/ProdigySummary.R,sha256=1s3ofk6Kvs--GAAvzV8SdAyq5LrYozWtIlL32b6ZarE,3806
 biopipen/scripts/regulatory/MotifAffinityTest.R,sha256=1sR3sWRZbxDeFO290LcpzZglzOLc13SSvibDON96PCg,8852
 biopipen/scripts/regulatory/MotifAffinityTest_AtSNP.R,sha256=SAyTm2-6g5qVJFRrLxEY0QJrLWTkwDi_J_9J7HhtTN8,4438
 biopipen/scripts/regulatory/MotifAffinityTest_MotifBreakR.R,sha256=wCK4tLx1iWh_OwW7ZvLTCjTGWCIfVqw-lYC0-JqIPqg,3338
@@ -164,7 +169,7 @@ biopipen/scripts/scrna/SeuratClustering-common.R,sha256=JX4Cn2FC6GOcBqaVyGDD3MM5
 biopipen/scripts/scrna/SeuratClustering.R,sha256=0OKRBQ5rFuupK7c03_sSt2HMwMdMnCYFqTvkRXFKchs,1706
 biopipen/scripts/scrna/SeuratFilter.R,sha256=BrYK0MLdaTtQvInMaQsmOt7oH_hlks0M1zykkJtg2lM,509
 biopipen/scripts/scrna/SeuratLoading.R,sha256=ekWKnHIqtQb3kHVQiVymAHXXqiUxs6KKefjZKjaykmk,900
-biopipen/scripts/scrna/SeuratMap2Ref.R,sha256=KARt5IVBDYpNhLZ7_j0FEi1u5S8PxU_mB4THH26s7AM,12008
+biopipen/scripts/scrna/SeuratMap2Ref.R,sha256=B0RZ2k1IUKdhe34SjU-8CxvYGj7ub-z7JJaSE0snCok,12040
 biopipen/scripts/scrna/SeuratMetadataMutater.R,sha256=PMwG0Xvl_EEVKkicfrIi4arEqpY948PkYLkb59kTAXI,1135
 biopipen/scripts/scrna/SeuratPreparing-common.R,sha256=WuD7lGS17eAUQWSiIdAoV0EIeqS3Tnkkx-7PbP6Q3tc,16279
 biopipen/scripts/scrna/SeuratPreparing-doublet_detection.R,sha256=TNN2lfFjpnnO0rguMsG38JYCP1nFUhcPLJ1LqGj-Sc8,6674
@@ -274,12 +279,12 @@ biopipen/utils/io.R,sha256=jIYdqdn0iRWfQYAZa5CjXi3fikqmYvPPLIXhobRe8sw,537
 biopipen/utils/misc.R,sha256=qTninxi9XAM_3QJqwThflGA-j7p1aKpQ9Pjmix6Iy3U,12059
 biopipen/utils/misc.py,sha256=nkQHa3GMc7Ce0N2GKmucbRc8BMXgZ2yr_SPbq9RYA4s,3740
 biopipen/utils/mutate_helpers.R,sha256=Bqy6Oi4rrPEPJw0Jq32bVAwwBfZv7JJL9jFcK5x-cek,17649
-biopipen/utils/plot.R,sha256=pzl37PomNeUZPxohHZ2w93j3Fc4T0Qrc62FF-9MTKdw,4417
+biopipen/utils/plot.R,sha256=fmWnCv6EpOU8NvHFvShbdPRqB659vHcDlJAqWIXM8XQ,4415
 biopipen/utils/reference.py,sha256=oi5evicLwHxF0KAIPNZohBeHJLJQNWFJH0cr2y5pgcg,5873
 biopipen/utils/rnaseq.R,sha256=Ro2B2dG-Z2oVaT5tkwp9RHBz4dp_RF-JcizlM5GYXFs,1298
 biopipen/utils/single_cell.R,sha256=pJjYP8bIZpNAtTQ32rOXhZxaM1Y-6D-xUcK3pql9tbk,4316
 biopipen/utils/vcf.py,sha256=ajXs0M_QghEctlvUlSRjWQIABVF02wPdYd-0LP4mIsU,9377
-biopipen-0.31.3.dist-info/METADATA,sha256=8EHJ3ymJf16BFc_fq11-5SnzC3XwuJw67fXEpe2vYlM,882
-biopipen-0.31.3.dist-info/WHEEL,sha256=sP946D7jFCHeNz5Iq4fL4Lu-PrWrFsgfLXbbkciIZwg,88
-biopipen-0.31.3.dist-info/entry_points.txt,sha256=69SbeMaF47Z2DS40yo-qDyoBKmMmumrNnsjEZMOioCE,625
-biopipen-0.31.3.dist-info/RECORD,,
+biopipen-0.31.5.dist-info/METADATA,sha256=mRJi-cY3E8tLValjumEgu28oAiy5NNpFMQRsrNiRPVg,882
+biopipen-0.31.5.dist-info/WHEEL,sha256=sP946D7jFCHeNz5Iq4fL4Lu-PrWrFsgfLXbbkciIZwg,88
+biopipen-0.31.5.dist-info/entry_points.txt,sha256=BYqHGBQJxyFDNLYqgH64ycI5PYwnlqwYcCFsMvJgzAU,653
+biopipen-0.31.5.dist-info/RECORD,,

{biopipen-0.31.3.dist-info → biopipen-0.31.5.dist-info}/entry_points.txt RENAMED Viewed

@@ -11,6 +11,7 @@ gene=biopipen.ns.gene
 gsea=biopipen.ns.gsea
 misc=biopipen.ns.misc
 plot=biopipen.ns.plot
+protein=biopipen.ns.protein
 regulatory=biopipen.ns.regulatory
 rnaseq=biopipen.ns.rnaseq
 scrna=biopipen.ns.scrna

{biopipen-0.31.3.dist-info → biopipen-0.31.5.dist-info}/WHEEL RENAMED Viewed

File without changes

biopipen 0.31.3__py3-none-any.whl → 0.31.5__py3-none-any.whl

Potentially problematic release.

biopipen 0.31.3__py3-none-any.whl → 0.31.5__py3-none-any.whl