PyPI - biopipen - Versions diffs - 0.27.1__py3-none-any.whl → 0.27.3__py3-none-any.whl - Mend

biopipen 0.27.1__py3-none-any.whl → 0.27.3__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of biopipen might be problematic. Click here for more details.

Files changed (18)

biopipen/__init__.py +1 -1
biopipen/ns/scrna.py +8 -0
biopipen/ns/snp.py +18 -15
biopipen/ns/tcr.py +73 -0
biopipen/scripts/scrna/MarkersFinder.R +30 -5
biopipen/scripts/scrna/MetaMarkers.R +17 -3
biopipen/scripts/scrna/RadarPlots.R +2 -2
biopipen/scripts/scrna/ScFGSEA.R +21 -4
biopipen/scripts/scrna/SeuratPreparing.R +113 -1
biopipen/scripts/snp/PlinkSimulation.py +119 -83
biopipen/scripts/stats/DiffCoexpr.R +3 -3
biopipen/scripts/tcr/CloneResidency.R +16 -4
biopipen/scripts/tcr/TCRDock.py +106 -0
biopipen/utils/misc.py +5 -1
{biopipen-0.27.1.dist-info → biopipen-0.27.3.dist-info}/METADATA +3 -2
{biopipen-0.27.1.dist-info → biopipen-0.27.3.dist-info}/RECORD +18 -17
{biopipen-0.27.1.dist-info → biopipen-0.27.3.dist-info}/WHEEL +0 -0
{biopipen-0.27.1.dist-info → biopipen-0.27.3.dist-info}/entry_points.txt +0 -0

biopipen/__init__.py CHANGED Viewed

	@@ -1 +1 @@
1	- __version__ = "0.27.1"
1	+ __version__ = "0.27.3"

biopipen/ns/scrna.py CHANGED Viewed

@@ -201,6 +201,13 @@ class SeuratPreparing(Proc):
                 - scvi: Same as `scVIIntegration`.
             - <more>: See <https://satijalab.org/seurat/reference/integratelayers>
+        DoubletFinder (ns): Arguments to run [`DoubletFinder`](https://github.com/chris-mcginnis-ucsf/DoubletFinder).
+            See also <https://demultiplexing-doublet-detecting-docs.readthedocs.io/en/latest/DoubletFinder.html>.
+            To disable `DoubletFinder`, set `envs.DoubletFinder` to `None` or `False`; or set `pcs` to `0`.
+            - PCs (type=int): Number of PCs to use for 'doubletFinder' function.
+            - doublets (type=float): Number of expected doublets as a proportion of the pool size.
+            - pN (type=float): Number of doublets to simulate as a proportion of the pool size.
     Requires:
         r-seurat:
             - check: {{proc.lang}} <(echo "library(Seurat)")
@@ -227,6 +234,7 @@ class SeuratPreparing(Proc):
             "min_cells": 5,
         },
         "IntegrateLayers": {"method": "harmony"},
+        "DoubletFinder": {"PCs": 0, "pN": 0.25, "doublets": 0.075},
     }
     script = "file://../scripts/scrna/SeuratPreparing.R"
     plugin_opts = {

biopipen/ns/snp.py CHANGED Viewed

@@ -7,12 +7,15 @@ from ..core.config import config
 class PlinkSimulation(Proc):
     """Simulate SNPs using PLINK v1.9
-    See also <https://www.cog-genomics.org/plink/1.9/input#simulate>.
+    See also <https://www.cog-genomics.org/plink/1.9/input#simulate> and
+    <https://pwwang.github.io/biopipen/api/biopipen.ns.snp/#biopipen.ns.snp.PlinkSimulation>
     Input:
-        nsnps: Number of SNPs to simulate
-        ncases: Number of cases to simulate
-        nctrls: Number of controls to simulate
+        configfile: Configuration file containing the parameters for the simulation.
+            The configuration file (in toml, yaml or json format) should contain a
+            dictionary of parameters.  The parameters are listed in `envs` except
+            `ncores`, which is used for parallelization. You can set parameters
+            in `envs` and override them in the configuration file.
     Output:
         outdir: Output directory containing the simulated data
@@ -21,9 +24,11 @@ class PlinkSimulation(Proc):
             SNPs and columns representing samples.
     Envs:
+        nsnps (type=int): Number of SNPs to simulate
+        ncases (type=int): Number of cases to simulate
+        nctrls (type=int): Number of controls to simulate
         plink: Path to PLINK v1.9
-        seed (type=int): Random seed.
-            If not set, seed will not be set.
+        seed (type=int): Random seed. If not set, seed will not be set.
         label: Prefix label for the SNPs.
         prevalence  (type=float): Disease prevalence.
         minfreq (type=float): Minimum allele frequency.
@@ -41,19 +46,17 @@ class PlinkSimulation(Proc):
             This only affects the sample names in the genotype matrix file
             (`out.gtmat`).
     """
-    input = "nsnps:var, ncases:var, nctrls:var"
+    input = "configfile:file"
     output = [
-        (
-            "outdir:dir:{{in.nsnps | int}}_"
-            "{{in.ncases | int}}xcases_{{in.nctrls | int}}xctrls.plink_sim"
-        ),
-        (
-            "gtmat:file:{{in.nsnps | int}}_"
-            "{{in.ncases | int}}xcases_{{in.nctrls | int}}xctrls.plink_sim/gtmat.txt"
-        ),
+        "outdir:dir:{{in.configfile | stem}}.plink_sim",
+        "gtmat:file:{{in.configfile | stem}}.plink_sim/"
+        "{{in.configfile | stem}}-gtmat.txt",
     ]
     lang = config.lang.python
     envs = {
+        "nsnps": None,
+        "ncases": None,
+        "nctrls": None,
         "plink": config.exe.plink,
         "seed": None,
         "label": "SNP",

biopipen/ns/tcr.py CHANGED Viewed

@@ -983,6 +983,7 @@ class CloneResidency(Proc):
             before calculating the clone residency. For example, `Clones > 1` to filter
             out singletons.
         prefix: The prefix of the cell barcodes in the `Seurat` object.
+        upset_ymax: The maximum value of the y-axis in the upset bar plots.
         upset_trans: The transformation to apply to the y axis of upset bar plots.
             For example, `log10` or `sqrt`. If not specified, the y axis will be
             plotted as is. Note that the position of the bar plots will be dodged
@@ -1007,6 +1008,7 @@ class CloneResidency(Proc):
         "mutaters": {},
         "subset": None,
         "prefix": "{Sample}_",
+        "upset_ymax": None,
         "upset_trans": None,
         "cases": {},
     }
@@ -1595,3 +1597,74 @@ class TESSA(Proc):
     }
     script = "file://../scripts/tcr/TESSA.R"
     plugin_opts = {"report": "file://../reports/tcr/TESSA.svelte"}
+class TCRDock(Proc):
+    """Using TCRDock to predict the structure of MHC-peptide-TCR complexes
+    See <https://github.com/phbradley/TCRdock>.
+    Input:
+        configfile: The config file for TCRDock
+            It's should be a toml file with the keys listed in `envs`, including
+            `organism`, `mhc_class`, `mhc`, `peptide`, `va`, `ja`, `vb`, `jb`,
+            `cdr3a`, and `cdr3b`.
+            The values will overwrite the values in `envs`.
+    Output:
+        outdir: The output directory containing the results
+    Envs:
+        organism: The organism of the TCR, peptide and MHC
+        mhc_class (type=int): The MHC class, either `1` or `2`
+        mhc: The MHC allele, e.g., `A*02:01`
+        peptide: The peptide sequence
+        va: The V alpha gene
+        ja: The J alpha gene
+        vb: The V beta gene
+        jb: The J beta gene
+        cdr3a: The CDR3 alpha sequence
+        cdr3b: The CDR3 beta sequence
+        python: The path of python with dependencies for `tcrdock` installed.
+            If not provided, `TCRDock.lang` will be used (the same interpreter
+            used for the wrapper script).
+            It could also be a list to specify, for example, a python in a conda
+            environment (e.g., `["conda", "run", "-n", "myenv", "python"]`).
+        tmpdir: The temporary directory used to clone the `tcrdock` source code if
+            `envs.tcrdock` is not provided.
+        tcrdock: The path to the `tcrdock` source code repo.
+            You need to clone the source code from the github repository.
+            <https://github.com/phbradley/TCRdock> at
+            revision c5a7af42eeb0c2a4492a4d4fe803f1f9aafb6193 at main branch.
+            You also have to run `download_blast.py` after cloning to download the
+            blast database in the directory.
+            If not provided, we will clone the source code to the `envs.tmpdir`
+            directory and run the `download_blast.py` script.
+        model_name: The model name to use
+        model_file: The model file to use.
+            If provided as a relative path, it should be relative to the
+            `<envs.data_dir>/params/`, otherwise, it should be the full path.
+        data_dir: The data directory that contains the model files.
+            The model files should be in the `params` subdirectory.
+    """
+    input = "configfile:file"
+    output = "outdir:dir:{{in.configfile | stem}}.tcrdock"
+    lang = config.lang.python
+    envs = {
+        "tcrdock": None,
+        "organism": "human",
+        "mhc_class": 1,
+        "mhc": "A*02:01",
+        "peptide": None,
+        "va": None,
+        "ja": None,
+        "vb": None,
+        "jb": None,
+        "cdr3a": None,
+        "cdr3b": None,
+        "python": None,
+        "model_name": "model_2_ptm_ft4",
+        "model_file": "tcrpmhc_run4_af_mhc_params_891.pkl",
+        "data_dir": None,
+    }
+    script = "file://../scripts/tcr/TCRDock.py"

biopipen/scripts/scrna/MarkersFinder.R CHANGED Viewed

@@ -120,7 +120,7 @@ expand_each <- function(name, case) {
                     pull(case$each) %>% na.omit() %>% unique() %>% as.vector()
             }
             for (each in eachs) {
-                by <- make.names(paste0(".", name, "_", case$each,"_", each))
+                by <- make.names(paste0("..", name, "_", case$each,"_", each))
                 srtobj@meta.data <<- srtobj@meta.data %>% mutate(
                     !!sym(by) := if_else(
                         !!sym(case$each) == each,
@@ -364,6 +364,16 @@ add_case_report <- function(info, sigmarkers, siggenes) {
     }
 }
+ensure_sobj <- function(expr, allow_empty) {
+    tryCatch({ expr }, error = function(e) {
+        if (allow_empty) {
+            log_warn("  Ignoring this case: {e$message}")
+            return(NULL)
+        } else {
+            stop(e)
+        }
+    })
+}
 do_case_findall <- function(casename) {
     # casename
@@ -382,10 +392,17 @@ do_case_findall <- function(casename) {
     # args$min.cells.group <- args$min.cells.group %||% 1
     # args$min.cells.feature <- args$min.cells.feature %||% 1
     # args$min.pct <- args$min.pct %||% 0
+    allow_empty = startsWith(case$group.by, "..")
     if (!is.null(case$subset)) {
-        args$object <- srtobj %>% filter(!!parse_expr(case$subset) & !is.na(!!sym(case$group.by)))
+        args$object <- ensure_sobj({
+            srtobj %>% filter(!!parse_expr(case$subset) & !is.na(!!sym(case$group.by)))
+        }, allow_empty)
+        if (is.null(args$object)) { return() }
     } else {
-        args$object <- srtobj %>% filter(!is.na(!!sym(case$group.by)))
+        args$object <- ensure_sobj({
+            srtobj %>% filter(!is.na(!!sym(case$group.by)))
+        }, allow_empty)
+        if (is.null(args$object)) { return() }
     }
     Idents(args$object) <- case$group.by
@@ -486,11 +503,19 @@ do_case <- function(casename) {
     # sigmarkers
     # rest
     args <- case$rest
+    allow_empty = startsWith(case$group.by, "..")
     if (!is.null(case$subset)) {
-        args$object <- srtobj %>% filter(!!parse_expr(case$subset) & !is.na(!!sym(case$group.by)))
+        args$object <- ensure_sobj({
+            srtobj %>% filter(!!parse_expr(case$subset) & !is.na(!!sym(case$group.by)))
+        }, allow_empty)
+        if (is.null(args$object)) { return() }
     } else {
-        args$object <- srtobj %>% filter(!is.na(!!sym(case$group.by)))
+        args$object <- ensure_sobj({
+            srtobj %>% filter(!is.na(!!sym(case$group.by)))
+        }, allow_empty)
+        if (is.null(args$object)) { return() }
     }
     args$assay <- case$assay
     args$group.by <- case$group.by
     args$ident.1 <- case$ident.1

biopipen/scripts/scrna/MetaMarkers.R CHANGED Viewed

@@ -76,7 +76,7 @@ expand_each <- function(name, case) {
                 pull(case$each) %>% unique() %>% na.omit()
         }
         for (each in eachs) {
-            by = make.names(paste0(".", name, "_", case$each, "_", each))
+            by = make.names(paste0("..", name, "_", case$each, "_", each))
             idents <- case$idents
             if (is.null(idents) || length(idents) == 0) {
                 srtobj@meta.data = srtobj@meta.data %>%
@@ -169,17 +169,31 @@ do_enrich <- function(info, markers, sig) {
     }
 }
+ensure_sobj <- function(expr, allow_empty) {
+    tryCatch({ expr }, error = function(e) {
+        if (allow_empty) {
+            log_warn("  Ignoring this case: {e$message}")
+            return(NULL)
+        } else {
+            stop(e)
+        }
+    })
+}
 do_case <- function(casename) {
     log_info("- Dealing with case: {casename} ...")
     info <- casename_info(casename, cases, outdir, create = TRUE)
     case <- cases[[casename]]
+    allow_empty = startsWith(case$group_by, "..")
     if (sum(!is.na(srtobj@meta.data[[case$group_by]])) == 0) {
         msg = "Not enough cells to run tests."
     } else {
-        sobj <- srtobj %>% filter(!is.na(!!sym(case$group_by)))
+        sobj <- ensure_sobj({ srtobj %>% filter(!is.na(!!sym(case$group_by))) }, allow_empty)
+        if (is.null(sobj)) { return() }
         if (!is.null(case$subset)) {
-            sobj <- srtobj %>% filter(!is.na(!!sym(case$group_by)), !!parse_expr(case$subset))
+            sobj <- ensure_sobj({ sobj %>% filter(!!parse_expr(case$subset)) }, allow_empty)
+            if (is.null(sobj)) { return() }
         }
         df <- tryCatch({
                 GetAssayData(sobj, layer = "data")

biopipen/scripts/scrna/RadarPlots.R CHANGED Viewed

@@ -74,10 +74,10 @@ expand_each <- function(name,  case) {
         }
     } else {
         if (is.null(case$subset)) {
-            eachs <- srtobj@meta.data %>%
+            eachs <- meta %>%
                 pull(case$each) %>% unique() %>% na.omit() %>% as.vector()
         } else {
-            eachs <- srtobj@meta.data %>% filter(!!parse_expr(case$subset)) %>%
+            eachs <- meta %>% filter(!!parse_expr(case$subset)) %>%
                 pull(case$each) %>% unique() %>% na.omit() %>% as.vector()
         }
         for (each in eachs) {

biopipen/scripts/scrna/ScFGSEA.R CHANGED Viewed

@@ -72,7 +72,7 @@ expand_each <- function(name, case) {
                 pull(case$each) %>% na.omit() %>% unique() %>% as.vector()
         }
         for (each in eachs) {
-            by <- make.names(paste0(".", name, "_", case$each,"_", each))
+            by <- make.names(paste0("..", name, "_", case$each,"_", each))
             srtobj@meta.data <<- srtobj@meta.data %>%
                 mutate(!!sym(by) := if_else(
                     !!sym(case$each) == each,
@@ -97,18 +97,35 @@ log_info("- Expanding cases...")
 cases <- expand_cases(cases, defaults, expand_each)
+ensure_sobj <- function(expr, allow_empty) {
+    tryCatch({ expr }, error = function(e) {
+        if (allow_empty) {
+            log_warn("  Ignoring this case: {e$message}")
+            return(NULL)
+        } else {
+            stop(e)
+        }
+    })
+}
 do_case <- function(name, case) {
     log_info("- Handling case: {name} ...")
     info <- casename_info(name, cases, outdir, create = TRUE)
+    allow_empty = startsWith(case$group.by, "..")
     # prepare expression matrix
     log_info("  Preparing expression matrix...")
-    sobj <- srtobj %>% filter(!is.na(!!sym(case$group.by)))
+    sobj <- ensure_sobj({ srtobj %>% filter(!is.na(!!sym(case$group.by))) }, allow_empty)
+    if (is.null(sobj)) { return() }
     if (!is.null(case$subset)) {
-        sobj <- sobj %>% filter(!!!parse_exprs(case$subset))
+        sobj <- ensure_sobj({ sobj %>% filter(!!!parse_exprs(case$subset)) }, allow_empty)
+        if (is.null(sobj)) { return() }
     }
     if (!is.null(case$ident.2)) {
-        sobj <- sobj %>% filter(!!sym(case$group.by) %in% c(case$ident.1, case$ident.2))
+        sobj <- ensure_sobj({ sobj %>% filter(!!sym(case$group.by) %in% c(case$ident.1, case$ident.2)) }, allow_empty)
+        if (is.null(sobj)) { return() }
     }
     allclasses <- sobj@meta.data[, case$group.by, drop = TRUE]

biopipen/scripts/scrna/SeuratPreparing.R CHANGED Viewed

@@ -13,6 +13,7 @@ envs = {{envs | r: todot = "-", skip = 1}}
 set.seed(8525)
 options(future.globals.maxSize = 80000 * 1024^2)
+options(future.rng.onMisuse="ignore")
 options(Seurat.object.assay.version = "v5")
 plan(strategy = "multicore", workers = envs$ncores)
@@ -342,7 +343,7 @@ RunPCAArgs$object <- sobj
 sobj <- do_call(RunPCA, RunPCAArgs)
 if (!envs$no_integration) {
-    log_info("- Running IntegrateLayers ...")
+    log_info("- Running IntegrateLayers (method = {envs$IntegrateLayers$method}) ...")
     IntegrateLayersArgs <- envs$IntegrateLayers
     method <- IntegrateLayersArgs$method
     if (!is.null(IntegrateLayersArgs$reference) && is.character(IntegrateLayersArgs$reference)) {
@@ -383,6 +384,117 @@ if (!envs$use_sct) {
     sobj <- JoinLayers(sobj)
 }
+if (!is.null(envs$DoubletFinder) && is.list(envs$DoubletFinder) && envs$DoubletFinder$PCs > 0) {
+    library(DoubletFinder)
+    log_info("Running DoubletFinder ...")
+    log_info("- Preparing Seurat object ...")
+    # More controls from envs?
+    sobj <- FindNeighbors(sobj, dims = 1:envs$DoubletFinder$PCs)
+    sobj <- FindClusters(sobj)
+    log_info("- pK Indentification ...")
+    sweep.res.list <- paramSweep(
+        sobj,
+        PCs = 1:envs$DoubletFinder$PCs,
+        sct = envs$use_sct,
+        num.cores = envs$ncores
+    )
+    sweep.stats <- summarizeSweep(sweep.res.list, GT = FALSE)
+    bcmvn <- find.pK(sweep.stats)
+    bcmvn$Selected <- bcmvn$pK == bcmvn$pK[which.max(bcmvn$BCmetric)[1]]
+    plot <- ggplot(bcmvn, aes(x = pK, y = BCmetric, color = Selected)) +
+        geom_point() +
+        # rotate x axis labels
+        theme(axis.text.x = element_text(angle = 90, hjust = 1))
+    ggsave(plot, filename = file.path(plotsdir, "pK_BCmetric.png"))
+    pK <- bcmvn$pK[which.max(bcmvn$BCmetric)[1]]
+    pK <- as.numeric(as.character(pK))
+    pN <- envs$DoubletFinder$pN
+    log_info("- Homotypic Doublet Proportion Estimate ...")
+    homotypic.prop <- modelHomotypic(Idents(sobj))
+    nExp_poi <- round(nrow(sobj@meta.data) * envs$DoubletFinder$doublets)
+    nExp_poi.adj <- round(nExp_poi * (1 - homotypic.prop))
+    log_info("- Running DoubletFinder ...")
+    sobj <- doubletFinder(
+        sobj,
+        PCs = 1:envs$DoubletFinder$PCs,
+        pN = pN,
+        pK = pK,
+        nExp = nExp_poi.adj,
+        reuse.pANN = FALSE,
+        sct = envs$use_sct
+    )
+    pANN_col <- paste0("pANN_", pN, "_", pK)
+    pANN_col <- colnames(sobj@meta.data)[grepl(pANN_col, colnames(sobj@meta.data))]
+    DF_col <- paste0("DF.classifications_", pN, "_", pK)
+    DF_col <- colnames(sobj@meta.data)[grepl(DF_col, colnames(sobj@meta.data))]
+    doublets <- as.data.frame(
+        cbind(
+            colnames(sobj),
+            sobj@meta.data[, pANN_col],
+            sobj@meta.data[, DF_col]
+        )
+    )
+    colnames(doublets) <-  c("Barcode","DoubletFinder_score","DoubletFinder_DropletType")
+    write.table(
+        doublets,
+        file.path(joboutdir, "DoubletFinder_doublets_singlets.txt"),
+        row.names = FALSE,
+        quote = FALSE,
+        sep = "\t"
+    )
+    summary <- as.data.frame(table(doublets$DoubletFinder_DropletType))
+    colnames(summary) <- c("Classification", "Droplet_N")
+    write.table(
+        summary,
+        file.path(joboutdir, "DoubletFinder_summary.txt"),
+        row.names = FALSE,
+        quote = FALSE,
+        sep = "\t"
+    )
+    # Do a dimplot
+    log_info("- Plotting dimension reduction ...")
+    dimp <- DimPlot(
+        sobj, group.by = DF_col, order = "Doublet",
+        cols = c("#333333", "#FF3333"), pt.size = 0.8, alpha = 0.5)
+    ggsave(dimp, filename = file.path(plotsdir, "DoubletFinder_dimplot.png"))
+    log_info("- Filtering doublets ...")
+    sobj <- subset(sobj, cells = doublets$Barcode[doublets$DoubletFinder_DropletType == "Singlet"])
+    add_report(
+        list(
+            kind = "descr",
+            content = "The table contains the number of cells classified as singlets and doublets."
+        ),
+        list(
+            kind = "table",
+            data = list(path = file.path(joboutdir, "DoubletFinder_summary.txt"))
+        ),
+        h1 = "DoubletFinder Results",
+        h2 = "The DoubletFinder Summary"
+    )
+    add_report(
+        list(
+            name = "pK vs BCmetric",
+            src = file.path(plotsdir, "pK_BCmetric.png")
+        ),
+        list(
+            name = "Dimension Reduction Plot",
+            src = file.path(plotsdir, "DoubletFinder_dimplot.png")
+        ),
+        ui = "table_of_images",
+        h1 = "DoubletFinder Results",
+        h2 = "Plots"
+    )
+}
 log_info("Saving filtered seurat object ...")
 saveRDS(sobj, rdsfile)

biopipen/scripts/snp/PlinkSimulation.py CHANGED Viewed

@@ -1,88 +1,124 @@
 from pathlib import Path
+from multiprocessing import Pool
+from slugify import slugify
+from simpleconf import Config
 from biopipen.utils.misc import logger, run_command, dict_to_cli_args
-nsnps = {{in.nsnps | repr}}  # pyright: ignore
-ncases = {{in.ncases | repr}}  # pyright: ignore
-nctrls = {{in.nctrls | repr}}  # pyright: ignore
+configfile = {{in.configfile | repr}}  # pyright: ignore # noqa: E999
 outdir = {{out.outdir | repr}}  # pyright: ignore
 gtmatfile = {{out.gtmat | repr}}  # pyright: ignore
-plink = {{envs.plink | repr}}  # pyright: ignore
-seed = {{envs.seed | repr}}  # pyright: ignore
-label = {{envs.label | repr}}  # pyright: ignore
-prevalence = {{envs.prevalence | repr}}  # pyright: ignore
-minfreq = {{envs.minfreq | repr}}  # pyright: ignore
-maxfreq = {{envs.maxfreq | repr}}  # pyright: ignore
-hetodds = {{envs.hetodds | repr}}  # pyright: ignore
-homodds = {{envs.homodds | repr}}  # pyright: ignore
-missing = {{envs.missing | repr}}  # pyright: ignore
-args = {{envs.args | repr}}  # pyright: ignore
-transpose_gtmat = {{envs.transpose_gtmat | repr}}  # pyright: ignore
-sample_prefix = {{envs.sample_prefix | repr}}  # pyright: ignore
-logger.info("Generating parameters file")
-params_file = Path(outdir) / "params.txt"
-params_file.write_text(
-    f"{nsnps}\t{label}\t{minfreq}\t{maxfreq}\t{hetodds}\t{homodds}\n"
-)
-if seed is not None:
-    args["seed"] = seed
-args["simulate"] = params_file
-args["out"] = Path(outdir) / "sim_snps"
-args["simulate-ncases"] = ncases
-args["simulate-ncontrols"] = nctrls
-args["simulate-prevalence"] = prevalence
-args["simulate-missing"] = missing
-cmd = [plink] + dict_to_cli_args(args)
-logger.info("Running PLINK simulation ...")
-run_command(cmd, fg=True)
-# Transpose the genotype matrix
-# CHR	SNP	(C)M	POS	COUNTED	ALT	per0_per0	per1_per1	per2_per2
-# 1	SNP_0	0	1	D	d	1	0	1
-# 1	SNP_1	0	2	d	D	0	1	0
-# 1	SNP_2	0	3	d	D	0	0	0
-# 1	SNP_3	0	4	d	D	0	0	0
-# 1	SNP_4	0	5	D	d	1	2	1
-cmd = [
-    plink,
-    "--recode",
-    "A" if transpose_gtmat else "A-transpose",
-    "tab",
-    "--bfile",
-    args["out"],
-    "--out",
-    gtmatfile + ".plink.recoded",
-]
-logger.info("Recoding into genotype matrix ...")
-run_command(cmd, fg=True)
-logger.info("Saving genotype matrix ...")
-## transpose_gtmat = False
-# SNP_COUNTED	per0_per0	per1_per1	per2_per2
-# SNP_0_D	1	0	1
-# SNP_1_d	0	1	0
-# SNP_2_d	0	0	0
-# SNP_3_d	0	0	0
-# SNP_4_D	1	2	1
-## transpose_gtmat = True
-# FID_IID SNP_0_D SNP_1_D SNP_2_D
-# per0_per0 0 1 1
-# per1_per1 0 2 0
-# per2_per2 0 0 0
-# per3_per3 1 1 0
-# per4_per4 0 0 0
-if transpose_gtmat:
-    cmd = f"cut -f1,2,7- {gtmatfile}.plink.recoded.raw | sed 's/\\t/_/'"
-else:
-    cmd = f"cut -f2,5,7- {gtmatfile}.plink.recoded.traw | sed 's/\\t/_/'"
-if sample_prefix:
-    cmd = f"{cmd} | sed 's/per[0-9]\\+_per/{sample_prefix}/g'"
-cmd = f"{cmd} > {gtmatfile}"
-run_command(cmd, fg=True)
+config = Config.load(configfile)
+default_nsnps = {{envs.nsnps | repr}}  # pyright: ignore
+default_ncases = {{envs.ncases | repr}}  # pyright: ignore
+default_nctrls = {{envs.nctrls | repr}}  # pyright: ignore
+default_plink = {{envs.plink | repr}}  # pyright: ignore
+default_seed = {{envs.seed | repr}}  # pyright: ignore
+default_label = {{envs.label | repr}}  # pyright: ignore
+default_prevalence = {{envs.prevalence | repr}}  # pyright: ignore
+default_minfreq = {{envs.minfreq | repr}}  # pyright: ignore
+default_maxfreq = {{envs.maxfreq | repr}}  # pyright: ignore
+default_hetodds = {{envs.hetodds | repr}}  # pyright: ignore
+default_homodds = {{envs.homodds | repr}}  # pyright: ignore
+default_missing = {{envs.missing | repr}}  # pyright: ignore
+default_args = {{envs.args | repr}}  # pyright: ignore
+default_transpose_gtmat = {{envs.transpose_gtmat | repr}}  # pyright: ignore
+default_sample_prefix = {{envs.sample_prefix | repr}}  # pyright: ignore
+defaults = {
+    "nsnps": default_nsnps,
+    "ncases": default_ncases,
+    "nctrls": default_nctrls,
+    "plink": default_plink,
+    "seed": default_seed,
+    "label": default_label,
+    "prevalence": default_prevalence,
+    "minfreq": default_minfreq,
+    "maxfreq": default_maxfreq,
+    "hetodds": default_hetodds,
+    "homodds": default_homodds,
+    "missing": default_missing,
+    # "args": default_args,
+    "transpose_gtmat": default_transpose_gtmat,
+    "sample_prefix": default_sample_prefix,
+}
+def do_one_simulation(confitems):
+    args = default_args.copy()
+    args.update(confitems.pop("args", {}))
+    confs = defaults.copy()
+    confs.update(confitems)
+    transpose_gtmat = confs.pop("transpose_gtmat")
+    sample_prefix = confs.pop("sample_prefix")
+    logger.debug("  Generating parameters file")
+    params_file = Path(outdir) / "params.txt"
+    params_file.write_text(
+        f"{confs['nsnps']}\t{confs['label']}\t{confs['minfreq']}\t"
+        f"{confs['maxfreq']}\t{confs['hetodds']}\t{confs['homodds']}\n"
+    )
+    if confs.get('seed') is not None:
+        args["seed"] = confs['seed']
+    args["simulate"] = params_file
+    args["out"] = Path(outdir) / "sim_snps"
+    args["simulate-ncases"] = confs['ncases']
+    args["simulate-ncontrols"] = confs['nctrls']
+    args["simulate-prevalence"] = confs['prevalence']
+    args["simulate-missing"] = confs['missing']
+    cmd = [confs['plink']] + dict_to_cli_args(args)
+    logger.debug("  Running PLINK simulation ...")
+    run_command(cmd, fg=True)
+    # Transpose the genotype matrix
+    # CHR	SNP	(C)M	POS	COUNTED	ALT	per0_per0	per1_per1	per2_per2
+    # 1	SNP_0	0	1	D	d	1	0	1
+    # 1	SNP_1	0	2	d	D	0	1	0
+    # 1	SNP_2	0	3	d	D	0	0	0
+    # 1	SNP_3	0	4	d	D	0	0	0
+    # 1	SNP_4	0	5	D	d	1	2	1
+    cmd = [
+        confs['plink'],
+        "--recode",
+        "A" if transpose_gtmat else "A-transpose",
+        "tab",
+        "--bfile",
+        args["out"],
+        "--out",
+        gtmatfile + ".plink.recoded",
+    ]
+    logger.debug("- Recoding into genotype matrix ...")
+    run_command(cmd, fg=True)
+    logger.debug("  Saving genotype matrix ...")
+    ## transpose_gtmat = False
+    # SNP_COUNTED	per0_per0	per1_per1	per2_per2
+    # SNP_0_D	1	0	1
+    # SNP_1_d	0	1	0
+    # SNP_2_d	0	0	0
+    # SNP_3_d	0	0	0
+    # SNP_4_D	1	2	1
+    ## transpose_gtmat = True
+    # FID_IID SNP_0_D SNP_1_D SNP_2_D
+    # per0_per0 0 1 1
+    # per1_per1 0 2 0
+    # per2_per2 0 0 0
+    # per3_per3 1 1 0
+    # per4_per4 0 0 0
+    if transpose_gtmat:
+        cmd = f"cut -f1,2,7- {gtmatfile}.plink.recoded.raw | sed 's/\\t/_/'"
+    else:
+        cmd = f"cut -f2,5,7- {gtmatfile}.plink.recoded.traw | sed 's/\\t/_/'"
+    if sample_prefix:
+        cmd = f"{cmd} | sed 's/per[0-9]\\+_per/{sample_prefix}/g'"
+    cmd = f"{cmd} > {gtmatfile}"
+    run_command(cmd, fg=True)
+do_one_simulation(config)

biopipen/scripts/stats/DiffCoexpr.R CHANGED Viewed

@@ -42,21 +42,21 @@ diffcoex_score <- function(group) {
     gvals <- unique(gdata[, group, drop = TRUE])
     if (length(gvals) < 2) {
-        log_warn("  Less than 2 groups in the input. Skipping ...")
+        log_debug("  Less than 2 groups in the input. Skipping ...")
         return(NULL)
     }
     rs <- lapply(gvals, function(gval) {
         samples <- rownames(gdata[gdata[[group]] == gval, , drop = FALSE])
         expr <- indata[samples, , drop = FALSE]
         if (length(samples) < 3) {
-            log_warn("  Less than 3 samples in one of the groups. Skipping ...")
+            log_debug("  Less than 3 samples in one of the groups. Skipping ...")
             return(NULL)
         }
         cor.pairs(as.matrix(expr), cor.method = method)
     })
     rs[sapply(rs, is.null)] <- NULL
     if (length(rs) < 2) {
-        log_warn("  Less than 2 groups with at least 3 samples. Skipping ...")
+        log_debug("  Less than 2 groups with at least 3 samples. Skipping ...")
         return(NULL)
     }
     N <- length(rs)

biopipen/scripts/tcr/CloneResidency.R CHANGED Viewed

@@ -26,6 +26,7 @@ section <- {{ envs.section | r }}
 mutaters <- {{ envs.mutaters | r }}
 subset <- {{ envs.subset | r }}
 prefix <- {{ envs.prefix | r }}
+upset_ymax <- {{ envs.upset_ymax | r }}
 upset_trans <- {{ envs.upset_trans | r }}
 cases <- {{ envs.cases | r }}
@@ -40,6 +41,7 @@ if (is.null(cases) || length(cases) == 0) {
             order = sample_order,
             subset = subset,
             section = section,
+            upset_ymax = upset_ymax,
             upset_trans = upset_trans
         )
     )
@@ -50,6 +52,7 @@ if (is.null(cases) || length(cases) == 0) {
         cases[[key]]$order <- cases[[key]]$order %||% sample_order
         cases[[key]]$section <- cases[[key]]$section %||% section
         cases[[key]]$subset <- cases[[key]]$subset %||% subset
+        cases[[key]]$upset_ymax <- cases[[key]]$upset_ymax %||% upset_ymax
         cases[[key]]$upset_trans <- cases[[key]]$upset_trans %||% upset_trans
     }
 }
@@ -320,7 +323,7 @@ plot_venndg <- function(counts, groups, singletons) {
     venn_p
 }
-plot_upset <- function(counts, singletons, upset_trans) {
+plot_upset <- function(counts, singletons, upset_ymax, upset_trans) {
     cnts <- column_to_rownames(counts, "CDR3.aa") %>%
         mutate(across(everything(), ~ as.integer(as.logical(.x))))
@@ -345,12 +348,21 @@ plot_upset <- function(counts, singletons, upset_trans) {
             geom_text(
                 aes(label = ..count.., vjust = ifelse(..type == "Multiplets", -0.25, +1.25)),
                 stat = "count", position = "stack", size = 2.8)
+        if (!is.null(upset_ymax)) {
+            p <- p + ylim(0, upset_ymax)
+        }
     } else {
         p <- p + geom_bar(stat = "count", position = "dodge2") +
             geom_text(
                 aes(label = ..count..),
-                stat = "count", position = position_dodge(width = 0.9), vjust = -0.25, size = 2.5) +
-            scale_y_continuous(trans = "log10")
+                stat = "count", position = position_dodge(width = 0.9), vjust = -0.25, size = 2.5)
+        # limit the y and do log10 transformation
+        if (!is.null(upset_ymax)) {
+            p <- p + scale_y_continuous(trans = "log10", limits = c(1, upset_ymax))
+        } else {
+            p <- p + scale_y_continuous(trans = "log10")
+        }
     }
     upset(
@@ -519,7 +531,7 @@ handle_subject <- function(i, subjects, casename, case) {
     upset_dir <- file.path(casedir, "upset")
     upset_png <- file.path(upset_dir, paste0("upset_", slugify(subject), ".png"))
     png(upset_png, res = 100, height = 600, width = 800)
-    print(plot_upset(counts, singletons, case$upset_trans))
+    print(plot_upset(counts, singletons, case$upset_ymax, case$upset_trans))
     dev.off()
     h <- headings(case$section, casename, "Overlapping Clones (UpSet Plots)")

biopipen/scripts/tcr/TCRDock.py ADDED Viewed

@@ -0,0 +1,106 @@
+import os
+import sys
+from pathlib import Path
+import rtoml
+import pandas as pd
+from tempfile import gettempdir
+from biopipen.utils.misc import logger, run_command
+configfile = {{in.configfile | repr}}  # pyright: ignore
+outdir = Path({{out.outdir | repr}})  # pyright: ignore
+envs = {{envs | dict | repr}}  # pyright: ignore
+python = sys.executable
+args = envs.copy()
+config = rtoml.load(Path(configfile))
+args.update(config)
+model_name = args.pop("model_name")
+model_file = Path(args.pop("model_file"))
+data_dir = args.pop("data_dir", None)
+tcrdock = args.pop("tcrdock", None)
+tmpdir = args.pop("tmpdir", gettempdir())
+python = args.pop("python", python)
+if not isinstance(python, (list, tuple)):
+    python = [python]
+if not data_dir:
+    raise ValueError("`envs.data_dir` is required")
+if not tcrdock:
+    logger.info("- `envs.tcrdock` is not provided, cloning the repository ... ")
+    repo_url = "https://github.com/phbradley/TCRdock"
+    commit_id = "c5a7af42eeb0c2a4492a4d4fe803f1f9aafb6193"
+    branch = "main"
+    from git import Repo
+    repo = Repo.clone_from(repo_url, tmpdir, branch=branch, no_checkout=True)
+    repo.git.checkout(commit_id)
+    tcrdock = Path(tmpdir) / "TCRdock"
+    logger.info("- Running download_blast.py ...")
+    cmd = [
+        *python,
+        tcrdock / "download_blast.py",
+    ]
+    run_command(cmd, fg=True, cwd=str(tcrdock))
+if not model_file.is_absolute():
+    model_file = Path(data_dir) / "params" / model_file
+os.environ['TF_FORCE_UNIFIED_MEMORY'] = '1'
+os.environ['XLA_PYTHON_CLIENT_MEM_FRACTION'] = '4.0'
+logger.info("- Composing targets file ... ")
+targets_file = outdir / "user_targets.tsv"
+targets = pd.DataFrame(
+    [
+        dict(
+            organism=args['organism'],
+            mhc_class=args['mhc_class'],
+            mhc=args['mhc'],
+            peptide=args['peptide'],
+            va=args['va'],
+            ja=args['ja'],
+            cdr3a=args['cdr3a'],
+            vb=args['vb'],
+            jb=args['jb'],
+            cdr3b=args['cdr3b'],
+        )
+    ]
+)
+targets.to_csv(targets_file, sep="\t", index=False)
+logger.info("- Generating inputs for AlphaFold modeling ... ")
+cmd = [
+    *python,
+    tcrdock + "/setup_for_alphafold.py",
+    "--targets_tsvfile", targets_file,
+    "--output_dir", outdir / "user_output",
+    "--new_docking",
+]
+run_command(cmd, fg=True)
+logger.info("- Running AlphaFold modeling ... ")
+cmd = [
+    *python,
+    tcrdock + "/run_prediction.py",
+    "--verbose",
+    "--targets", outdir / "user_output/targets.tsv",
+    "--outfile_prefix", f"{outdir}/{args['peptide']}",
+    "--model_names", model_name,
+    "--data_dir", data_dir,
+    "--model_params_files", model_file,
+]
+run_command(cmd, fg=True, env={"XLA_FLAGS": "--xla_gpu_force_compilation_parallelism=1"})
+logger.info("- Calculating the PAE ... ")
+cmd = [
+    *python,
+    tcrdock + "/add_pmhc_tcr_pae_to_tsvfile.py",
+    "--infile", f"{outdir}/{args['peptide']}_final.tsv",
+    "--outfile", f"{outdir}/{args['peptide']}_w_pae.tsv",
+]
+run_command(cmd, fg=True)

biopipen/utils/misc.py CHANGED Viewed

@@ -1,13 +1,14 @@
 from __future__ import annotations
 from pathlib import Path
+import os
 import sys
 import logging
 from typing import List
 from biopipen.core.filters import dict_to_cli_args  # noqa: F401
 logger = logging.getLogger("biopipen_job")
-logger.setLevel(logging.INFO)
+logger.setLevel(logging.DEBUG)
 _handler = logging.StreamHandler(sys.stdout)
 # Use same log format as in R
 # {sprintf("%-7s", level)} [{format(time, "%Y-%m-%d %H:%M:%S")}] {msg}
@@ -100,6 +101,9 @@ def run_command(
         kwargs["stderr"] = sys.stderr
         kwargs["universal_newlines"] = True
+    if "env" in kwargs:
+        kwargs["env"] = {**os.environ, **kwargs["env"]}
     try:
         p = Popen(cmd, **kwargs)
     except Exception as e:

{biopipen-0.27.1.dist-info → biopipen-0.27.3.dist-info}/METADATA RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.1
 Name: biopipen
-Version: 0.27.1
+Version: 0.27.3
 Summary: Bioinformatics processes/pipelines that can be run from `pipen run`
 License: MIT
 Author: pwwang
@@ -17,6 +17,7 @@ Requires-Dist: datar[pandas] (>=0.15.6,<0.16.0)
 Requires-Dist: pipen-board[report] (>=0.15,<0.16)
 Requires-Dist: pipen-cli-run (>=0.13,<0.14)
 Requires-Dist: pipen-filters (>=0.12,<0.13)
-Requires-Dist: pipen-poplog (>=0.1,<0.2)
+Requires-Dist: pipen-poplog (>=0.1.2,<0.2.0)
 Requires-Dist: pipen-runinfo (>=0.6,<0.7) ; extra == "runinfo"
 Requires-Dist: pipen-verbose (>=0.11,<0.12)
+Requires-Dist: pyyaml-include (==1.*)

{biopipen-0.27.1.dist-info → biopipen-0.27.3.dist-info}/RECORD RENAMED Viewed

@@ -1,4 +1,4 @@
-biopipen/__init__.py,sha256=lnka9HWRxSmlQAffgSpaSitns-Djhy2OArtj9IVwxrY,23
+biopipen/__init__.py,sha256=lxhjPOOCzhlHB02EzaqTtDdBFZSOLV3WLWw2HC0DYvo,23
 biopipen/core/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
 biopipen/core/config.py,sha256=edK5xnDhM8j27srDzsxubi934NMrglLoKrdcC8qsEPk,1069
 biopipen/core/config.toml,sha256=20RCI30Peee1EQdfb_UbV3Hf74XUPndJnYZlUThytsw,1781
@@ -21,12 +21,12 @@ biopipen/ns/gsea.py,sha256=EsNRAPYsagaV2KYgr4Jv0KCnZGqayM209v4yOGGTIOI,7423
 biopipen/ns/misc.py,sha256=fzn0pXvdghMkQhu-e3MMapPNMyO6IAJbtTzVU3GbFa0,3246
 biopipen/ns/plot.py,sha256=yguxmErUOH-hOM10JfuI_sXw2p49XF8yGR_gXfbd5yQ,4066
 biopipen/ns/rnaseq.py,sha256=bKAa6friFWof4yDTWZQahm1MS-lrdetO1GqDKdfxXYc,7708
-biopipen/ns/scrna.py,sha256=eLCXGyVcgq3vQ-br5SFHHmfIVPaJN4kSFxtCiJiYamg,102716
+biopipen/ns/scrna.py,sha256=i9h0xNOII3SqJ_cJOZ5epn8breAsc-yXH_Us04DoZvg,103401
 biopipen/ns/scrna_metabolic_landscape.py,sha256=9s1NvH3aMaNDXyfwy9TdzGcSP_lIW4JqhLgknNZcIKE,28313
-biopipen/ns/snp.py,sha256=upGltsjjl09PWcRVdW6D5WpAQ3oWm1KwxQ026wsQwWc,2583
+biopipen/ns/snp.py,sha256=Nq20NJzQ9YiqE9mhtCUH6dfs7528o1e4N-j9PewjAsQ,3016
 biopipen/ns/stats.py,sha256=yJ6C1CXF84T7DDs9mgufqUOr89Rl6kybE5ji8Vnx6cw,13693
 biopipen/ns/tcgamaf.py,sha256=AFbUJIxiMSvsVY3RcHgjRFuMnNh2DG3Mr5slLNEyz6o,1455
-biopipen/ns/tcr.py,sha256=uggi21Sfsi0F4TkgZHevRnSzS8m4-zmTWyZU6n7eEvw,84825
+biopipen/ns/tcr.py,sha256=5bMnxhbeB08UrAw8YSh2BkA3AUFeoOajhE6DhHt74K4,87863
 biopipen/ns/vcf.py,sha256=cdkKroii0_nl_bSP2cnO09qESUAhHqu6btOiTSKS79Y,15314
 biopipen/ns/web.py,sha256=3zucrDo-IVsSnIvlw-deoScuxqWa6OMTm8Vo-R4E44Q,2224
 biopipen/reports/bam/CNAClinic.svelte,sha256=D4IxQcgDCPQZMbXog-aZP5iJEQTK2N4i0C60e_iXyfs,213
@@ -129,12 +129,12 @@ biopipen/scripts/scrna/ExprImpution-alra.R,sha256=w3W1txJcdWg52-SETY2Z0lO7maDNfi
 biopipen/scripts/scrna/ExprImpution-rmagic.R,sha256=jYIfqZpnvjKJkvItLnemPVtUApHBYQi1_L8rHVbEe1M,735
 biopipen/scripts/scrna/ExprImpution-scimpute.R,sha256=mg40qCUW7-nP5oHPvARq7dmtoahM0GRFWXQpum0BXVk,1082
 biopipen/scripts/scrna/ExprImpution.R,sha256=7768ezrr59xUZDXq8lO9jj2XhnkSsx-xxBmOD9_DO7c,313
-biopipen/scripts/scrna/MarkersFinder.R,sha256=TvLVozCsgL_R-EMW7SbkCRdpchxt9k7Ewwz5nb3TOYo,22172
-biopipen/scripts/scrna/MetaMarkers.R,sha256=J__ZZ4K4P-Jdty1lZhRldu4rAErLxMtDZkRUlOqZea4,10852
+biopipen/scripts/scrna/MarkersFinder.R,sha256=M7fHTbHHErZ9JbLmjDkx-6yVIay0_h0MkvgFegnqL44,22918
+biopipen/scripts/scrna/MetaMarkers.R,sha256=9ve1X0TrDzS_ZEW6HtU3n8R-uPx7q-hYMMNFVDSE8wQ,11272
 biopipen/scripts/scrna/ModuleScoreCalculator.R,sha256=JSHd-_-KiFqW8avCGxgU4T-C5BtDr2u0kwIvEu2lFIg,4188
-biopipen/scripts/scrna/RadarPlots.R,sha256=uXrX2zTQECTnie4aCOvVvD1_X7Jn3_71I7kwXWeNWlY,13044
+biopipen/scripts/scrna/RadarPlots.R,sha256=TGPUTUcHOHgd9rsNtLYT-N6WHiFNDBZsiIoqkyAJh0A,13020
 biopipen/scripts/scrna/SCImpute.R,sha256=dSJOHhmJ3x_72LBRXT72dbCti5oiB85CJ-OjWtqONbk,2958
-biopipen/scripts/scrna/ScFGSEA.R,sha256=M6YeqUNa_0bq1qmL8dutQR3o5v2jy_gICCLaWw5c3A4,5738
+biopipen/scripts/scrna/ScFGSEA.R,sha256=2UCTCIydVkPGvn7WP-_fcE7857iKKDxY56-j-ruyO8o,6254
 biopipen/scripts/scrna/Seurat2AnnData.R,sha256=qz4u-B5J3GMwttubnNnByJXreziFbrP5Mak0L0q7eG0,1557
 biopipen/scripts/scrna/SeuratClusterStats-dimplots.R,sha256=gViDgQ8NorYD64iK0FgcODOrDOw0tExZmhuPRuLNp4g,2354
 biopipen/scripts/scrna/SeuratClusterStats-features.R,sha256=SaKTJloP1fttRXZQeb2ApX0ej7al13wOoEYkthSk13k,15489
@@ -147,7 +147,7 @@ biopipen/scripts/scrna/SeuratFilter.R,sha256=BrYK0MLdaTtQvInMaQsmOt7oH_hlks0M1zy
 biopipen/scripts/scrna/SeuratLoading.R,sha256=ekWKnHIqtQb3kHVQiVymAHXXqiUxs6KKefjZKjaykmk,900
 biopipen/scripts/scrna/SeuratMap2Ref.R,sha256=Xn3VnvKqShuC0Ju05380wjuLVSdW0uWVzntdxjme244,4359
 biopipen/scripts/scrna/SeuratMetadataMutater.R,sha256=Pp4GsF3hZ6ZC2vroC3LSBmVa4B1p2L3hbh981yaAIeQ,1093
-biopipen/scripts/scrna/SeuratPreparing.R,sha256=cgXWon2it6g4y-yrYk_zhivViOX8ZVf36u3wb9lKtj0,13133
+biopipen/scripts/scrna/SeuratPreparing.R,sha256=c_aBM0mugBNyYJ5OjNVDR_Cj0sGqkiJZXCOk3pesFDk,16990
 biopipen/scripts/scrna/SeuratSplit.R,sha256=vdK11V39_Uo_NaOh76QWCtxObGaEr5Ynxqq0hTiSvsU,754
 biopipen/scripts/scrna/SeuratSubClustering.R,sha256=L1SwKhNNKvsQGrcj0ZjScW9BLuvdO2pg7U48Ospsot8,6096
 biopipen/scripts/scrna/SeuratSubset.R,sha256=yVA11NVE2FSSw-DhxQcJRapns0tNNHdyDYi5epO6SKM,1776
@@ -160,9 +160,9 @@ biopipen/scripts/scrna_metabolic_landscape/MetabolicFeatures.R,sha256=b77yG5FeRs
 biopipen/scripts/scrna_metabolic_landscape/MetabolicFeaturesIntraSubset.R,sha256=ic8Fy8QqYDGh_izmvZVJ3KL66podg_CSF5ITL3FZsvo,5196
 biopipen/scripts/scrna_metabolic_landscape/MetabolicPathwayActivity.R,sha256=95DLX1Rz0tobOuDZ8V9YdGgO0KiNthhccoeeOK21tno,16216
 biopipen/scripts/scrna_metabolic_landscape/MetabolicPathwayHeterogeneity.R,sha256=rQ9iwGh9FNRZlJJzM4QItdyXmebfzLAq05ZAjb1kGUw,9831
-biopipen/scripts/snp/PlinkSimulation.py,sha256=h5ZArLGi45ZNrhuW1ExyJ7-4BQ7tbucmwn63BktN5pU,2667
+biopipen/scripts/snp/PlinkSimulation.py,sha256=mSSoGGG6sbEPBcUGdHgbebUrg4DiHeyNyc7jLPjV5pY,4169
 biopipen/scripts/stats/ChowTest.R,sha256=4p7NULmfOZSfeBSQ04els0h3cXOK5yeCJJ4-gEBPOGk,3617
-biopipen/scripts/stats/DiffCoexpr.R,sha256=rSxNf_nhyviubGknyHFkyIY0PlXIRfqYUDbZIoTrk0c,4513
+biopipen/scripts/stats/DiffCoexpr.R,sha256=5hQDV2_7bKdKUsOGMZUa0GS5rc7kFspxonNyFEPmtbc,4516
 biopipen/scripts/stats/LiquidAssoc.R,sha256=s-XJbFoOfH4eWSkxbbOSHZ1x16lY0Sdod_V1KvSkM8k,3727
 biopipen/scripts/stats/MetaPvalue.R,sha256=c26lYC4rxQ3D7vRvsXJ4_M-QIYTDTV8AEjXrag2_srU,3957
 biopipen/scripts/tcgamaf/Maf2Vcf.py,sha256=Cxh7fiSNCxWDTfIJqZDOOnaSrw-85S_fH2U-PWY03hc,704
@@ -170,7 +170,7 @@ biopipen/scripts/tcgamaf/MafAddChr.py,sha256=V10HMisl12O3ZfXuRmFNdy5p-3mr43WCvy0
 biopipen/scripts/tcgamaf/maf2vcf.pl,sha256=hJKcH-NbgWK6fmK7f3qex7ozJJl-PqCNPXqpwfcHwJg,22707
 biopipen/scripts/tcr/Attach2Seurat.R,sha256=C91TAh1cLSxWkdFPf84pbxlpTYMuWq_rduG4eiIkXZI,1345
 biopipen/scripts/tcr/CDR3AAPhyschem.R,sha256=-0BS6cdt5GfQJphA3HlDgGjWr4XFF-7INLJyMBHQNAc,16628
-biopipen/scripts/tcr/CloneResidency.R,sha256=2_GC2snbFsoYf9AzFPkAttabp4HmT_EIsolGbq5HEOY,21047
+biopipen/scripts/tcr/CloneResidency.R,sha256=nFPPPknJPEX-RU16uqQZzYMmJqmWqUAun_FI8GpJ7iw,21520
 biopipen/scripts/tcr/CloneSizeQQPlot.R,sha256=5FPfWQjxTsv59KSDQaDWj3C95zPQMngKG7qOf95NEzI,4527
 biopipen/scripts/tcr/GIANA/GIANA.py,sha256=0qLhgCWxT8K-4JvORA03CzBPTT5pd4Di5B_DgrHXbFA,47198
 biopipen/scripts/tcr/GIANA/GIANA4.py,sha256=Z7Q3cUr1Pvmy4CFADN0P7i9g1-HbzWROMqk5HvL_F1Q,45762
@@ -193,6 +193,7 @@ biopipen/scripts/tcr/ImmunarchSplitIdents.R,sha256=FGCeGV0uSmFU91lKkldUAeV4A2m3h
 biopipen/scripts/tcr/SampleDiversity.R,sha256=jQ1OU3b8vswD8tZhLt3fkcqJKrl2bhQX0giHM2rXz3Y,2643
 biopipen/scripts/tcr/TCRClusterStats.R,sha256=D7q1svXQxl1uOya8bePvR9e6NJXjCjXbPsXnEPTWdlE,12004
 biopipen/scripts/tcr/TCRClustering.R,sha256=eflUsYfq4aEaX9BVL0MiB7lNlot_L-8VaReK516go84,9236
+biopipen/scripts/tcr/TCRDock.py,sha256=jjzxMWp-hs0LDtA1mVbiWDvUieSO7X-F9yeKGy1LSTM,3026
 biopipen/scripts/tcr/TESSA.R,sha256=bfOixWLZy8yi0MzXncP67KjtCukwXEzsK5fCdMzB5VM,6822
 biopipen/scripts/tcr/TESSA_source/Atchley_factors.csv,sha256=SumqDOqP67P54uM7Cuc5_O_rySTWcGo7eX3psMSPX9s,763
 biopipen/scripts/tcr/TESSA_source/BriseisEncoder.py,sha256=z4_Q_6StymffuUGGjHP1-B3aTsXtamKao5Q1-Kg9has,6831
@@ -230,14 +231,14 @@ biopipen/utils/gene.py,sha256=qE_BqTayrJWxRdniffhcz6OhZcw9GUoOrj2EtFWH9Gw,2246
 biopipen/utils/gsea.R,sha256=UMQOlWGstQTOBScvy1wIzrB7I3CE28Xo2v1sy4lmJ-M,7549
 biopipen/utils/io.R,sha256=jIYdqdn0iRWfQYAZa5CjXi3fikqmYvPPLIXhobRe8sw,537
 biopipen/utils/misc.R,sha256=jXusPDCxSIaYRq_qm4khUsu9nyMhbpBVcj8BVn4j8Ic,10629
-biopipen/utils/misc.py,sha256=BpqPVgp_IlsUZow5P4mEtbPMjhO_vEb5atrF7iJ_xhU,3509
+biopipen/utils/misc.py,sha256=KJziAFY4Kl-0ZsO93vteY9gRLZg9BSYig-TDocHY36k,3601
 biopipen/utils/mutate_helpers.R,sha256=Bqy6Oi4rrPEPJw0Jq32bVAwwBfZv7JJL9jFcK5x-cek,17649
 biopipen/utils/plot.R,sha256=pzl37PomNeUZPxohHZ2w93j3Fc4T0Qrc62FF-9MTKdw,4417
 biopipen/utils/reference.py,sha256=6bPSwQa-GiDfr7xLR9a5T64Ey40y24yn3QfQ5wDFZkU,4420
 biopipen/utils/rnaseq.R,sha256=Ro2B2dG-Z2oVaT5tkwp9RHBz4dp_RF-JcizlM5GYXFs,1298
 biopipen/utils/single_cell.R,sha256=pJjYP8bIZpNAtTQ32rOXhZxaM1Y-6D-xUcK3pql9tbk,4316
 biopipen/utils/vcf.py,sha256=ajXs0M_QghEctlvUlSRjWQIABVF02wPdYd-0LP4mIsU,9377
-biopipen-0.27.1.dist-info/METADATA,sha256=qF5h3mchRggnLrHS421nr82vFQao-82FEarAbk-HeK0,878
-biopipen-0.27.1.dist-info/WHEEL,sha256=sP946D7jFCHeNz5Iq4fL4Lu-PrWrFsgfLXbbkciIZwg,88
-biopipen-0.27.1.dist-info/entry_points.txt,sha256=wu70aoBcv1UahVbB_5237MY-9M9_mzqmWjDD-oi3yz0,621
-biopipen-0.27.1.dist-info/RECORD,,
+biopipen-0.27.3.dist-info/METADATA,sha256=4DeAjhBZHdg7pZXoTNPiQkzGsx6hSm7VwgWgyYKMY18,920
+biopipen-0.27.3.dist-info/WHEEL,sha256=sP946D7jFCHeNz5Iq4fL4Lu-PrWrFsgfLXbbkciIZwg,88
+biopipen-0.27.3.dist-info/entry_points.txt,sha256=wu70aoBcv1UahVbB_5237MY-9M9_mzqmWjDD-oi3yz0,621
+biopipen-0.27.3.dist-info/RECORD,,

{biopipen-0.27.1.dist-info → biopipen-0.27.3.dist-info}/WHEEL RENAMED Viewed

File without changes

{biopipen-0.27.1.dist-info → biopipen-0.27.3.dist-info}/entry_points.txt RENAMED Viewed

File without changes

biopipen 0.27.1__py3-none-any.whl → 0.27.3__py3-none-any.whl

Potentially problematic release.

biopipen 0.27.1__py3-none-any.whl → 0.27.3__py3-none-any.whl