RubyGems - miga-base - Versions diffs - 0.4.3.0 → 0.5.0.0 - Mend

miga-base 0.4.3.0 → 0.5.0.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (120)

checksums.yaml +4 -4
data/README.md +1 -1
data/lib/miga/cli.rb +43 -223
data/lib/miga/cli/action/add.rb +91 -62
data/lib/miga/cli/action/classify_wf.rb +97 -0
data/lib/miga/cli/action/daemon.rb +14 -10
data/lib/miga/cli/action/derep_wf.rb +95 -0
data/lib/miga/cli/action/doctor.rb +83 -55
data/lib/miga/cli/action/get.rb +68 -52
data/lib/miga/cli/action/get_db.rb +206 -0
data/lib/miga/cli/action/index_wf.rb +31 -0
data/lib/miga/cli/action/init.rb +115 -190
data/lib/miga/cli/action/init/daemon_helper.rb +124 -0
data/lib/miga/cli/action/ls.rb +20 -11
data/lib/miga/cli/action/ncbi_get.rb +199 -157
data/lib/miga/cli/action/preproc_wf.rb +46 -0
data/lib/miga/cli/action/quality_wf.rb +45 -0
data/lib/miga/cli/action/stats.rb +147 -99
data/lib/miga/cli/action/summary.rb +10 -4
data/lib/miga/cli/action/tax_dist.rb +61 -46
data/lib/miga/cli/action/tax_test.rb +46 -39
data/lib/miga/cli/action/wf.rb +178 -0
data/lib/miga/cli/base.rb +11 -0
data/lib/miga/cli/objects_helper.rb +88 -0
data/lib/miga/cli/opt_helper.rb +160 -0
data/lib/miga/daemon.rb +7 -4
data/lib/miga/dataset/base.rb +5 -5
data/lib/miga/project/base.rb +4 -4
data/lib/miga/project/result.rb +2 -1
data/lib/miga/remote_dataset/base.rb +5 -5
data/lib/miga/remote_dataset/download.rb +1 -1
data/lib/miga/version.rb +3 -3
data/scripts/cds.bash +3 -1
data/scripts/essential_genes.bash +1 -0
data/scripts/stats.bash +1 -1
data/scripts/trimmed_fasta.bash +5 -3
data/utils/distance/runner.rb +3 -0
data/utils/distance/temporal.rb +10 -1
data/utils/enveomics/Manifest/Tasks/fasta.json +5 -0
data/utils/enveomics/Manifest/Tasks/sequence-identity.json +7 -0
data/utils/enveomics/Scripts/BlastTab.addlen.rb +33 -31
data/utils/enveomics/Scripts/FastA.tag.rb +42 -41
data/utils/enveomics/Scripts/HMM.essential.rb +85 -55
data/utils/enveomics/Scripts/HMM.haai.rb +29 -20
data/utils/enveomics/Scripts/SRA.download.bash +1 -1
data/utils/enveomics/Scripts/aai.rb +163 -128
data/utils/enveomics/build_enveomics_r.bash +11 -10
data/utils/enveomics/enveomics.R/DESCRIPTION +3 -2
data/utils/enveomics/enveomics.R/R/autoprune.R +141 -107
data/utils/enveomics/enveomics.R/R/barplot.R +105 -86
data/utils/enveomics/enveomics.R/R/cliopts.R +131 -115
data/utils/enveomics/enveomics.R/R/df2dist.R +144 -106
data/utils/enveomics/enveomics.R/R/growthcurve.R +201 -133
data/utils/enveomics/enveomics.R/R/recplot.R +350 -315
data/utils/enveomics/enveomics.R/R/recplot2.R +1334 -914
data/utils/enveomics/enveomics.R/R/tribs.R +521 -361
data/utils/enveomics/enveomics.R/R/utils.R +31 -15
data/utils/enveomics/enveomics.R/README.md +7 -0
data/utils/enveomics/enveomics.R/man/cash-enve.GrowthCurve-method.Rd +17 -0
data/utils/enveomics/enveomics.R/man/cash-enve.RecPlot2-method.Rd +17 -0
data/utils/enveomics/enveomics.R/man/cash-enve.RecPlot2.Peak-method.Rd +17 -0
data/utils/enveomics/enveomics.R/man/enve.GrowthCurve-class.Rd +16 -21
data/utils/enveomics/enveomics.R/man/enve.TRIBS-class.Rd +31 -28
data/utils/enveomics/enveomics.R/man/enve.TRIBS.merge.Rd +23 -19
data/utils/enveomics/enveomics.R/man/enve.TRIBStest-class.Rd +36 -26
data/utils/enveomics/enveomics.R/man/enve.__prune.iter.Rd +23 -24
data/utils/enveomics/enveomics.R/man/enve.__prune.reduce.Rd +23 -24
data/utils/enveomics/enveomics.R/man/enve.__tribs.Rd +32 -33
data/utils/enveomics/enveomics.R/man/enve.barplot.Rd +91 -64
data/utils/enveomics/enveomics.R/man/enve.cliopts.Rd +57 -37
data/utils/enveomics/enveomics.R/man/enve.col.alpha.Rd +24 -19
data/utils/enveomics/enveomics.R/man/enve.col2alpha.Rd +19 -18
data/utils/enveomics/enveomics.R/man/enve.df2dist.Rd +39 -26
data/utils/enveomics/enveomics.R/man/enve.df2dist.group.Rd +38 -25
data/utils/enveomics/enveomics.R/man/enve.df2dist.list.Rd +40 -26
data/utils/enveomics/enveomics.R/man/enve.growthcurve.Rd +67 -49
data/utils/enveomics/enveomics.R/man/enve.prune.dist.Rd +37 -28
data/utils/enveomics/enveomics.R/man/enve.recplot.Rd +122 -97
data/utils/enveomics/enveomics.R/man/enve.recplot2-class.Rd +35 -31
data/utils/enveomics/enveomics.R/man/enve.recplot2.ANIr.Rd +24 -23
data/utils/enveomics/enveomics.R/man/enve.recplot2.Rd +68 -51
data/utils/enveomics/enveomics.R/man/enve.recplot2.__counts.Rd +25 -24
data/utils/enveomics/enveomics.R/man/enve.recplot2.__peakHist.Rd +21 -22
data/utils/enveomics/enveomics.R/man/enve.recplot2.__whichClosestPeak.Rd +19 -20
data/utils/enveomics/enveomics.R/man/enve.recplot2.changeCutoff.Rd +19 -18
data/utils/enveomics/enveomics.R/man/enve.recplot2.compareIdentities.Rd +41 -32
data/utils/enveomics/enveomics.R/man/enve.recplot2.coordinates.Rd +29 -24
data/utils/enveomics/enveomics.R/man/enve.recplot2.corePeak.Rd +18 -18
data/utils/enveomics/enveomics.R/man/enve.recplot2.extractWindows.Rd +40 -34
data/utils/enveomics/enveomics.R/man/enve.recplot2.findPeaks.Rd +36 -24
data/utils/enveomics/enveomics.R/man/enve.recplot2.findPeaks.__em_e.Rd +19 -20
data/utils/enveomics/enveomics.R/man/enve.recplot2.findPeaks.__em_m.Rd +19 -20
data/utils/enveomics/enveomics.R/man/enve.recplot2.findPeaks.__emauto_one.Rd +27 -29
data/utils/enveomics/enveomics.R/man/enve.recplot2.findPeaks.__mow_one.Rd +41 -42
data/utils/enveomics/enveomics.R/man/enve.recplot2.findPeaks.__mower.Rd +17 -18
data/utils/enveomics/enveomics.R/man/enve.recplot2.findPeaks.em.Rd +43 -33
data/utils/enveomics/enveomics.R/man/enve.recplot2.findPeaks.emauto.Rd +36 -28
data/utils/enveomics/enveomics.R/man/enve.recplot2.findPeaks.mower.Rd +74 -56
data/utils/enveomics/enveomics.R/man/enve.recplot2.peak-class.Rd +44 -31
data/utils/enveomics/enveomics.R/man/enve.recplot2.seqdepth.Rd +27 -22
data/utils/enveomics/enveomics.R/man/enve.recplot2.windowDepthThreshold.Rd +32 -26
data/utils/enveomics/enveomics.R/man/enve.tribs.Rd +59 -44
data/utils/enveomics/enveomics.R/man/enve.tribs.test.Rd +28 -21
data/utils/enveomics/enveomics.R/man/enve.truncate.Rd +27 -22
data/utils/enveomics/enveomics.R/man/plot.enve.GrowthCurve.Rd +63 -43
data/utils/enveomics/enveomics.R/man/plot.enve.TRIBS.Rd +38 -29
data/utils/enveomics/enveomics.R/man/plot.enve.TRIBStest.Rd +38 -30
data/utils/enveomics/enveomics.R/man/plot.enve.recplot2.Rd +111 -83
data/utils/enveomics/enveomics.R/man/summary.enve.GrowthCurve.Rd +19 -18
data/utils/enveomics/enveomics.R/man/summary.enve.TRIBS.Rd +19 -18
data/utils/enveomics/enveomics.R/man/summary.enve.TRIBStest.Rd +19 -18
data/utils/find-medoid.R +3 -2
data/utils/representatives.rb +5 -3
data/utils/subclade/pipeline.rb +22 -11
data/utils/subclade/runner.rb +5 -1
data/utils/subclades-compile.rb +1 -1
data/utils/subclades.R +9 -3
metadata +15 -4
data/utils/enveomics/enveomics.R/man/enveomics.R-package.Rd +0 -15
data/utils/enveomics/enveomics.R/man/z$-methods.Rd +0 -26

data/utils/enveomics/enveomics.R/R/growthcurve.R CHANGED

@@ -1,74 +1,105 @@
 #==============> Define S4 classes
-setClass("enve.GrowthCurve",
-  ### Enve-omics representation of fitted growth curves.
-  representation(
-  design  = "array", ##<< Experimental design of the experiment.
-  models  = "list",  ##<< Fitted growth curve models.
-  predict = "list",  ##<< Fitted growth curve values.
-  call='call')       ##<< Call producing this object.
-  ,package='enveomics.R');
+#' Enveomics: Growth Curve S4 Class
+#'
+#' Enve-omics representation of fitted growth curves.
+#'
+#' @slot design \code{(array)} Experimental design of the experiment.
+#' @slot models \code{(list)} Fitted growth curve models.
+#' @slot predict \code{(list)} Fitted growth curve values.
+#' @slot call \code{(call)} Call producing this object.
+#'
+#' @author Luis M. Rodriguez-R [aut, cre]
+#'
+#' @exportClass enve.GrowthCurve
+enve.GrowthCurve <- setClass("enve.GrowthCurve",
+                             representation(
+                               design  = "array",
+                               models  = "list",
+                               predict = "list",
+                               call='call')
+                             ,package='enveomics.R');
+#' Attribute accessor
+#'
+#' @param x Object
+#' @param name Attribute name
 setMethod("$", "enve.GrowthCurve", function(x, name) attr(x, name))
+#' Enveomics: Plot of Growth Curve
+#'
+#' Plots an \code{\link{enve.GrowthCurve}} object.
+#'
+#' @param x An \code{\link{enve.GrowthCurve}} object to plot.
+#' @param col Base colors to use for the different samples. Can be recycled.
+#' By default, grey for one sample or rainbow colors for more than one.
+#' @param pt.alpha Color alpha for the observed data points, using \code{col}
+#' as a base.
+#' @param ln.alpha Color alpha for the fitted growth curve, using \code{col}
+#' as a base.
+#' @param ln.lwd Line width for the fitted curve.
+#' @param ln.lty Line type for the fitted curve.
+#' @param band.alpha Color alpha for the confidence interval band of the
+#' fitted growth curve, using \code{col} as a base.
+#' @param band.density Density of the filling pattern in the interval band.
+#' If \code{NULL}, a solid color is used.
+#' @param band.angle Angle of the density filling pattern in the interval
+#' band. Ignored if \code{band.density} is \code{NULL}.
+#' @param xp.alpha Color alpha for the line connecting individual experiments,
+#' using \code{col} as a base.
+#' @param xp.lwd Width of line for the experiments.
+#' @param xp.lty Type of line for the experiments.
+#' @param pch Point character for observed data points.
+#' @param new Should a new plot be generated? If \code{FALSE}, the existing
+#' canvas is used.
+#' @param legend Should the plot include a legend? If \code{FALSE}, no legend
+#' is added. If \code{TRUE}, a legend is added in the bottom-right corner.
+#' Otherwise, a legend is added in the position specified as \code{xy.coords}.
+#' @param add.params Should the legend include the parameters of the fitted
+#' model?
+#' @param ... Any other graphic parameters.
+#'
+#' @author Luis M. Rodriguez-R [aut, cre]
+#'
+#' @method plot enve.GrowthCurve
+#' @export
 #==============> Define S4 methods
 plot.enve.GrowthCurve <- function
-  ### Plots an `enve.GrowthCurve` object.
-    (x,
-    ### `enve.GrowthCurve` object to plot.
-    col,
-    ### Base colors to use for the different samples. Can be recycled. By
-    ### default, grey for one sample or rainbow colors for more than one.
-    pt.alpha=0.9,
-    ### Color alpha for the observed data points, using `col` as a base.
-    ln.alpha=1.0,
-    ### Color alpha for the fitted growth curve, using `col` as a base.
-    ln.lwd=1,
-    ### Line width for the fitted curve.
-    ln.lty=1,
-    ### Line type for the fitted curve.
-    band.alpha=0.4,
-    ### Color alpha for the confidence interval band of the fitted growth curve,
-    ### using `col` as a base.
-    band.density=NULL,
-    ### Density of the filling pattern in the interval band. If NULL, a solid
-    ### color is used.
-    band.angle=45,
-    ### Angle of the density filling pattern in the interval band. Ignored if
-    ### `band.density` is NULL.
-    xp.alpha=0.5,
-    ### Color alpha for the line connecting individual experiments, using `col`
-    ### as a base.
-    xp.lwd=1,
-    ### Width of line for the experiments.
-    xp.lty=1,
-    ### Type of line for the experiments.
-    pch=19,
-    ### Point character for observed data points.
-    new=TRUE,
-    ### Should a new plot be generated? If FALSE, the existing canvas is used.
-    legend=new,
-    ### Should the plot include a legend? If FALSE, no legend is added. If TRUE,
-    ### a legend is added in the bottom-right corner. Otherwise, a legend is
-    ### added in the position specified as `xy.coords`.
-    add.params=FALSE,
-    ### Should the legend include the parameters of the fitted model?
-    ...
-    ### Any other graphic parameters.
-  ){
+(x,
+ col,
+ pt.alpha=0.9,
+ ln.alpha=1.0,
+ ln.lwd=1,
+ ln.lty=1,
+ band.alpha=0.4,
+ band.density=NULL,
+ band.angle=45,
+ xp.alpha=0.5,
+ xp.lwd=1,
+ xp.lty=1,
+ pch=19,
+ new=TRUE,
+ legend=new,
+ add.params=FALSE,
+ ...
+){
   # Arguments
   if(missing(col)){
     col <-
       if(length(x$design)==0) grey(0.2)
-      else rainbow(length(x$design), v=3/5, s=3/5)
+    else rainbow(length(x$design), v=3/5, s=3/5)
   }
   if(new){
     # Initiate canvas
     od.fit.max <- max(sapply(x$predict, function(x) max(x[,"upr"])))
     od.obs.max <- max(sapply(x$models, function(x) max(x$data[,"od"])))
     opts <- list(...)
     plot.defaults <- list(xlab="Time", ylab="Density",
-      xlim=range(x$predict[[1]][,"t"]), ylim=c(0, max(od.fit.max, od.obs.max)))
+                          xlim=range(x$predict[[1]][,"t"]), ylim=c(0, max(od.fit.max, od.obs.max)))
     for(i in names(plot.defaults)){
       if(is.null(opts[[i]])) opts[[i]] <- plot.defaults[[i]]
     }
@@ -76,7 +107,7 @@ plot.enve.GrowthCurve <- function
     opts[["type"]] <- "n"
     do.call(plot, opts)
   }
   # Graphic default
   pch <- rep(pch, length.out=length(x$design))
   col <- rep(col, length.out=length(x$design))
@@ -102,8 +133,8 @@ plot.enve.GrowthCurve <- function
       d <- x$predict[[i]]
       lines(d[,"t"], d[,"fit"], col=ln.col[i], lwd=ln.lwd, lty=ln.lty)
       polygon(c(d[,"t"], rev(d[,"t"])), c(d[,"lwr"], rev(d[,"upr"])),
-        border=NA, col=band.col[i], density=band.density[i],
-        angle=band.angle[i])
+              border=NA, col=band.col[i], density=band.density[i],
+              angle=band.angle[i])
     }
   }
@@ -113,87 +144,117 @@ plot.enve.GrowthCurve <- function
     if(add.params){
       for(p in names(coef(x$models[[1]]))){
         legend.txt <- paste(legend.txt, ", ", p, "=",
-          sapply(x$models, function(x) signif(coef(x)[p],2)) , sep="")
+                            sapply(x$models, function(x) signif(coef(x)[p],2)) , sep="")
       }
     }
     legend(legend, legend=legend.txt, pch=pch, col=ln.col)
   }
 }
-summary.enve.GrowthCurve <- function(
-    ### Summary of an `enve.GrowthCurve` object.
-    object,
-    ### `enve.GrowthCurve` object.
-    ...
-    ### No additional parameters are currently supported.
-  ){
+#' Enveomics: Summary of Growth Curve
+#'
+#' Summary of an \code{\link{enve.GrowthCurve}} object.
+#'
+#' @param object An \code{\link{enve.GrowthCurve}} object.
+#' @param ... No additional parameters are currently supported.
+#'
+#' @author Luis M. Rodriguez-R [aut, cre]
+#'
+#' @method summary enve.GrowthCurve
+#' @export
+summary.enve.GrowthCurve <- function(
+  object,
+  ...
+){
   x <- object
   cat('===[ enve.GrowthCurves ]------------------\n')
   for(i in names(x$design)){
-     cat(i, ':\n', sep='')
-     if(x$models[[i]]$convInfo$isConv){
-       for(j in names(coef(x$models[[i]]))){
-         cat('  - ', j, ' = ', coef(x$models[[i]])[j], '\n', sep='')
-       }
-     }else{
-       cat('  Model didn\'t converge:\n    ',
-         x$models[[i]]$convInfo$stopMessage, '\n', sep='')
-     }
-     cat('  ', nrow(x$models[[i]]$data), ' observations, ',
-       length(unique(x$models[[i]]$data[,"replicate"])), ' replicates.\n',
-       sep='')
+    cat(i, ':\n', sep='')
+    if(x$models[[i]]$convInfo$isConv){
+      for(j in names(coef(x$models[[i]]))){
+        cat('  - ', j, ' = ', coef(x$models[[i]])[j], '\n', sep='')
+      }
+    }else{
+      cat('  Model didn\'t converge:\n    ',
+          x$models[[i]]$convInfo$stopMessage, '\n', sep='')
+    }
+    cat('  ', nrow(x$models[[i]]$data), ' observations, ',
+        length(unique(x$models[[i]]$data[,"replicate"])), ' replicates.\n',
+        sep='')
   }
   cat('------------------------------------------\n')
   cat('call:',as.character(attr(x,'call')),'\n')
   cat('------------------------------------------\n')
 }
+#' Enveomics: Growth Curve
+#'
+#' Calculates growth curves using the logistic growth function.
+#'
+#' @param x Data frame (or coercible) containing the observed growth data
+#' (e.g., O.D. values). Each column is an independent growth curve and each
+#' row is a time point. \code{NA}'s are allowed.
+#' @param times Vector with the times at which each row was taken. By default,
+#' all rows are assumed to be part of constantly periodic measurements.
+#' @param triplicates If \code{TRUE}, the columns are assumed to be sorted by
+#' sample with three replicates by sample. It requires a number of columns
+#' multiple of 3.
+#' @param design Experimental design of the data. An \strong{array} of mode list
+#' with sample names as index and the list of column names in each sample as
+#' the values. By default, each column is assumed to be an independent sample
+#' if \code{triplicates} is \code{FALSE}, or every three columns are assumed
+#' to be a sample if \code{triplicates} is \code{TRUE}. In the latter case,
+#' samples are simply numbered.
+#' @param new.times Values of time for the fitted curve.
+#' @param level Confidence (or prediction) interval in the fitted curve.
+#' @param interval Type of interval to be calculated for the fitted curve.
+#' @param plot Should the growth curve be plotted?
+#' @param FUN Function to fit. By default: logistic growth with parameters
+#' \code{K}: carrying capacity,
+#' \code{r}: intrinsic growth rate, and
+#' \code{P0}: Initial population.
+#' @param nls.opt Any additional options passed to \code{nls}.
+#' @param ... Any additional parameters to be passed to
+#' \code{plot.enve.GrowthCurve}.
+#'
+#' @return Returns an \code{\link{enve.GrowthCurve}} object.
+#'
+#' @author Luis M. Rodriguez-R [aut, cre]
+#'
+#' @examples
+#' # Load data
+#' data("growth.curves", package="enveomics.R", envir=environment())
+#' # Generate growth curves with different colors
+#' g <- enve.growthcurve(growth.curves[,-1], growth.curves[,1], triplicates=TRUE)
+#' # Generate black-and-white growth curves with different symbols
+#' plot(g, pch=15:17, col="black", band.density=45, band.angle=c(-45,45,0))
+#'
+#' @export
 #==============> Core functions
 enve.growthcurve <- structure(function(
-  ### Calculates growth curves using the logistic growth function.
-    x,
-    ### Data frame (or coercible) containing the observed growth data (e.g.,
-    ### O.D. values). Each column is an independent growth curve and each
-    ### row is a time point. NA's are allowed.
-    times=1:nrow(x),
-    ### Vector with the times at which each row was taken. By default, all
-    ### rows are assumed to be part of constantly periodic measurements.
-    triplicates=FALSE,
-    ### If TRUE, the columns are assumed to be sorted by sample with three
-    ### replicates by sample. It requires a number of columns multiple of 3.
-    design,
-    ### Experimental design of the data. An `array` of mode list with sample
-    ### names as index and the list of column names in each sample as the
-    ### values. By default, each column is assumed to be an independent sample
-    ### if `triplicates` is FALSE, or every three columns are assumed to be a
-    ### sample if `triplicates` is TRUE. In the latter case, samples are
-    ### simply numbered.
-    new.times=seq(min(times), max(times), length.out=length(times)*10),
-    ### Values of time for the fitted curve.
-    level=0.95,
-    ### Confidence (or prediction) interval in the fitted curve.
-    interval=c("confidence","prediction"),
-    ### Type of interval to be calculated for the fitted curve.
-    plot=TRUE,
-    ### Should the growth curve be plotted?
-    FUN=function(t,K,r,P0) K*P0*exp(r*t)/(K+P0*(exp(r*t)-1)),
-    ### Function to fit. By default: logistic growth with paramenters `K`:
-    ### carrying capacity, `r`: intrinsic growth rate, and `P0`: Initial
-    ### population.
-    nls.opt=list(),
-    ### Any additional options passed to `nls`.
-    ...
-    ### Any additional parameters to be passed to `plot.enve.GrowthCurve`.
-  ){
+  x,
+  times=1:nrow(x),
+  triplicates=FALSE,
+  design,
+  new.times=seq(min(times), max(times), length.out=length(times)*10),
+  level=0.95,
+  interval=c("confidence","prediction"),
+  plot=TRUE,
+  FUN=function(t,K,r,P0) K*P0*exp(r*t)/(K+P0*(exp(r*t)-1)),
+  nls.opt=list(),
+  ...
+){
   # Arguments
   if(missing(design)){
     design <-
       if(triplicates)
         tapply(colnames(x), colnames(x)[rep(1:(ncol(x)/3)*3-2, each=3)], c,
-          simplify=FALSE)
-      else tapply(colnames(x), colnames(x), c, simplify=FALSE)
+               simplify=FALSE)
+    else tapply(colnames(x), colnames(x), c, simplify=FALSE)
   }
   mod <- list()
   fit <- list()
@@ -207,18 +268,18 @@ enve.growthcurve <- structure(function(
       od <- c(od, x[,col])
     }
     data <- data.frame(t=rep(times, length(design[[sample]])), od=od,
-      replicate=rep(1:length(design[[sample]]), each=length(times)))
+                       replicate=rep(1:length(design[[sample]]), each=length(times)))
     data <- data[!is.na(data$od),]
     opts <- nls.opt
     opts[["data"]] <- data
     opt.defaults <- list(formula = od ~ enve._growth.fx(t, K, r, P0),
-      algorithm="port", lower=list(P0=1e-16),
-      control=nls.control(warnOnly=TRUE),
-      start=list(
-        K  = 2*max(data$od),
-        r  = length(times)/max(data$t),
-        P0 = min(data$od[data$od>0])
-      ))
+                         algorithm="port", lower=list(P0=1e-16),
+                         control=nls.control(warnOnly=TRUE),
+                         start=list(
+                           K  = 2*max(data$od),
+                           r  = length(times)/max(data$t),
+                           P0 = min(data$od[data$od>0])
+                         ))
     for(i in names(opt.defaults)){
       if(is.null(opts[[i]])){
         opts[[i]] <- opt.defaults[[i]]
@@ -226,16 +287,15 @@ enve.growthcurve <- structure(function(
     }
     mod[[sample]] <- do.call(nls, opts)
     fit[[sample]] <- cbind(t=new.times,
-      predFit(mod[[sample]], level=level, interval=interval,
-        newdata=data.frame(t=new.times)))
+                           predFit(mod[[sample]], level=level, interval=interval,
+                                   newdata=data.frame(t=new.times)))
   }
   enve._growth.fx <<- NULL
   gc <- new("enve.GrowthCurve",
-    design=design, models=mod, predict=fit,
-    call=match.call());
+            design=design, models=mod, predict=fit,
+            call=match.call());
   if(plot) plot(gc, ...);
   return(gc)
-  ### Returns an `enve.GrowthCurve` object.
 }, ex=function(){
   # Load data
   data("growth.curves", package="enveomics.R", envir=environment())
@@ -245,13 +305,21 @@ enve.growthcurve <- structure(function(
   plot(g, pch=15:17, col="black", band.density=45, band.angle=c(-45,45,0))
 });
+#' Enveomics: Color to Alpha
+#'
+#' Takes a vector of colors and sets the alpha.
+#'
+#' @param x A vector of base colors, in any form accepted by \code{col2rgb}.
+#' @param alpha Alpha level to set (in the 0-1 range).
+#'
+#' @author Luis M. Rodriguez-R [aut, cre]
+#'
+#' @export
 enve.col2alpha <- function(
-    ### Takes a vector of colors and sets the alpha.
-    x,
-    ### A vector of any value base colors.
-    alpha
-    ### Alpha level to set (in the 0-1 range).
-    ){
+  x,
+  alpha
+){
   out <- c()
   for(i in x){
     opt <- as.list(col2rgb(i)[,1]/256)

data/utils/enveomics/enveomics.R/R/recplot.R CHANGED

@@ -1,319 +1,354 @@
-enve.recplot <- structure(function(
-	### Produces recruitment plots provided that BlastTab.catsbj.pl has
-	### been previously executed. Requires the gplots library.
-	prefix,
-	### Path to the prefix of the BlastTab.catsbj.pl output files. At
-	### least the files .rec and .lim must exist with this prefix.
-	# Id. hist.
-	id.min=NULL,
-	### Minimum identity to be considered. By default, the minimum detected
-	### identity. This value is a percentage.
-	id.max=NULL,
-	### Maximum identity to be considered. By default, 100.
-	id.binsize=NULL,
-	### Size of the identity bins (vertical histograms). By default, 0.1 for
-	### identity metrics and 5 for bit score.
-	id.splines=0,
-	### Smoothing parameter for the splines in the identity histogram. Zero (0) for no
-	### splines. A generally good value is 1/2. If non-zero, requires the stats package.
-	id.metric='id',
-	### Metric of identity to be used (Y-axis). It can be any unambiguous prefix
-	### of "identity", "corrected identity", or "bit score".
-	id.summary='sum',
-	### Method used to build the identity histogram (Horizontal axis of the right panel).
-	### It can be any unambiguous prefix of "sum", "average", "median", "90% lower bound",
-	### "90% upper bound", "95% lower bound", and "95% upper bound". The last four options
-	### correspond to the upper and lower boundaries of the 90% and 95% empirical confidence
-	### intervals.
-	# Pos. hist.
-	pos.min=1,
-	### Minimum (leftmost) position in the reference (concatenated) genome (in bp).
-	pos.max=NULL,
-	### Maximum (rightmost) position in the reference (concatenated) genome (in bp).
-	### By default: Length of the genome.
-	pos.binsize=1e3,
-	### Size of the position bins (horizontal histograms) in bp.
-	pos.splines=0,
-	### Smoothing parameter for the splines in the position histogram. Zero (0) for no splines.
-	### If non-zero, requires the stats package.
-	# Rec. plot
-	rec.col1='white',
-	### Lightest color in the recruitment plot.
-	rec.col2='black',
-	### Darkest color in the recruitment plot.
-	# General
-	main=NULL,
-	### Title of the plot.
-	contig.col=grey(0.85),
-	### Color of the Contig boundaries. Set to NA to ignore Contig boundaries.
-	# Return
-	ret.recplot=FALSE,
-	### Indicates if the matrix of the recruitment plot is to be returned.
-	ret.hist=FALSE,
-	### Ignored, for backwards compatibility.
-	ret.mode=FALSE,
-	### Indicates if the mode of the identity is to be computed. It requires the modeest
-	### package.
-	# General
-	id.cutoff=NULL,
-	### Minimum identity to consider an alignment as "top". By default, it is 0.95 for the
-	### identity metrics and 95% of the best scoring alignment for bit score.
-	verbose=TRUE,
-	### Indicates if the function should report the advance.
-	...
-	### Any additional graphic parameters to be passed to plot for all panels except the
-	### recruitment plot (lower-left).
-	){
-   # Settings
-   METRICS <- c('identity', 'corrected identity', 'bit score');
-   SUMMARY <- c('sum', 'average', 'median', '');
-   if(is.null(prefix)) stop('Parameter prefix is mandatory.');
-   if(!requireNamespace("gplots", quietly=TRUE)) stop('Unavailable gplots library.');
-   # Read files
-   if(verbose) cat("Reading files.\n")
-   rec <- read.table(paste(prefix, '.rec', sep=''), sep="\t", comment.char='', quote='');
-   lim <- read.table(paste(prefix, '.lim', sep=''), sep="\t", comment.char='', quote='');
-   # Configure ID summary
-   id.summary <- pmatch(id.summary, SUMMARY);
-   if(is.na(id.summary)) stop('Invalid identity summary.');
-   if(id.summary == -1) stop('Ambiguous identity summary.');
-   if(id.summary==1){
-      id.summary.func <- function(x) colSums(x);
-      id.summary.name <- 'sum'
-   }else if(id.summary==2){
-      id.summary.func <- function(x) colMeans(x);
-      id.summary.name <- 'mean'
-   }else if(id.summary==3){
-      id.summary.func <- function(x) apply(x,2,median);
-      id.summary.name <- 'median'
-   }else if(id.summary==4){
-      id.summary.func <- function(x) apply(x,2,quantile,probs=0.05,names=FALSE);
-      id.summary.name <- '90% LB'
-   }else if(id.summary==5){
-      id.summary.func <- function(x) apply(x,2,quantile,probs=0.95,names=FALSE);
-      id.summary.name <- '90% UB'
-   }else if(id.summary==6){
-      id.summary.func <- function(x) apply(x,2,quantile,probs=0.025,names=FALSE);
-      id.summary.name <- '95% LB'
-   }else if(id.summary==7){
-      id.summary.func <- function(x) apply(x,2,quantile,probs=0.975,names=FALSE);
-      id.summary.name <- '95% UB'
-   }
-   # Configure metrics
-   id.metric <- pmatch(id.metric, METRICS);
-   if(is.na(id.metric)) stop('Invalid identity metric.');
-   if(id.metric == -1) stop('Ambiguous identity metric.');
-   if(id.metric==1){
-      id.reccol <- 3
-      id.shortname <- 'Id.'
-      id.fullname  <- 'Identity'
-      id.units     <- '%'
-      id.hallmarks <- seq(0, 100, by=5)
-      if(is.null(id.max)) id.max <- 100
-      if(is.null(id.cutoff)) id.cutoff <- 95
-      if(is.null(id.binsize)) id.binsize <- 0.1
-   }else if(id.metric==2){
-      if(ncol(rec)<6) stop("Requesting corrected identity, but .rec file doesn't have 6th column")
-      id.reccol <- 6
-      id.shortname <- 'cId.'
-      id.fullname  <- 'Corrected identity'
-      id.units     <- '%'
-      id.hallmarks <- seq(0, 100, by=5)
-      if(is.null(id.max)) id.max <- 100
-      if(is.null(id.cutoff)) id.cutoff <- 95
-      if(is.null(id.binsize)) id.binsize <- 0.1
-   }else if(id.metric==3){
-      id.reccol <- 4
-      id.shortname <- 'BSc.'
-      id.fullname  <- 'Bit score'
-      id.units     <- 'bits'
-      max.bs <- max(rec[, id.reccol])
-      id.hallmarks <- seq(0, max.bs*1.2, by=50)
-      if(is.null(id.max)) id.max <- max.bs
-      if(is.null(id.cutoff)) id.cutoff <- 0.95 * max.bs
-      if(is.null(id.binsize)) id.binsize <- 5
-   }
-   if(is.null(id.min)) id.min <- min(rec[, id.reccol]);
-   if(is.null(pos.max)) pos.max <- max(lim[, 3]);
-   id.lim <- c(id.min, id.max);
-   pos.lim <- c(pos.min, pos.max)/1e6;
-   id.breaks <- round((id.max-id.min)/id.binsize);
-   pos.breaks <- round((pos.max-pos.min)/pos.binsize);
-   if(is.null(main)) main <- paste('Recruitment plot of ', prefix, sep='');
-   pos.marks=seq(pos.min, pos.max, length.out=pos.breaks+1)/1e6;
-   id.marks=seq(id.min, id.max, length.out=id.breaks+1);
-   id.topclasses <- 0;
-   for(i in length(id.marks):1) if(id.marks[i]>id.cutoff) id.topclasses <- id.topclasses + 1;
-   # Set-up image
-   layout(matrix(c(3,4,1,2), nrow=2, byrow=TRUE), widths=c(2,1), heights=c(1,2));
-   out <- list();
-   # Recruitment plot
-   if(verbose) cat("Rec. plot.\n")
-   par(mar=c(5,4,0,0)+0.1);
-   rec.hist <- matrix(0, nrow=pos.breaks, ncol=id.breaks);
-   for(i in 1:nrow(rec)){
-      id.class <- ceiling((id.breaks)*((rec[i, id.reccol]-id.min)/(id.max-id.min)));
-      if(id.class<=id.breaks & id.class>0){
-	 for(pos in rec[i, 1]:rec[i, 2]){
-	    pos.class <- ceiling((pos.breaks)*((pos-pos.min)/(pos.max-pos.min)));
-	    if(pos.class<=pos.breaks & pos.class>0) rec.hist[pos.class, id.class] <- rec.hist[pos.class, id.class]+1;
-	 }
-      }
-   }
-   id.top <- c((1-id.topclasses):0) + id.breaks;
-   rec.col=gplots::colorpanel(256, rec.col1, rec.col2);
-   image(x=pos.marks, y=id.marks, z=log10(rec.hist),
-   		breaks=seq(0, log10(max(rec.hist)), length.out=1+length(rec.col)), col=rec.col,
-		xlim=pos.lim, ylim=id.lim, xlab='Position in genome (Mbp)',
-		ylab=paste(id.fullname, ' (',id.units,')', sep=''), xaxs='i', yaxs='r');
-   if(!is.na(contig.col)) abline(v=c(lim$V2, lim$V3)/1e6, lty=1, col=contig.col);
-   abline(h=id.hallmarks, lty=2, col=grey(0.7));
-   abline(h=id.marks[id.top[1]], lty=3, col=grey(0.5))
-   legend('bottomleft', 'Rec. plot', bg=rgb(1,1,1,2/3));
-   out <- c(out, list(pos.marks=pos.marks, id.marks=id.marks));
-   if(ret.recplot) out <- c(out, list(recplot=rec.hist));
-   # Identity histogram
-   if(verbose) cat(id.shortname, " hist.\n", sep='')
-   par(mar=c(5,0,0,2)+0.1);
-   id.hist <- id.summary.func(rec.hist);
-   plot(1, t='n', xlim=c(1, max(id.hist)), ylim=id.lim, ylab='', yaxt='n', xlab=paste('Sequences (bp),', id.summary.name), log='x', ...);
-   id.x <- rep(id.marks, each=2)[2:(id.breaks*2+1)]
-   id.f <- rep(id.hist, each=2)[1:(id.breaks*2)]
-   if(sum(id.f)>0){
-      lines(id.f, id.x, lwd=ifelse(id.splines>0, 1/2, 2), type='o', pch='.');
-      if(id.splines>0){
-	 id.spline <- smooth.spline(id.x[id.f>0], log(id.f[id.f>0]), spar=id.splines)
-	 lines(exp(id.spline$y), id.spline$x, lwd=2)
-      }
-   }
-   abline(h=id.hallmarks, lty=2, col=grey(0.7));
-   abline(h=id.marks[id.top[1]], lty=3, col=grey(0.5))
-   legend('bottomright', paste(id.shortname, 'histogram'), bg=rgb(1,1,1,2/3));
-   out <- c(out, list(id.mean=mean(rec[, id.reccol])));
-   out <- c(out, list(id.median=median(rec[, id.reccol])));
-   if(ret.hist)  out <- c(out, list(id.hist=id.hist));
+#' Enveomics: Recruitment Plots
+#'
+#' @description
+#' Produces recruitment plots provided that BlastTab.catsbj.pl has
+#' been previously executed. Requires the \pkg{gplots} library.
+#'
+#' @param prefix
+#' Path to the prefix of the BlastTab.catsbj.pl output files. At
+#' least the files \strong{.rec} and \strong{.lim} must exist with this prefix.
+#' @param id.min
+#' Minimum identity to be considered. By default, the minimum detected
+#' identity. This value is a percentage.
+#' @param id.max
+#' Maximum identity to be considered. By default, 100\%.
+#' @param id.binsize
+#' Size of the identity bins (vertical histograms). By default, 0.1 for
+#' identity metrics and 5 for bit score.
+#' @param id.splines
+#' Smoothing parameter for the splines in the identity histogram. Zero (0) for no
+#' splines. A generally good value is 1/2. If non-zero, requires the \pkg{stats} package.
+#' @param id.metric
+#' Metric of identity to be used (Y-axis).
+#' It can be any unambiguous prefix of:
+#' \itemize{
+#' \item "identity"
+#' \item "corrected identity"
+#' \item "bit score"}
+#' @param id.summary
+#' Method used to build the identity histogram (Horizontal axis of the right panel).
+#' It can be any unambiguous prefix of:
+#' \itemize{
+#' \item "sum"
+#' \item "average"
+#' \item "median"
+#' \item "90\% lower bound"
+#' \item "90\% upper bound"
+#' \item "95\% lower bound"
+#' \item "95\% upper bound" }
+#' The last four options
+#' correspond to the upper and lower boundaries of the 90\% and 95\% empirical confidence
+#' intervals.
+#' @param pos.min
+#' Minimum (leftmost) position in the reference (concatenated) genome (in bp).
+#' @param pos.max
+#' Maximum (rightmost) position in the reference (concatenated) genome (in bp).
+#' By default: Length of the genome.
+#' @param pos.binsize
+#' Size of the position bins (horizontal histograms) in bp.
+#' @param pos.splines
+#' Smoothing parameter for the splines in the position histogram. Zero (0) for no splines.
+#' If non-zero, requires the stats package.
+#' @param rec.col1
+#' Lightest color in the recruitment plot.
+#' @param rec.col2
+#' Darkest color in the recruitment plot.
+#' @param main
+#' Title of the plot.
+#' @param contig.col
+#' Color of the Contig boundaries. Set to \code{NA} to ignore Contig boundaries.
+#' @param ret.recplot
+#' Indicates if the matrix of the recruitment plot is to be returned.
+#' @param ret.hist
+#' Indicates if the values of the identity and position histograms are to be
+#' returned.
+#' @param ret.mode
+#' Ignored, for backwards compatibility.
+#' @param id.cutoff
+#' Minimum identity to consider an alignment as "top". By default, it is 95 (i.e.,
+#' 95\%) for the identity metrics and 95\% of the best scoring alignment for bit score.
+#' @param verbose
+#' Indicates if the function should report the advance.
+#' @param ...
+#' Any additional graphic parameters to be passed to plot for all panels except the
+#' recruitment plot (lower-left).
+#'
+#' @return
+#'
+#' Returns a list with the following elements:
+#'
+#' \describe{
+#' \item{\code{pos.marks}}{Boundaries of the position bins (in Mbp).}
+#' \item{\code{id.marks}}{Boundaries of the identity bins.}
+#' \item{\code{recplot}}{Matrix containing the recruitment plot values
+#'      (if \code{ret.recplot=TRUE}).}
+#' \item{\code{id.mean}}{Mean identity.}
+#' \item{\code{id.median}}{Median identity.}
+#' \item{\code{id.mode}}{Mode of the identity (if \code{ret.mode=TRUE}). Deprecated.}
+#' \item{\code{id.hist}}{Values of the identity histogram (if \code{ret.hist=TRUE}).}
+#' \item{\code{pos.hist.low}}{Values of the position histogram (depth) with "low"
+#'      identity (i.e., below id.cutoff) (if \code{ret.hist=TRUE}).}
+#' \item{\code{pos.hist.top}}{Values of the position histogram (depth) with "top"
+#'      identity (i.e., above id.cutoff) (if \code{ret.hist=TRUE}).}
+#' \item{\code{id.max}}{Value of \code{id.max}. This is returned because
+#'      \code{id.max=NULL} may vary.}
+#' \item{\code{id.cutoff}}{Value of \code{id.cutoff}.
+#'      This is returned because \code{id.cutoff=NULL} may vary.}
+#' \item{\code{seqdepth.mean.top}}{Average sequencing depth with identity above
+#'      \code{id.cutoff}.}
+#' \item{\code{seqdepth.mean.low}}{Average sequencing depth with identity below
+#'      \code{id.cutoff}.}
+#' \item{\code{seqdepth.mean}}{Average sequencing depth without identity filtering.}
+#' \item{\code{seqdepth.median.top}}{Median sequencing depth with identity above
+#'      \code{id.cutoff}.}
+#' \item{\code{seqdepth.median.low}}{Median sequencing depth with identity below
+#'      \code{id.cutoff}.}
+#' \item{\code{seqdepth.median}}{Median sequencing depth without identity filtering.}
+#' \item{\code{id.metric}}{Full name of the used identity metric.}
+#' \item{\code{id.summary}}{Full name of the summary method used to build the identity plot.}}
+#'
+#' @author Luis M. Rodriguez-R [aut, cre]
+#'
+#' @export
-   # Position histogram
-   if(verbose) cat("Pos. hist.\n")
-   par(mar=c(0,4,4,0)+0.1);
-   h1<-rep(0,nrow(rec.hist)) ;
-   h2<-rep(0,nrow(rec.hist)) ;
-   pos.winsize <- (pos.max-pos.min+1)/pos.breaks;
-   if(sum(rec.hist[, id.top])>0) h1 <- rowSums(matrix(rec.hist[, id.top], nrow=nrow(rec.hist)))/pos.winsize;
-   if(sum(rec.hist[,-id.top])>0) h2 <- rowSums(matrix(rec.hist[,-id.top], nrow=nrow(rec.hist)))/pos.winsize;
-   ymin <- min(1, h1[h1>0], h2[h2>0]);
-   ymax <- max(10, h1, h2);
-   if(is.na(ymin) || ymin<=0) ymin <- 1e-10;
-   if(is.na(ymax) || ymax<=0) ymax <- 1;
-   plot(1, t='n', xlab='', xaxt='n', ylab='Sequencing depth (X)', log='y', xlim=pos.lim,
-   	ylim=c(ymin, ymax), xaxs='i', main=main, ...);
-   if(!is.na(contig.col)) abline(v=c(lim[,2], lim[,3])/1e6, lty=1, col=contig.col);
-   abline(h=10^c(0:5), lty=2, col=grey(0.7));
-   if(sum(h2)>0){
-      h2.x <- rep(pos.marks, each=2)[2:(pos.breaks*2+1)]
-      h2.y <- rep(h2, each=2)[1:(pos.breaks*2)]
-      lines(h2.x, h2.y, lwd=ifelse(pos.splines>0, 1/2, 2), col=grey(0.5));
-      if(pos.splines>0){
-         h2.spline <- smooth.spline(h2.x[h2.y>0], log(h2.y[h2.y>0]), spar=pos.splines)
-	 lines(h2.spline$x, exp(h2.spline$y), lwd=2, col=grey(0.5))
-      }
-      if(ret.hist) out <- c(out, list(pos.hist.low=h2.y));
-   }
-   if(sum(h1)>0){
-      h1.x <- rep(pos.marks, each=2)[2:(pos.breaks*2+1)]
-      h1.y <- rep(h1, each=2)[1:(pos.breaks*2)]
-      lines(h1.x, h1.y, lwd=ifelse(pos.splines>0, 1/2, 2), col=grey(0));
-      if(pos.splines>0){
-         h1.spline <- smooth.spline(h1.x[h1.y>0], log(h1.y[h1.y>0]), spar=pos.splines)
-	 lines(h1.spline$x, exp(h1.spline$y), lwd=2, col=grey(0))
-      }
-      if(ret.hist) out <- c(out, list(pos.hist.top=h1.y));
-   }
-   legend('topleft', 'Pos. histogram', bg=rgb(1,1,1,2/3));
-   out <- c(out, list(id.max=id.max, id.cutoff=id.marks[id.top[1]]));
-   out <- c(out, list(seqdepth.mean.top=mean(h1)));
-   out <- c(out, list(seqdepth.mean.low=mean(h2)));
-   out <- c(out, list(seqdepth.mean=mean(h1+h2)));
-   out <- c(out, list(seqdepth.median.top=median(h1)));
-   out <- c(out, list(seqdepth.median.low=median(h2)));
-   out <- c(out, list(seqdepth.median=median(h1+h2)));
-   out <- c(out, list(id.metric=id.fullname));
-   out <- c(out, list(id.summary=id.summary.name));
-   # Legend
-   par(mar=c(0,0,4,2)+0.1);
-   plot(1, t='n', xlab='', xaxt='n', ylab='', yaxt='n', xlim=c(0,1), ylim=c(0,1), xaxs='r', yaxs='i', ...);
-   text(1/2, 5/6, labels=paste('Reads per ', signif((pos.max-pos.min)/pos.breaks, 2), ' bp (rec. plot)', sep=''), pos=3);
-   leg.col <- gplots::colorpanel(100, rec.col1, rec.col2);
-   leg.lab <- signif(10^seq(0, log10(max(rec.hist)), length.out=10), 2);
-   for(i in 1:10){
-      for(j in 1:10){
-         k <- (i-1)*10 + j;
-	 polygon(c(k-1, k, k, k-1)/100, c(2/3, 2/3, 5/6, 5/6), border=leg.col[k], col=leg.col[k]);
+enve.recplot <- structure(function(
+  prefix,
+  # Id. hist.
+  id.min=NULL,
+  id.max=NULL,
+  id.binsize=NULL,
+  id.splines=0,
+  id.metric='id',
+  id.summary='sum',
+  # Pos. hist.
+  pos.min=1,
+  pos.max=NULL,
+  pos.binsize=1e3,
+  pos.splines=0,
+  # Rec. plot
+  rec.col1='white',
+  rec.col2='black',
+  # General
+  main=NULL,
+  contig.col=grey(0.85),
+  # Return
+  ret.recplot=FALSE,
+  ret.hist=FALSE,
+  ret.mode=FALSE,
+  # General
+  id.cutoff=NULL,
+  verbose=TRUE,
+  ...
+){
+  # Reads `<prefix>.rec` and `<prefix>.lim`, draws a 2x2 layout (recruitment
+  # plot, identity histogram, position histogram and legend) and returns a list
+  # with the bin marks and summary statistics. `ret.mode` is accepted but not
+  # used anywhere in this body.
+  # Settings
+  METRICS <- c('identity', 'corrected identity', 'bit score');
+  # One entry per branch of the summary dispatch below; every documented
+  # option must be listed here to be selectable through pmatch().
+  SUMMARY <- c('sum', 'average', 'median', '90% lower bound', '90% upper bound',
+               '95% lower bound', '95% upper bound');
+  if(is.null(prefix)) stop('Parameter prefix is mandatory.');
+  if(!requireNamespace("gplots", quietly=TRUE)) stop('Unavailable gplots library.');
+  # Read files
+  if(verbose) cat("Reading files.\n")
+  rec <- read.table(paste(prefix, '.rec', sep=''), sep="\t", comment.char='', quote='');
+  lim <- read.table(paste(prefix, '.lim', sep=''), sep="\t", comment.char='', quote='');
+  # Configure ID summary
+  # pmatch() yields NA for both unknown and ambiguous prefixes (never -1), so
+  # ambiguity is detected by counting the candidates that share the prefix.
+  id.summary.arg <- id.summary;
+  id.summary <- pmatch(id.summary.arg, SUMMARY);
+  if(is.na(id.summary)){
+    if(sum(substr(SUMMARY, 1, nchar(id.summary.arg)) == id.summary.arg) > 1)
+      stop('Ambiguous identity summary.');
+    stop('Invalid identity summary.');
+  }
+  if(id.summary==1){
+    id.summary.func <- function(x) colSums(x);
+    id.summary.name <- 'sum'
+  }else if(id.summary==2){
+    id.summary.func <- function(x) colMeans(x);
+    id.summary.name <- 'mean'
+  }else if(id.summary==3){
+    id.summary.func <- function(x) apply(x,2,median);
+    id.summary.name <- 'median'
+  }else if(id.summary==4){
+    id.summary.func <- function(x) apply(x,2,quantile,probs=0.05,names=FALSE);
+    id.summary.name <- '90% LB'
+  }else if(id.summary==5){
+    id.summary.func <- function(x) apply(x,2,quantile,probs=0.95,names=FALSE);
+    id.summary.name <- '90% UB'
+  }else if(id.summary==6){
+    id.summary.func <- function(x) apply(x,2,quantile,probs=0.025,names=FALSE);
+    id.summary.name <- '95% LB'
+  }else if(id.summary==7){
+    id.summary.func <- function(x) apply(x,2,quantile,probs=0.975,names=FALSE);
+    id.summary.name <- '95% UB'
+  }
+  # Configure metrics
+  # Same NA-based handling as for the summary: pmatch() never returns -1.
+  id.metric.arg <- id.metric;
+  id.metric <- pmatch(id.metric.arg, METRICS);
+  if(is.na(id.metric)){
+    if(sum(substr(METRICS, 1, nchar(id.metric.arg)) == id.metric.arg) > 1)
+      stop('Ambiguous identity metric.');
+    stop('Invalid identity metric.');
+  }
+  # id.reccol selects the column of the .rec table used as the Y-axis metric.
+  if(id.metric==1){
+    id.reccol <- 3
+    id.shortname <- 'Id.'
+    id.fullname  <- 'Identity'
+    id.units     <- '%'
+    id.hallmarks <- seq(0, 100, by=5)
+    if(is.null(id.max)) id.max <- 100
+    if(is.null(id.cutoff)) id.cutoff <- 95
+    if(is.null(id.binsize)) id.binsize <- 0.1
+  }else if(id.metric==2){
+    if(ncol(rec)<6) stop("Requesting corrected identity, but .rec file doesn't have 6th column")
+    id.reccol <- 6
+    id.shortname <- 'cId.'
+    id.fullname  <- 'Corrected identity'
+    id.units     <- '%'
+    id.hallmarks <- seq(0, 100, by=5)
+    if(is.null(id.max)) id.max <- 100
+    if(is.null(id.cutoff)) id.cutoff <- 95
+    if(is.null(id.binsize)) id.binsize <- 0.1
+  }else if(id.metric==3){
+    id.reccol <- 4
+    id.shortname <- 'BSc.'
+    id.fullname  <- 'Bit score'
+    id.units     <- 'bits'
+    max.bs <- max(rec[, id.reccol])
+    id.hallmarks <- seq(0, max.bs*1.2, by=50)
+    if(is.null(id.max)) id.max <- max.bs
+    if(is.null(id.cutoff)) id.cutoff <- 0.95 * max.bs
+    if(is.null(id.binsize)) id.binsize <- 5
+  }
+  if(is.null(id.min)) id.min <- min(rec[, id.reccol]);
+  # Default rightmost position: largest value in the third column of .lim.
+  if(is.null(pos.max)) pos.max <- max(lim[, 3]);
+  id.lim <- c(id.min, id.max);
+  pos.lim <- c(pos.min, pos.max)/1e6;
+  id.breaks <- round((id.max-id.min)/id.binsize);
+  pos.breaks <- round((pos.max-pos.min)/pos.binsize);
+  if(is.null(main)) main <- paste('Recruitment plot of ', prefix, sep='');
+  # Bin boundaries (one more than the number of bins); positions are in Mbp.
+  pos.marks <- seq(pos.min, pos.max, length.out=pos.breaks+1)/1e6;
+  id.marks <- seq(id.min, id.max, length.out=id.breaks+1);
+  # Number of identity marks strictly above the cutoff.
+  id.topclasses <- sum(id.marks > id.cutoff);
+  # Set-up image
+  layout(matrix(c(3,4,1,2), nrow=2, byrow=TRUE), widths=c(2,1), heights=c(1,2));
+  out <- list();
+  # Recruitment plot
+  if(verbose) cat("Rec. plot.\n")
+  par(mar=c(5,4,0,0)+0.1);
+  # rec.hist[p, k] counts covered positions in position bin p and identity bin k.
+  rec.hist <- matrix(0, nrow=pos.breaks, ncol=id.breaks);
+  for(i in seq_len(nrow(rec))){
+    id.class <- ceiling((id.breaks)*((rec[i, id.reccol]-id.min)/(id.max-id.min)));
+    if(id.class<=id.breaks && id.class>0){
+      # Columns 1 and 2 of .rec are used as the first and last covered position.
+      for(pos in rec[i, 1]:rec[i, 2]){
+        pos.class <- ceiling((pos.breaks)*((pos-pos.min)/(pos.max-pos.min)));
+        if(pos.class<=pos.breaks && pos.class>0) rec.hist[pos.class, id.class] <- rec.hist[pos.class, id.class]+1;
       }
-      text((i-0.5)/10, 2/3, labels=paste(leg.lab[i], ''), srt=90, pos=2, offset=0, cex=3/4);
-   }
-   legend('bottom',
-   	legend=c('Contig boundary', 'Hallmark', paste(id.fullname, 'cutoff'),
-		paste('Pos. hist.: ',id.shortname,' > ',signif(id.marks[id.top[1]],2),id.units,sep=''),
-		paste('Pos. hist.: ',id.shortname,' < ',signif(id.marks[id.top[1]],2),id.units,sep='')), ncol=2,
-   	col=grey(c(0.85, 0.7, 0.5, 0, 0.5)), lty=c(1,2,3,1,1), lwd=c(1,1,1,2,2), bty='n', inset=0.05, cex=5/6);
-   return(out);
-   ### A list with the following elements:
-   ###
-   ### pos.marks: Midpoints of the position histogram.
-   ###
-   ### id.matrix: Midpoints of the identity histogram.
-   ###
-   ### recplot (if ret.recplot=TRUE): Matrix containing the recruitment plot values.
-   ###
-   ### id.mean: Mean identity.
-   ###
-   ### id.median: Median identity.
-   ###
-   ### id.mode (if ret.mode=TRUE): Mode of the identity. Deprecated.
-   ###
-   ### id.hist (if ret.hist=TRUE): Values of the identity histogram.
-   ###
-   ### pos.hist.low (if ret.hist=TRUE): Values of the position histogram (depth) with "low"
-   ### identity (i.e., below id.cutoff).
-   ###
-   ### pos.hist.top (if ret.hist=TRUE): Values of the position histogram (depth) with "top"
-   ### identity (i.e., above id.cutoff).
-   ###
-   ### id.max: Value of id.max. This is returned because id.max=NULL may vary.
-   ###
-   ### id.cutoff: Value of id.cutoff. This is returned because id.cutoff=NULL may vary.
-   ###
-   ### seqdepth.mean.top: Average sequencing depth with identity above id.cutoff.
-   ###
-   ### seqdepth.mean.low: Average sequencing depth with identity below id.cutoff.
-   ###
-   ### seqdepth.mean.all: Average sequencing depth without identity filtering.
-   ###
-   ### seqdepth.median.top: Median sequencing depth with identity above id.cutoff.
-   ###
-   ### seqdepth.median.low: Median sequencing depth with identity below id.cutoff.
-   ###
-   ### seqdepth.median.all: Median sequencing depth without identity filtering.
-   ###
-   ### id.metric: Full name of the used identity metric.
-   ###
-   ### id.summary: Full name of the summary method used to build the identity plot.
+    }
+  }
+  # Indexes of the identity bins treated as "top" (the last id.topclasses bins).
+  id.top <- c((1-id.topclasses):0) + id.breaks;
+  rec.col <- gplots::colorpanel(256, rec.col1, rec.col2);
+  image(x=pos.marks, y=id.marks, z=log10(rec.hist),
+        breaks=seq(0, log10(max(rec.hist)), length.out=1+length(rec.col)), col=rec.col,
+        xlim=pos.lim, ylim=id.lim, xlab='Position in genome (Mbp)',
+        ylab=paste(id.fullname, ' (',id.units,')', sep=''), xaxs='i', yaxs='r');
+  if(!is.na(contig.col)) abline(v=c(lim$V2, lim$V3)/1e6, lty=1, col=contig.col);
+  abline(h=id.hallmarks, lty=2, col=grey(0.7));
+  abline(h=id.marks[id.top[1]], lty=3, col=grey(0.5))
+  legend('bottomleft', 'Rec. plot', bg=rgb(1,1,1,2/3));
+  out <- c(out, list(pos.marks=pos.marks, id.marks=id.marks));
+  if(ret.recplot) out <- c(out, list(recplot=rec.hist));
+  # Identity histogram
+  if(verbose) cat(id.shortname, " hist.\n", sep='')
+  par(mar=c(5,0,0,2)+0.1);
+  id.hist <- id.summary.func(rec.hist);
+  plot(1, t='n', xlim=c(1, max(id.hist)), ylim=id.lim, ylab='', yaxt='n', xlab=paste('Sequences (bp),', id.summary.name), log='x', ...);
+  # Duplicate marks and values so that lines() draws a step-like profile.
+  id.x <- rep(id.marks, each=2)[2:(id.breaks*2+1)]
+  id.f <- rep(id.hist, each=2)[1:(id.breaks*2)]
+  if(sum(id.f)>0){
+    lines(id.f, id.x, lwd=ifelse(id.splines>0, 1/2, 2), type='o', pch='.');
+    if(id.splines>0){
+      id.spline <- smooth.spline(id.x[id.f>0], log(id.f[id.f>0]), spar=id.splines)
+      lines(exp(id.spline$y), id.spline$x, lwd=2)
+    }
+  }
+  abline(h=id.hallmarks, lty=2, col=grey(0.7));
+  abline(h=id.marks[id.top[1]], lty=3, col=grey(0.5))
+  legend('bottomright', paste(id.shortname, 'histogram'), bg=rgb(1,1,1,2/3));
+  out <- c(out, list(id.mean=mean(rec[, id.reccol])));
+  out <- c(out, list(id.median=median(rec[, id.reccol])));
+  if(ret.hist)  out <- c(out, list(id.hist=id.hist));
+  # Position histogram
+  if(verbose) cat("Pos. hist.\n")
+  par(mar=c(0,4,4,0)+0.1);
+  # h1: depth from the "top" identity bins; h2: depth from all other bins.
+  h1<-rep(0,nrow(rec.hist)) ;
+  h2<-rep(0,nrow(rec.hist)) ;
+  pos.winsize <- (pos.max-pos.min+1)/pos.breaks;
+  if(sum(rec.hist[, id.top])>0) h1 <- rowSums(matrix(rec.hist[, id.top], nrow=nrow(rec.hist)))/pos.winsize;
+  if(sum(rec.hist[,-id.top])>0) h2 <- rowSums(matrix(rec.hist[,-id.top], nrow=nrow(rec.hist)))/pos.winsize;
+  ymin <- min(1, h1[h1>0], h2[h2>0]);
+  ymax <- max(10, h1, h2);
+  # The Y-axis is logarithmic, so both limits must be strictly positive.
+  if(is.na(ymin) || ymin<=0) ymin <- 1e-10;
+  if(is.na(ymax) || ymax<=0) ymax <- 1;
+  plot(1, t='n', xlab='', xaxt='n', ylab='Sequencing depth (X)', log='y', xlim=pos.lim,
+       ylim=c(ymin, ymax), xaxs='i', main=main, ...);
+  if(!is.na(contig.col)) abline(v=c(lim[,2], lim[,3])/1e6, lty=1, col=contig.col);
+  abline(h=10^c(0:5), lty=2, col=grey(0.7));
+  if(sum(h2)>0){
+    h2.x <- rep(pos.marks, each=2)[2:(pos.breaks*2+1)]
+    h2.y <- rep(h2, each=2)[1:(pos.breaks*2)]
+    lines(h2.x, h2.y, lwd=ifelse(pos.splines>0, 1/2, 2), col=grey(0.5));
+    if(pos.splines>0){
+      h2.spline <- smooth.spline(h2.x[h2.y>0], log(h2.y[h2.y>0]), spar=pos.splines)
+      lines(h2.spline$x, exp(h2.spline$y), lwd=2, col=grey(0.5))
+    }
+    if(ret.hist) out <- c(out, list(pos.hist.low=h2.y));
+  }
+  if(sum(h1)>0){
+    h1.x <- rep(pos.marks, each=2)[2:(pos.breaks*2+1)]
+    h1.y <- rep(h1, each=2)[1:(pos.breaks*2)]
+    lines(h1.x, h1.y, lwd=ifelse(pos.splines>0, 1/2, 2), col=grey(0));
+    if(pos.splines>0){
+      h1.spline <- smooth.spline(h1.x[h1.y>0], log(h1.y[h1.y>0]), spar=pos.splines)
+      lines(h1.spline$x, exp(h1.spline$y), lwd=2, col=grey(0))
+    }
+    if(ret.hist) out <- c(out, list(pos.hist.top=h1.y));
+  }
+  legend('topleft', 'Pos. histogram', bg=rgb(1,1,1,2/3));
+  # The reported cutoff is the identity mark actually used, not the raw argument.
+  out <- c(out, list(id.max=id.max, id.cutoff=id.marks[id.top[1]]));
+  out <- c(out, list(seqdepth.mean.top=mean(h1)));
+  out <- c(out, list(seqdepth.mean.low=mean(h2)));
+  out <- c(out, list(seqdepth.mean=mean(h1+h2)));
+  out <- c(out, list(seqdepth.median.top=median(h1)));
+  out <- c(out, list(seqdepth.median.low=median(h2)));
+  out <- c(out, list(seqdepth.median=median(h1+h2)));
+  out <- c(out, list(id.metric=id.fullname));
+  out <- c(out, list(id.summary=id.summary.name));
+  # Legend
+  par(mar=c(0,0,4,2)+0.1);
+  plot(1, t='n', xlab='', xaxt='n', ylab='', yaxt='n', xlim=c(0,1), ylim=c(0,1), xaxs='r', yaxs='i', ...);
+  text(1/2, 5/6, labels=paste('Reads per ', signif((pos.max-pos.min)/pos.breaks, 2), ' bp (rec. plot)', sep=''), pos=3);
+  leg.col <- gplots::colorpanel(100, rec.col1, rec.col2);
+  leg.lab <- signif(10^seq(0, log10(max(rec.hist)), length.out=10), 2);
+  # Colour scale: 100 thin rectangles, with one label per group of ten.
+  for(i in 1:10){
+    for(j in 1:10){
+      k <- (i-1)*10 + j;
+      polygon(c(k-1, k, k, k-1)/100, c(2/3, 2/3, 5/6, 5/6), border=leg.col[k], col=leg.col[k]);
+    }
+    text((i-0.5)/10, 2/3, labels=paste(leg.lab[i], ''), srt=90, pos=2, offset=0, cex=3/4);
+  }
+  legend('bottom',
+         legend=c('Contig boundary', 'Hallmark', paste(id.fullname, 'cutoff'),
+                  paste('Pos. hist.: ',id.shortname,' > ',signif(id.marks[id.top[1]],2),id.units,sep=''),
+                  paste('Pos. hist.: ',id.shortname,' < ',signif(id.marks[id.top[1]],2),id.units,sep='')), ncol=2,
+         col=grey(c(0.85, 0.7, 0.5, 0, 0.5)), lty=c(1,2,3,1,1), lwd=c(1,1,1,2,2), bty='n', inset=0.05, cex=5/6);
+  return(out);
 });