npm - @sjcrh/proteinpaint-server - Versions diffs - 2.109.1 → 2.110.0 - Mend

@sjcrh/proteinpaint-server 2.109.1 → 2.110.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (7) hide show

package/utils/edge.R CHANGED Viewed

@@ -115,27 +115,42 @@ filter_time <- system.time({
 normalization_time <- system.time({
     y <- y[keep, keep.lib.sizes = FALSE]
-    y <- calcNormFactors(y, method = "TMM")
+    y <- normLibSizes(y) # Using TMM method for normalization
 })
 #cat("Normalization time: ", normalization_time[3], " seconds\n")
+# Saving MDS plot image
+set.seed(as.integer(Sys.time())) # Set the seed according to current time
+cachedir <- input$cachedir # Importing serverconfig.cachedir
+random_number <- runif(1, min = 0, max = 1) # Generating random number
+mds_image_name <- paste0("edgeR_mds_temp_",random_number,".png") # Generating random image name so that simultaneous server side requests do NOT generate the same edgeR file name
+png(filename = paste0(cachedir,"/",mds_image_name), width = 1000, height = 1000, res = 200) # Opening a png device
+par(oma = c(1, 1, 1, 1)) # Creating a margin
+plotMDS(y) # Plot the edgeR MDS plot
+# dev.off() # Gives a null device message which breaks JSON. Commenting it out for now, will investigate it later
 # Differential expression analysis
 if (length(input$conf1) == 0) { # No adjustment of confounding factors
-    dispersion_time <- system.time({
+    design <- model.matrix(~conditions) # Based on the protocol defined in section 1.4 of edgeR manual https://bioconductor.org/packages/release/bioc/vignettes/edgeR/inst/doc/edgeRUsersGuide.pdf
+    fit_time <- system.time({
         suppressWarnings({
             suppressMessages({
-                y <- estimateDisp(y)
+                fit <- glmQLFit(y,design) # The glmQLFit() replaces glmFit() which implements the quasi-likelihood function. This is better able to account for overdispersion as it employs a more lenient approach where variance is not a fixed function of the mean.
             })
         })
     })
-    #cat("Dispersion time: ", dispersion_time[3], " seconds\n")
+    #cat("QL fit time: ", fit_time[3], " seconds\n")
-    exact_test_time <- system.time({
-        et <- exactTest(y)
+    test_time <- system.time({
+        suppressWarnings({
+            suppressMessages({
+                et <- glmQLFTest(fit)
+            })
+        })
     })
-    #cat("Exact test time: ", exact_test_time[3], " seconds\n")
+    #cat("QL test time: ", test_time[3], " seconds\n")
 } else { # Adjusting for confounding factors
     # Check the type of confounding variable
     if (input$conf1_mode == "continuous") { # If this is float, the input conf1 vector should be converted into a numeric vector
       conf1 <- as.numeric(input$conf1)
@@ -144,7 +159,7 @@ if (length(input$conf1) == 0) { # No adjustment of confounding factors
     }
     if (length(input$conf2) == 0) { # No adjustment of confounding factor 2
-          y$samples <- data.frame(conditions = conditions, conf1 = conf1)
+          y$samples <- data.frame(y$samples, conditions = conditions, conf1 = conf1)
           model_gen_time <- system.time({
                  design <- model.matrix(~ conditions + conf1, data = y$samples)
           })
@@ -156,29 +171,41 @@ if (length(input$conf1) == 0) { # No adjustment of confounding factors
           } else { # When input$conf2_mode == "discrete" keep the vector as string.
             conf2 <- as.factor(input$conf2)
           }
-          y$samples <- data.frame(conditions = conditions, conf1 = conf1, conf2 = conf2)
+          y$samples <- data.frame(y$samples, conditions = conditions, conf1 = conf1, conf2 = conf2)
           model_gen_time <- system.time({
                  design <- model.matrix(~ conditions + conf1 + conf2, data = y$samples)
           })
           #cat("Time for making design matrix: ", model_gen_time[3], " seconds\n")
     }
-    dispersion_time <- system.time({
-        y <- estimateDisp(y, design)
-    })
-    #cat("Dispersion time: ", dispersion_time[3], " seconds\n")
     fit_time <- system.time({
-        fit <- glmFit(y, design)
+        suppressWarnings({
+            suppressMessages({
+                fit <- glmQLFit(y,design)
+            })
+        })
     })
-    #cat("Fit time: ", fit_time[3], " seconds\n")
-    test_statistics_time <- system.time({
-        et <- glmLRT(fit, coef = "conditionsDiseased")
+    #cat("QL fit time: ", fit_time[3], " seconds\n")
+    test_time <- system.time({
+        suppressWarnings({
+            suppressMessages({
+                et <- glmQLFTest(fit, coef = "conditionsDiseased")
+            })
+        })
     })
-    #cat("Test statistics time: ", test_statistics_time[3], " seconds\n")
+    #cat("QL test time: ", test_time[3], " seconds\n")
 }
+# Saving QL fit image
+set.seed(as.integer(Sys.time())) # Set the seed according to current time
+cachedir <- input$cachedir # Importing serverconfig.cachedir
+random_number <- runif(1, min = 0, max = 1) # Generating random number
+ql_image_name <- paste0("edgeR_ql_temp_",random_number,".png") # Generating random image name so that simultaneous server side requests do NOT generate the same edgeR file name
+png(filename = paste0(cachedir,"/",ql_image_name), width = 1000, height = 1000, res = 200) # Opening a png device
+par(oma = c(1, 1, 1, 1)) # Creating a margin
+plotQLDisp(fit) # Plot the edgeR fit
+# dev.off() # Gives a null device message which breaks JSON. Commenting it out for now, will investigate it later
 # Multiple testing correction
 multiple_testing_correction_time <- system.time({
     logfc <- et$table$logFC
@@ -195,10 +222,14 @@ multiple_testing_correction_time <- system.time({
     names(output)[4] <- "original_p_value"
     names(output)[5] <- "adjusted_p_value"
 })
+final_output <- c()
+final_output$gene_data <- output
+final_output$edgeR_ql_image_name <- ql_image_name
+final_output$edgeR_mds_image_name <- mds_image_name
 #cat("Time for multiple testing correction: ", multiple_testing_correction_time[3], " seconds\n")
 # Output results
-toJSON(output)
+toJSON(final_output)
 #-----------------------------------#
 # Will implement this later