mqppep_anova: mqppep_anova_script.Rmd comparison

comparison mqppep_anova_script.Rmd @ 12:4deacfee76ef draft

"planemo upload for repository https://github.com/galaxyproteomics/tools-galaxyp/tree/master/tools/mqppep commit e87d28ea433cc26db7fe44768685d08c06f7a0d0"

author	eschen42
date	Tue, 15 Mar 2022 18:17:55 +0000
parents	d728198f1ba5
children	b41a077af3aa

comparison

equal deleted inserted replaced

-:254ab97c6a2c
+:4deacfee76ef
 alphaFile: "test-data/alpha_levels.tabular"
 firstDataColumn: "Intensity"
 imputationMethod: !r c("group-median", "median", "mean", "random")[1]
 meanPercentile: 1
 sdPercentile: 0.2
-regexSampleNames: "\\.(\\d+)[A-Z]$"
+regexSampleNames: "\\.\\d+[A-Z]$"
-regexSampleGrouping: "(\\d+)"
+regexSampleGrouping: "\\d+"
 imputedDataFilename: "Upstream_Map_pST_outputfile_STEP4_QN_LT.txt"
 ---
 ```{r setup, include = FALSE}
 # ref for parameterizing Rmd document: https://stackoverflow.com/a/37940285
 knitr::opts_chunk$set(echo = FALSE, fig.dim = c(9, 10))
 m2 <- regexpr(regex_sample_grouping, temp_matches, perl = TRUE)
 sample_factor_levels <- as.factor(regmatches(temp_matches, m2))
 if (length(levels(sample_factor_levels)) < 2) {
+nuke_control_sequences <-
+function(s) {
+s <- gsub("[\\]", "xyzzy_plugh", s)
+s <- gsub("[$]", "\\\\$", s)
+s <- gsub("xyzzy_plugh", "$\\\\backslash$", s)
+return(s)
+}
 cat(
 "ERROR!!!! Cannot perform ANOVA analysis",
-"because it requires two or more factor levels\n"
+"(see next page)\\newpage\n"
 )
-cat("Unparsed sample names are:\n")
+cat(
-print(names(quant_data_imp_qn_log))
+"ERROR: ANOVA analysis",
-cat(sprintf("Parsing rule for SampleNames is '%s'\n", regex_sample_names))
+"requires two or more factor levels!\\newline\n"
-cat("Parsed names are:\n")
+)
-print(temp_matches)
-cat(sprintf(
+cat("\\newline\\newline\n")
-"Parsing rule for SampleGrouping is '%s'\n",
+cat("Unparsed sample names are:\\newline\n",
-regex_sample_grouping
+"\\begin{quote}\n",
-))
+paste(names(quant_data_imp_qn_log), collapse = "\\newline\n"),
-cat("Sample group assignments are:\n")
+"\n\\end{quote}\n\n")
-print(regmatches(temp_matches, m2))
+regex_sample_names <- nuke_control_sequences(regex_sample_names)
+cat("\\leavevmode\\newline\n")
+cat("Parsing rule for SampleNames is",
+"\\newline\n",
+"\\text{'",
+regex_sample_names,
+"'}\\newline\n",
+sep = ""
+)
+cat("\nParsed sample names are:\n",
+"\\begin{quote}\n",
+paste(temp_matches, collapse = "\\newline\n"),
+"\n\\end{quote}\n\n")
+regex_sample_grouping <- nuke_control_sequences(regex_sample_grouping)
+cat("\\leavevmode\\newline\n")
+cat("Parsing rule for SampleGrouping is",
+"\\newline\n",
+"\\text{'",
+regex_sample_grouping,
+"'}\\newline\n",
+sep = ""
+)
+cat("\\newline\n")
+cat("Sample group assignments are:\n",
+"\\begin{quote}\n",
+paste(regmatches(temp_matches, m2), collapse = "\\newline\n"),
+"\n\\end{quote}\n\n")
 } else {
 p_value_data_anova_ps <-
 apply(
 quant_data_imp_qn_log,
 1,
 else
 paste0("(%0.4e) %s")
 }
 )
 anova_filtered <- data.table(
 anova_filtered_merge$Phosphopeptide
 ,
 anova_filtered_merge$Intensity
 ,
 anova_filtered_merge[, 2:number_of_samples + 1]
 )
 colnames(anova_filtered) <-
 c("Phosphopeptide", colnames(filtered_data_filtered))
-# merge qualitative columns into the ANOVA data
+# Merge qualitative columns into the ANOVA data
 output_table <- data.frame(anova_filtered$Phosphopeptide)
 output_table <- merge(
 x = output_table
 ,
 y = data_table_imp_qn_lt
 by.x = "anova_filtered.Phosphopeptide"
 ,
 by.y = "Phosphopeptide"
 )
-#Produce heatmap to visualize significance and the effect of imputation
+# Produce heatmap to visualize significance and the effect of imputation
 m <-
 as.matrix(unimputed_quant_data_log[anova_filtered_merge_order, ])
+m_nan_rows <- rowSums(
+matrix(
+as.integer(is.na(m)),
+nrow = nrow(m)
+)
+)
+m <- m[!m_nan_rows, ]
 if (nrow(m) > 0) {
 rownames_m <- rownames(m)
 rownames(m) <- sapply(
 X = seq_len(nrow(m))
 ,
 FUN = function(i) {
 sprintf(
-anova_filtered_merge_format[i]
+anova_filtered_merge_format[i],
-,
+filtered_p$fdr_adjusted_anova_p[i],
-filtered_p$fdr_adjusted_anova_p[i]
-,
 rownames_m[i]
 )
 }
 )
-margins <- c(max(nchar(colnames(m))) * 10 / 16 # col
+margins <-
-, max(nchar(rownames(m))) * 5 / 16 # row
+c(max(nchar(colnames(m))) * 10 / 16 # col
-)
+, max(nchar(rownames(m))) * 5 / 16 # row
-how_many_peptides <- min(50, nrow(m))
+)
+how_many_peptides <- min(50, nrow(m))
-cat("\\newpage\n")
-if (nrow(m) > 50) {
+cat("\\newpage\n")
-cat("Heatmap for the 50 most-significant peptides",
+if (nrow(m) > 50) {
-sprintf(
+cat("Heatmap for the 50 most-significant peptides",
-"whose adjusted p-value < %0.2f\n",
+sprintf(
-cutoff)
+"whose adjusted p-value < %0.2f\n",
-)
+cutoff)
-} else {
+)
-cat("Heatmap for peptides whose",
+} else {
-sprintf("adjusted p-value < %0.2f\n",
+cat("Heatmap for peptides whose",
-cutoff)
+sprintf("adjusted p-value < %0.2f\n",
-)
+cutoff)
-}
+)
-cat("\\newline\n")
+}
 cat("\\newline\n")
-op <- par("cex.main")
+cat("\\newline\n")
-try(
+op <- par("cex.main")
-if (nrow(m) > 1) {
+try(
-par(cex.main = 0.6)
+if (nrow(m) > 1) {
-heatmap(
+par(cex.main = 0.6)
-m[how_many_peptides:1, ],
+heatmap(
-Rowv = NA,
+m[how_many_peptides:1, ],
-Colv = NA,
+Rowv = NA,
-cexRow = 0.7,
+Colv = NA,
-cexCol = 0.8,
+cexRow = 0.7,
-scale = "row",
+cexCol = 0.8,
-margins = margins,
+scale = "row",
-main =
+#ACE scale = "none",
-"Heatmap of unimputed, unnormalized intensities",
+margins = margins,
-xlab = ""
+main =
-)
+"Heatmap of unimputed, unnormalized intensities",
-}
+xlab = ""
 )
-par(op)
+}
+)
+par(op)
 }
 }
 }
 }
 ```

Mercurial > repos > eschen42 > mqppep_anova

comparison mqppep_anova_script.Rmd @ 12:4deacfee76ef draft