Mercurial > repos > iuc > multigsea
changeset 1:c06f093f3758 draft default tip
planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/multigsea commit eb12f339f6f2e72792e6db36848222227d43d008
| author | iuc |
|---|---|
| date | Fri, 28 Feb 2025 10:25:26 +0000 |
| parents | d1925dbabe98 |
| children | |
| files | macros.xml multiGSEA.R multigsea.xml |
| diffstat | 3 files changed, 135 insertions(+), 111 deletions(-) [+] |
line wrap: on
line diff
--- a/macros.xml Wed Jun 07 19:48:35 2023 +0000 +++ b/macros.xml Fri Feb 28 10:25:26 2025 +0000 @@ -1,23 +1,23 @@ <macros> - <token name="@TOOL_VERSION@">1.8.0</token> - <token name="@SUFFIX_VERSION@">0</token> + <token name="@TOOL_VERSION@">1.12.0</token> + <token name="@SUFFIX_VERSION@">1</token> <token name="@PROFILE@">20.05</token> <xml name="requirements"> <requirements> <requirement type="package" version="@TOOL_VERSION@">bioconductor-multigsea</requirement> - <requirement type="package" version="2.2.1">r-argparse</requirement> + <requirement type="package" version="2.2.2">r-argparse</requirement> <requirement type="package" version="1.0.0">bioconductor-metaboliteidmapping</requirement> - <requirement type="package" version="3.16.0">bioconductor-org.Hs.eg.db</requirement> - <requirement type="package" version="3.16.0">bioconductor-org.Mm.eg.db</requirement> - <requirement type="package" version="3.16.0">bioconductor-org.Rn.eg.db</requirement> - <requirement type="package" version="3.16.0">bioconductor-org.Cf.eg.db</requirement> - <requirement type="package" version="3.16.0">bioconductor-org.Bt.eg.db</requirement> - <requirement type="package" version="3.16.0">bioconductor-org.Ss.eg.db</requirement> - <requirement type="package" version="3.16.0">bioconductor-org.Gg.eg.db</requirement> - <requirement type="package" version="3.16.0">bioconductor-org.Xl.eg.db</requirement> - <requirement type="package" version="3.16.0">bioconductor-org.Dr.eg.db</requirement> - <requirement type="package" version="3.16.0">bioconductor-org.Dm.eg.db</requirement> - <requirement type="package" version="3.16.0">bioconductor-org.Ce.eg.db</requirement> + <requirement type="package" version="3.18.0">bioconductor-org.Hs.eg.db</requirement> + <requirement type="package" version="3.18.0">bioconductor-org.Mm.eg.db</requirement> + <requirement type="package" version="3.18.0">bioconductor-org.Rn.eg.db</requirement> + <requirement type="package" version="3.18.0">bioconductor-org.Cf.eg.db</requirement> + <requirement type="package" version="3.18.0">bioconductor-org.Bt.eg.db</requirement> + <requirement type="package" version="3.18.0">bioconductor-org.Ss.eg.db</requirement> + <requirement type="package" version="3.18.0">bioconductor-org.Gg.eg.db</requirement> + <requirement type="package" version="3.18.0">bioconductor-org.Xl.eg.db</requirement> + <requirement type="package" version="3.18.0">bioconductor-org.Dr.eg.db</requirement> + <requirement type="package" version="3.18.0">bioconductor-org.Dm.eg.db</requirement> + <requirement type="package" version="3.18.0">bioconductor-org.Ce.eg.db</requirement> </requirements> </xml> <xml name="citations">
--- a/multiGSEA.R Wed Jun 07 19:48:35 2023 +0000 +++ b/multiGSEA.R Fri Feb 28 10:25:26 2025 +0000 @@ -1,6 +1,7 @@ library(multiGSEA, - quietly = TRUE, - warn.conflicts = FALSE) + quietly = TRUE, + warn.conflicts = FALSE +) library(argparse, quietly = TRUE, warn.conflicts = FALSE) ################################################################################ @@ -11,56 +12,69 @@ # Collect arguments from command line parser <- ArgumentParser(description = "multiGSEA R script") -parser$add_argument("--transcriptomics", required = FALSE, - help = "Transcriptomics data") +parser$add_argument("--transcriptomics", + required = FALSE, + help = "Transcriptomics data" +) parser$add_argument( - "--transcriptome_ids", - required = FALSE, - help = "Transcriptomics ids", - default = "SYMBOL" + "--transcriptome_ids", + required = FALSE, + help = "Transcriptomics ids", + default = "SYMBOL" ) -parser$add_argument("--proteomics", required = FALSE, - help = "Proteomics data") +parser$add_argument("--proteomics", + required = FALSE, + help = "Proteomics data" +) parser$add_argument( - "--proteome_ids", - required = FALSE, - help = "Proteomics ids", - default = "SYMBOL" + "--proteome_ids", + required = FALSE, + help = "Proteomics ids", + default = "SYMBOL" ) -parser$add_argument("--metabolomics", required = FALSE, - help = "Metabolomics data") +parser$add_argument("--metabolomics", + required = FALSE, + help = "Metabolomics data" +) parser$add_argument( - "--metabolome_ids", - required = FALSE, - help = "Metabolomics ids", - default = "HMDB" + "--metabolome_ids", + required = FALSE, + help = "Metabolomics ids", + default = "HMDB" ) -parser$add_argument("--organism", required = TRUE, - help = "Organism") -parser$add_argument("--combine_pvalues", required = TRUE, - help = "Combine p-values method") -parser$add_argument("--padj_method", required = TRUE, - help = "P-adjustment method") +parser$add_argument("--organism", + required = TRUE, + help = "Organism" +) +parser$add_argument("--combine_pvalues", + required = TRUE, + help = "Combine p-values method" +) +parser$add_argument("--padj_method", + required = TRUE, + help = "P-adjustment method" +) parser$add_argument("--databases", - required = TRUE, - help = "Pathway databases") + required = TRUE, + help = "Pathway databases" +) args <- parser$parse_args() ## ----Load library------------------------------------------------------------- organism_mapping <- c( - "hsapiens" = "org.Hs.eg.db", - "mmusculus" = "org.Mm.eg.db", - "rnorvegicus" = "org.Rn.eg.db", - "cfamiliaris" = "org.Cf.eg.db", - "btaurus" = "org.Bt.eg.db", - "sscrofa" = "org.Ss.eg.db", - "ggallus" = "org.Gg.eg.db", - "drerio" = "org.Xl.eg.db", - "xlaevis" = "org.Dr.eg.db", - "dmelanogaster" = "org.Dm.eg.db", - "celegans" = "org.Ce.eg.db" + "hsapiens" = "org.Hs.eg.db", + "mmusculus" = "org.Mm.eg.db", + "rnorvegicus" = "org.Rn.eg.db", + "cfamiliaris" = "org.Cf.eg.db", + "btaurus" = "org.Bt.eg.db", + "sscrofa" = "org.Ss.eg.db", + "ggallus" = "org.Gg.eg.db", + "drerio" = "org.Xl.eg.db", + "xlaevis" = "org.Dr.eg.db", + "dmelanogaster" = "org.Dm.eg.db", + "celegans" = "org.Ce.eg.db" ) library(organism_mapping[args$organism], character.only = TRUE) @@ -71,29 +85,31 @@ layer <- c() if (!is.null(args$transcriptomics)) { - transcriptome <- read.csv( - args$transcriptomics, - header = TRUE, - sep = "\t", - dec = "." - ) - layer <- append(layer, "transcriptome") + transcriptome <- read.csv( + args$transcriptomics, + header = TRUE, + sep = "\t", + dec = "." + ) + layer <- append(layer, "transcriptome") } if (!is.null(args$proteomics)) { - proteome <- read.csv(args$proteomics, - header = TRUE, - sep = "\t", - dec = ".") - layer <- append(layer, "proteome") + proteome <- read.csv(args$proteomics, + header = TRUE, + sep = "\t", + dec = "." + ) + layer <- append(layer, "proteome") } if (!is.null(args$metabolomics)) { - metabolome <- read.csv(args$metabolomics, - header = TRUE, - sep = "\t", - dec = ".") - layer <- append(layer, "metabolome") + metabolome <- read.csv(args$metabolomics, + header = TRUE, + sep = "\t", + dec = "." + ) + layer <- append(layer, "metabolome") } ## ----rank_features------------------------------------------------------------ @@ -103,70 +119,76 @@ ## add transcriptome layer if (!is.null(args$transcriptomics)) { - omics_data$transcriptome <- rankFeatures(transcriptome$logFC, - transcriptome$pValue) - names(omics_data$transcriptome) <- transcriptome$Symbol + omics_data$transcriptome <- rankFeatures( + transcriptome$logFC, + transcriptome$pValue + ) + names(omics_data$transcriptome) <- transcriptome$Symbol } ## add proteome layer if (!is.null(args$proteomics)) { - omics_data$proteome <- rankFeatures(proteome$logFC, proteome$pValue) - names(omics_data$proteome) <- proteome$Symbol + omics_data$proteome <- rankFeatures(proteome$logFC, proteome$pValue) + names(omics_data$proteome) <- proteome$Symbol } ## add metabolome layer ## HMDB features have to be updated to the new HMDB format if (!is.null(args$metabolomics)) { - omics_data$metabolome <- - rankFeatures(metabolome$logFC, metabolome$pValue) - names(omics_data$metabolome) <- metabolome$HMDB - names(omics_data$metabolome) <- gsub("HMDB", "HMDB00", - names(omics_data$metabolome)) + omics_data$metabolome <- + rankFeatures(metabolome$logFC, metabolome$pValue) + names(omics_data$metabolome) <- metabolome$HMDB + names(omics_data$metabolome) <- gsub( + "HMDB", "HMDB00", + names(omics_data$metabolome) + ) } ## remove NA's and sort feature ranks omics_data <- lapply(omics_data, function(vec) { - sort(vec[!is.na(vec)]) + sort(vec[!is.na(vec)]) }) ## ----Pathway definitions------------------------------------------------------ pathways <- - getMultiOmicsFeatures( - dbs = unlist(strsplit(args$databases, ",", fixed = TRUE)), - layer = layer, - returnTranscriptome = args$transcriptome_ids, - returnProteome = args$proteome_ids, - returnMetabolome = args$metabolome_ids, - organism = args$organism, - useLocal = FALSE - ) + getMultiOmicsFeatures( + dbs = unlist(strsplit(args$databases, ",", fixed = TRUE)), + layer = layer, + returnTranscriptome = args$transcriptome_ids, + returnProteome = args$proteome_ids, + returnMetabolome = args$metabolome_ids, + organism = args$organism, + useLocal = FALSE + ) ## ----calculate enrichment----------------------------------------------------- enrichment_scores <- - multiGSEA(pathways, omics_data) + multiGSEA(pathways, omics_data) ## ----combine_pvalues---------------------------------------------------------- -df <- extractPvalues(enrichmentScores = enrichment_scores, - pathwayNames = names(pathways[[1]])) +df <- extractPvalues( + enrichmentScores = enrichment_scores, + pathwayNames = names(pathways[[1]]) +) df$combined_pval <- - combinePvalues(df, method = args$combine_pvalues) + combinePvalues(df, method = args$combine_pvalues) df$combined_padj <- - p.adjust(df$combined_pval, method = args$padj_method) + p.adjust(df$combined_pval, method = args$padj_method) df <- cbind(data.frame(pathway = names(pathways[[1]])), df) ## ----Write output------------------------------------------------------------- write.table( - df, - file = "results.tsv", - quote = FALSE, - sep = "\t", - col.names = TRUE, - row.names = FALSE + df, + file = "results.tsv", + quote = FALSE, + sep = "\t", + col.names = TRUE, + row.names = FALSE )
--- a/multigsea.xml Wed Jun 07 19:48:35 2023 +0000 +++ b/multigsea.xml Fri Feb 28 10:25:26 2025 +0000 @@ -101,15 +101,14 @@ <option value="dmelanogaster">Drosophila melanogaster (Fruit fly)</option> <option value="celegans">Caenorabditis elegans (Roundworm)</option> </param> - <param name="databases" type="select" multiple="true" label="Pathway databases" help="Available pathway databases"> - <option value="all" selected="true">All available databases</option> - <option value="kegg">KEGG</option> - <option value="reactome">REACTOME</option> - <option value="wikipathways">WIKIPATHWAYS</option> - <option value="pathbank">PATHBANK</option> - <option value="smpdb">SMPDB (Human only)</option> - <option value="panther">PANTHER (Human only)</option> - <option value="pharmgkb">PHARMGKB (Human only)</option> + <param name="databases" type="select" multiple="true" optional="false" label="Pathway databases" help="Available pathway databases"> + <option value="kegg" selected="true">KEGG</option> + <option value="reactome" selected="true">REACTOME</option> + <option value="wikipathways" selected="true">WIKIPATHWAYS</option> + <option value="pathbank" selected="true">PATHBANK</option> + <option value="smpdb">SMPDB (Human only)</option> + <option value="panther">PANTHER (Human only)</option> + <option value="pharmgkb">PHARMGKB (Human only)</option> </param> <param name="combine_pvalues" type="select" label="Combine p-values method" help="It specifies the method to combine multiple p-values "> <option value="stouffer">Stouffer</option> @@ -144,6 +143,8 @@ <output name="output"> <assert_contents> <has_size value="43574" delta="300"/> + <has_n_lines n="327"/> + <has_n_columns n="9"/> <has_text text="Ubiquinone and other terpenoid-quinone biosynthesis"/> </assert_contents> </output> @@ -171,7 +172,8 @@ </conditional> <output name="output"> <assert_contents> - <has_size value="42541" delta="300"/> + <has_n_lines n="327"/> + <has_n_columns n="9"/> <has_text text="Ubiquinone and other terpenoid-quinone biosynthesis"/> </assert_contents> </output>
