annotate getgo.r @ 5:b79c65c90744 draft

planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/goseq_1_22_0 commit 81aedf1b50849160f6c048c0da4bb1038bb813a5
author mvdbeek
date Sun, 28 Feb 2016 11:52:10 -0500
parents
children 0e9424413ab0
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
5
b79c65c90744 planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/goseq_1_22_0 commit 81aedf1b50849160f6c048c0da4bb1038bb813a5
mvdbeek
parents:
diff changeset
# Fetch GO category annotations for every gene found in a GTF file and write
# them as a two-column, tab-separated table.
#
# Command-line options (parsed with optparse):
#   --gtf          path to the GTF file whose gene_id values are looked up
#   -g, --genome   genome identifier handed to goseq's getgo()
#   -i, --gene_id  gene ID format handed to goseq's getgo()
#   -c, --cats     comma-separated list of categories to fetch
#   -o, --output   path of the table to write

suppressWarnings(suppressMessages(library(goseq)))
suppressWarnings(suppressMessages(library(optparse)))
suppressWarnings(suppressMessages(library(rtracklayer)))
suppressWarnings(suppressMessages(library(reshape2)))
# From here on, send the message stream to stdout instead of stderr.
sink(stdout(), type = "message")

option_list <- list(
  # Long flag only: an optparse short flag must be a dash plus ONE letter, so
  # the former "-gtf" was not a valid short flag ("-g" belongs to --genome).
  make_option("--gtf", type = "character",
              help = "Path to GTF file for which to fetch GO data"),
  make_option(c("-g", "--genome"), type = "character",
              help = "Genome [used for looking up GO categories]"),
  make_option(c("-i", "--gene_id"), type = "character",
              help = "Gene ID format"),
  # The default mirrors getgo()'s own default for fetch.cats, so omitting
  # --cats no longer crashes in strsplit().
  make_option(c("-c", "--cats"), type = "character",
              default = "GO:CC,GO:BP,GO:MF",
              help = "Comma-separated list of categories to fetch [default %default]"),
  make_option(c("-o", "--output"), type = "character",
              help = "Path to output file")
)

# The script takes no positional arguments, so none are advertised in the usage.
parser <- OptionParser(usage = "%prog [options]", option_list = option_list)
opts <- parse_args(parser)

# Fail early, with a readable message, when a required option is absent
# (options that were not supplied are NULL in the parsed list).
required_opts <- c("gtf", "genome", "gene_id", "output")
is_missing <- vapply(
  required_opts,
  function(opt) is.null(opts[[opt]]),
  logical(1)
)
if (any(is_missing)) {
  stop(
    "Missing required option(s): ",
    paste0("--", required_opts[is_missing], collapse = ", "),
    call. = FALSE
  )
}

# Vars:

gtf <- opts[["gtf"]]
genome <- opts[["genome"]]
gene_id <- opts[["gene_id"]]
output <- opts[["output"]]
cats <- unlist(strsplit(opts[["cats"]], ",", fixed = TRUE))

# Distinct gene_id values of the imported GTF records.
genes <- unique(import.gff(gtf)$gene_id)

# The third argument is the gene ID format given on the command line. The
# script previously passed `id`, a name that is never defined here.
go_categories <- getgo(genes, genome, gene_id, fetch.cats = cats)

# transform go category list to sth. more manipulatable in galaxy
go_categories <- lapply(go_categories, unlist)
# NOTE(review): reversemapping() is an internal (non-exported) goseq helper;
# presumably it inverts the list so that melt() yields the gene column first --
# confirm against the installed goseq version.
go_categories <- goseq:::reversemapping(go_categories)
# Flatten the list into a long data frame (one row per list element).
go_categories <- melt(go_categories)
colnames(go_categories) <- c("#gene_id", "go_category")

write.table(go_categories, output, sep = "\t", row.names = FALSE, quote = FALSE)
# Print the R/package versions used for this run.
sessionInfo()