annotate getgo.r @ 6:0e9424413ab0 draft

planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/goseq_1_22_0 commit f95b47ed1a09ce14d3b565e8ea56d8bf12c35814-dirty
author mvdbeek
date Thu, 03 Mar 2016 09:56:51 -0500
parents b79c65c90744
children 04b9c519d3e1
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
6
0e9424413ab0 planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/goseq_1_22_0 commit f95b47ed1a09ce14d3b565e8ea56d8bf12c35814-dirty
mvdbeek
parents: 5
diff changeset
1 options( show.error.messages=F, error = function () { cat( geterrmessage(), file=stderr() ); q( "no", 1, F ) } )
0e9424413ab0 planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/goseq_1_22_0 commit f95b47ed1a09ce14d3b565e8ea56d8bf12c35814-dirty
mvdbeek
parents: 5
diff changeset
2
0e9424413ab0 planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/goseq_1_22_0 commit f95b47ed1a09ce14d3b565e8ea56d8bf12c35814-dirty
mvdbeek
parents: 5
diff changeset
3 # we need that to not crash galaxy with an UTF8 error on German LC settings.
0e9424413ab0 planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/goseq_1_22_0 commit f95b47ed1a09ce14d3b565e8ea56d8bf12c35814-dirty
mvdbeek
parents: 5
diff changeset
4 loc <- Sys.setlocale("LC_MESSAGES", "en_US.UTF-8")
0e9424413ab0 planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/goseq_1_22_0 commit f95b47ed1a09ce14d3b565e8ea56d8bf12c35814-dirty
mvdbeek
parents: 5
diff changeset
5
0e9424413ab0 planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/goseq_1_22_0 commit f95b47ed1a09ce14d3b565e8ea56d8bf12c35814-dirty
mvdbeek
parents: 5
diff changeset
6 suppressPackageStartupMessages({
0e9424413ab0 planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/goseq_1_22_0 commit f95b47ed1a09ce14d3b565e8ea56d8bf12c35814-dirty
mvdbeek
parents: 5
diff changeset
7 library("goseq")
0e9424413ab0 planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/goseq_1_22_0 commit f95b47ed1a09ce14d3b565e8ea56d8bf12c35814-dirty
mvdbeek
parents: 5
diff changeset
8 library("optparse")
0e9424413ab0 planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/goseq_1_22_0 commit f95b47ed1a09ce14d3b565e8ea56d8bf12c35814-dirty
mvdbeek
parents: 5
diff changeset
9 library("rtracklayer")
0e9424413ab0 planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/goseq_1_22_0 commit f95b47ed1a09ce14d3b565e8ea56d8bf12c35814-dirty
mvdbeek
parents: 5
diff changeset
10 library("reshape2")
0e9424413ab0 planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/goseq_1_22_0 commit f95b47ed1a09ce14d3b565e8ea56d8bf12c35814-dirty
mvdbeek
parents: 5
diff changeset
11 })
0e9424413ab0 planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/goseq_1_22_0 commit f95b47ed1a09ce14d3b565e8ea56d8bf12c35814-dirty
mvdbeek
parents: 5
diff changeset
12
5
b79c65c90744 planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/goseq_1_22_0 commit 81aedf1b50849160f6c048c0da4bb1038bb813a5
mvdbeek
parents:
diff changeset
13 sink(stdout(), type = "message")
b79c65c90744 planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/goseq_1_22_0 commit 81aedf1b50849160f6c048c0da4bb1038bb813a5
mvdbeek
parents:
diff changeset
14
b79c65c90744 planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/goseq_1_22_0 commit 81aedf1b50849160f6c048c0da4bb1038bb813a5
mvdbeek
parents:
diff changeset
15 option_list <- list(
b79c65c90744 planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/goseq_1_22_0 commit 81aedf1b50849160f6c048c0da4bb1038bb813a5
mvdbeek
parents:
diff changeset
16 make_option(c("-gtf", "--gtf"), type="character", help = "Path to GTF file for which to fetch GO data"),
b79c65c90744 planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/goseq_1_22_0 commit 81aedf1b50849160f6c048c0da4bb1038bb813a5
mvdbeek
parents:
diff changeset
17 make_option(c("-g", "--genome"), type="character", help = "Genome [used for looking up GO categories]"),
b79c65c90744 planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/goseq_1_22_0 commit 81aedf1b50849160f6c048c0da4bb1038bb813a5
mvdbeek
parents:
diff changeset
18 make_option(c("-i", "--gene_id"), type="character", help="Gene ID format"),
b79c65c90744 planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/goseq_1_22_0 commit 81aedf1b50849160f6c048c0da4bb1038bb813a5
mvdbeek
parents:
diff changeset
19 make_option(c("-c", "--cats"), type="character", help="Comma-seperated list of categories to fetch"),
b79c65c90744 planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/goseq_1_22_0 commit 81aedf1b50849160f6c048c0da4bb1038bb813a5
mvdbeek
parents:
diff changeset
20 make_option(c("-o", "--output"), type="character", help="Path to output file")
b79c65c90744 planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/goseq_1_22_0 commit 81aedf1b50849160f6c048c0da4bb1038bb813a5
mvdbeek
parents:
diff changeset
21 )
b79c65c90744 planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/goseq_1_22_0 commit 81aedf1b50849160f6c048c0da4bb1038bb813a5
mvdbeek
parents:
diff changeset
22
b79c65c90744 planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/goseq_1_22_0 commit 81aedf1b50849160f6c048c0da4bb1038bb813a5
mvdbeek
parents:
diff changeset
23 parser <- OptionParser(usage = "%prog [options] file", option_list=option_list)
b79c65c90744 planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/goseq_1_22_0 commit 81aedf1b50849160f6c048c0da4bb1038bb813a5
mvdbeek
parents:
diff changeset
24 args = parse_args(parser)
b79c65c90744 planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/goseq_1_22_0 commit 81aedf1b50849160f6c048c0da4bb1038bb813a5
mvdbeek
parents:
diff changeset
25
6
0e9424413ab0 planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/goseq_1_22_0 commit f95b47ed1a09ce14d3b565e8ea56d8bf12c35814-dirty
mvdbeek
parents: 5
diff changeset
26 # vars
5
b79c65c90744 planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/goseq_1_22_0 commit 81aedf1b50849160f6c048c0da4bb1038bb813a5
mvdbeek
parents:
diff changeset
27
b79c65c90744 planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/goseq_1_22_0 commit 81aedf1b50849160f6c048c0da4bb1038bb813a5
mvdbeek
parents:
diff changeset
28 gtf = args$gtf
b79c65c90744 planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/goseq_1_22_0 commit 81aedf1b50849160f6c048c0da4bb1038bb813a5
mvdbeek
parents:
diff changeset
29 genome = args$genome
b79c65c90744 planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/goseq_1_22_0 commit 81aedf1b50849160f6c048c0da4bb1038bb813a5
mvdbeek
parents:
diff changeset
30 gene_id = args$gene_id
b79c65c90744 planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/goseq_1_22_0 commit 81aedf1b50849160f6c048c0da4bb1038bb813a5
mvdbeek
parents:
diff changeset
31 output = args$output
b79c65c90744 planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/goseq_1_22_0 commit 81aedf1b50849160f6c048c0da4bb1038bb813a5
mvdbeek
parents:
diff changeset
32 cats = unlist(strsplit(args$cats, ','))
6
0e9424413ab0 planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/goseq_1_22_0 commit f95b47ed1a09ce14d3b565e8ea56d8bf12c35814-dirty
mvdbeek
parents: 5
diff changeset
33
0e9424413ab0 planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/goseq_1_22_0 commit f95b47ed1a09ce14d3b565e8ea56d8bf12c35814-dirty
mvdbeek
parents: 5
diff changeset
34 # retrieve and transform data
5
b79c65c90744 planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/goseq_1_22_0 commit 81aedf1b50849160f6c048c0da4bb1038bb813a5
mvdbeek
parents:
diff changeset
35 genes = unique(import.gff(gtf)$gene_id)
6
0e9424413ab0 planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/goseq_1_22_0 commit f95b47ed1a09ce14d3b565e8ea56d8bf12c35814-dirty
mvdbeek
parents: 5
diff changeset
36 go_categories = getgo(genes, genome, gene_id, fetch.cats=cats)
5
b79c65c90744 planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/goseq_1_22_0 commit 81aedf1b50849160f6c048c0da4bb1038bb813a5
mvdbeek
parents:
diff changeset
37 go_categories = goseq:::reversemapping(go_categories)
b79c65c90744 planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/goseq_1_22_0 commit 81aedf1b50849160f6c048c0da4bb1038bb813a5
mvdbeek
parents:
diff changeset
38 go_categories = melt(go_categories)
b79c65c90744 planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/goseq_1_22_0 commit 81aedf1b50849160f6c048c0da4bb1038bb813a5
mvdbeek
parents:
diff changeset
39
6
0e9424413ab0 planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/goseq_1_22_0 commit f95b47ed1a09ce14d3b565e8ea56d8bf12c35814-dirty
mvdbeek
parents: 5
diff changeset
40 write.table(go_categories, output, sep="\t", col.names = FALSE, row.names = FALSE, quote = FALSE)
5
b79c65c90744 planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/goseq_1_22_0 commit 81aedf1b50849160f6c048c0da4bb1038bb813a5
mvdbeek
parents:
diff changeset
41 sessionInfo()