annotate venn_list-c96bef0643dc/tools/plotting/venn_list.xml @ 1:116ccf1c84d5 draft

Uploaded v0.0.5
author peterjc
date Thu, 16 May 2013 12:37:09 -0400
parents
children
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
1
116ccf1c84d5 Uploaded v0.0.5
peterjc
parents:
diff changeset
1 <tool id="venn_list" name="Venn Diagram" version="0.0.3">
116ccf1c84d5 Uploaded v0.0.5
peterjc
parents:
diff changeset
2 <description>from lists</description>
116ccf1c84d5 Uploaded v0.0.5
peterjc
parents:
diff changeset
3 <command interpreter="python">
116ccf1c84d5 Uploaded v0.0.5
peterjc
parents:
diff changeset
4 venn_list.py
116ccf1c84d5 Uploaded v0.0.5
peterjc
parents:
diff changeset
5 #if $universe.type_select=="implicit":
116ccf1c84d5 Uploaded v0.0.5
peterjc
parents:
diff changeset
6 - -
116ccf1c84d5 Uploaded v0.0.5
peterjc
parents:
diff changeset
7 #else:
116ccf1c84d5 Uploaded v0.0.5
peterjc
parents:
diff changeset
8 $main $main.ext
116ccf1c84d5 Uploaded v0.0.5
peterjc
parents:
diff changeset
9 #end if
116ccf1c84d5 Uploaded v0.0.5
peterjc
parents:
diff changeset
10 "$main_lab"
116ccf1c84d5 Uploaded v0.0.5
peterjc
parents:
diff changeset
11 #for $s in $sets:
116ccf1c84d5 Uploaded v0.0.5
peterjc
parents:
diff changeset
12 $s.set $s.set.ext "$s.lab"
116ccf1c84d5 Uploaded v0.0.5
peterjc
parents:
diff changeset
13 #end for
116ccf1c84d5 Uploaded v0.0.5
peterjc
parents:
diff changeset
14 $PDF</command>
116ccf1c84d5 Uploaded v0.0.5
peterjc
parents:
diff changeset
15 <inputs>
116ccf1c84d5 Uploaded v0.0.5
peterjc
parents:
diff changeset
16 <param name="main_lab" size="30" type="text" value="Venn Diagram" label="Plot title"/>
116ccf1c84d5 Uploaded v0.0.5
peterjc
parents:
diff changeset
17 <conditional name="universe">
116ccf1c84d5 Uploaded v0.0.5
peterjc
parents:
diff changeset
18 <param name="type_select" type="select" label="Implicit or explicit full ID list?">
116ccf1c84d5 Uploaded v0.0.5
peterjc
parents:
diff changeset
19 <option value="explicit">Explicit</option>
116ccf1c84d5 Uploaded v0.0.5
peterjc
parents:
diff changeset
20 <option value="implicit">Implicit (use union of sets below)</option>
116ccf1c84d5 Uploaded v0.0.5
peterjc
parents:
diff changeset
21 </param>
116ccf1c84d5 Uploaded v0.0.5
peterjc
parents:
diff changeset
22 <when value="explicit">
116ccf1c84d5 Uploaded v0.0.5
peterjc
parents:
diff changeset
23 <param name="main" type="data" format="tabular,fasta,fastq,sff" label="Full dataset (with all identifiers)" help="Tabular file (uses column one), FASTA, FASTQ or SFF file."/>
116ccf1c84d5 Uploaded v0.0.5
peterjc
parents:
diff changeset
24 </when>
116ccf1c84d5 Uploaded v0.0.5
peterjc
parents:
diff changeset
25 <when value="implicit"/>
116ccf1c84d5 Uploaded v0.0.5
peterjc
parents:
diff changeset
26 </conditional>
116ccf1c84d5 Uploaded v0.0.5
peterjc
parents:
diff changeset
27 <repeat name="sets" min="1" max="3" title="Sets">
116ccf1c84d5 Uploaded v0.0.5
peterjc
parents:
diff changeset
28 <param name="set" type="data" format="tabular,fasta,fastq,sff" label="Members of set" help="Tabular file (uses column one), FASTA, FASTQ or SFF file."/>
116ccf1c84d5 Uploaded v0.0.5
peterjc
parents:
diff changeset
29 <param name="lab" size="30" type="text" value="Group" label="Caption for set"/>
116ccf1c84d5 Uploaded v0.0.5
peterjc
parents:
diff changeset
30 </repeat>
116ccf1c84d5 Uploaded v0.0.5
peterjc
parents:
diff changeset
31 </inputs>
116ccf1c84d5 Uploaded v0.0.5
peterjc
parents:
diff changeset
32 <outputs>
116ccf1c84d5 Uploaded v0.0.5
peterjc
parents:
diff changeset
33 <data format="pdf" name="PDF" />
116ccf1c84d5 Uploaded v0.0.5
peterjc
parents:
diff changeset
34 </outputs>
116ccf1c84d5 Uploaded v0.0.5
peterjc
parents:
diff changeset
35 <requirements>
116ccf1c84d5 Uploaded v0.0.5
peterjc
parents:
diff changeset
36 <requirement type="python-module">rpy</requirement>
116ccf1c84d5 Uploaded v0.0.5
peterjc
parents:
diff changeset
37 <requirement type="python-module">Bio</requirement>
116ccf1c84d5 Uploaded v0.0.5
peterjc
parents:
diff changeset
38 </requirements>
116ccf1c84d5 Uploaded v0.0.5
peterjc
parents:
diff changeset
39 <tests>
116ccf1c84d5 Uploaded v0.0.5
peterjc
parents:
diff changeset
40 <!-- Doesn't seem to work properly, manages to get two sets, both
116ccf1c84d5 Uploaded v0.0.5
peterjc
parents:
diff changeset
41 with same FASTA file, but second with default "Group" label.
116ccf1c84d5 Uploaded v0.0.5
peterjc
parents:
diff changeset
42 <test>
116ccf1c84d5 Uploaded v0.0.5
peterjc
parents:
diff changeset
43 <param name="type_select" value="explicit"/>
116ccf1c84d5 Uploaded v0.0.5
peterjc
parents:
diff changeset
44 <param name="main" value="venn_list.tabular" ftype="tabular"/>
116ccf1c84d5 Uploaded v0.0.5
peterjc
parents:
diff changeset
45 <param name="main_lab" value="Some Proteins"/>
116ccf1c84d5 Uploaded v0.0.5
peterjc
parents:
diff changeset
46 <param name="set" value="rhodopsin_proteins.fasta"/>
116ccf1c84d5 Uploaded v0.0.5
peterjc
parents:
diff changeset
47 <param name="lab" value="Rhodopsins"/>
116ccf1c84d5 Uploaded v0.0.5
peterjc
parents:
diff changeset
48 <output name="PDF" file="venn_list1.pdf" ftype="pdf"/>
116ccf1c84d5 Uploaded v0.0.5
peterjc
parents:
diff changeset
49 </test>
116ccf1c84d5 Uploaded v0.0.5
peterjc
parents:
diff changeset
50 -->
116ccf1c84d5 Uploaded v0.0.5
peterjc
parents:
diff changeset
51 <!-- Can't use more than one repeat value in tests (yet)
116ccf1c84d5 Uploaded v0.0.5
peterjc
parents:
diff changeset
52 <test>
116ccf1c84d5 Uploaded v0.0.5
peterjc
parents:
diff changeset
53 <param name="type_select" value="explicit"/>
116ccf1c84d5 Uploaded v0.0.5
peterjc
parents:
diff changeset
54 <param name="main" value="venn_list.tabular" ftype="tabular"/>
116ccf1c84d5 Uploaded v0.0.5
peterjc
parents:
diff changeset
55 <param name="main_lab" value="Some Proteins"/>
116ccf1c84d5 Uploaded v0.0.5
peterjc
parents:
diff changeset
56 <param name="count" value="3"/>
116ccf1c84d5 Uploaded v0.0.5
peterjc
parents:
diff changeset
57 <param name="set" value="rhodopsin_proteins.fasta"/>
116ccf1c84d5 Uploaded v0.0.5
peterjc
parents:
diff changeset
58 <param name="lab" value="Rhodopsins"/>
116ccf1c84d5 Uploaded v0.0.5
peterjc
parents:
diff changeset
59 <param name="set" value="four_human_proteins.fasta"/>
116ccf1c84d5 Uploaded v0.0.5
peterjc
parents:
diff changeset
60 <param name="lab" value="Human"/>
116ccf1c84d5 Uploaded v0.0.5
peterjc
parents:
diff changeset
61 <param name="set" value="blastp_four_human_vs_rhodopsin.tabular"/>
116ccf1c84d5 Uploaded v0.0.5
peterjc
parents:
diff changeset
62 <param name="lab" value="Human vs Rhodopsin BLAST"/>
116ccf1c84d5 Uploaded v0.0.5
peterjc
parents:
diff changeset
63 <output name="PDF" file="venn_list3.pdf" ftype="pdf"/>
116ccf1c84d5 Uploaded v0.0.5
peterjc
parents:
diff changeset
64 </test>
116ccf1c84d5 Uploaded v0.0.5
peterjc
parents:
diff changeset
65 -->
116ccf1c84d5 Uploaded v0.0.5
peterjc
parents:
diff changeset
66 </tests>
116ccf1c84d5 Uploaded v0.0.5
peterjc
parents:
diff changeset
67 <help>
116ccf1c84d5 Uploaded v0.0.5
peterjc
parents:
diff changeset
68
116ccf1c84d5 Uploaded v0.0.5
peterjc
parents:
diff changeset
69 .. class:: infomark
116ccf1c84d5 Uploaded v0.0.5
peterjc
parents:
diff changeset
70
116ccf1c84d5 Uploaded v0.0.5
peterjc
parents:
diff changeset
71 **TIP:** If your data is in tabular files, the identifier is assumed to be in column one.
116ccf1c84d5 Uploaded v0.0.5
peterjc
parents:
diff changeset
72
116ccf1c84d5 Uploaded v0.0.5
peterjc
parents:
diff changeset
73 **What it does**
116ccf1c84d5 Uploaded v0.0.5
peterjc
parents:
diff changeset
74
116ccf1c84d5 Uploaded v0.0.5
peterjc
parents:
diff changeset
75 Draws a Venn Diagram for one, two or three sets (as a PDF file).
116ccf1c84d5 Uploaded v0.0.5
peterjc
parents:
diff changeset
76
116ccf1c84d5 Uploaded v0.0.5
peterjc
parents:
diff changeset
77 You must supply one, two or three sets of identifiers -- corresponding
116ccf1c84d5 Uploaded v0.0.5
peterjc
parents:
diff changeset
78 to one, two or three circles on the Venn Diagram.
116ccf1c84d5 Uploaded v0.0.5
peterjc
parents:
diff changeset
79
116ccf1c84d5 Uploaded v0.0.5
peterjc
parents:
diff changeset
80 In general you should also give the full list of all the identifiers
116ccf1c84d5 Uploaded v0.0.5
peterjc
parents:
diff changeset
81 explicitly. This is used to calculate the number of identifiers outside
116ccf1c84d5 Uploaded v0.0.5
peterjc
parents:
diff changeset
82 the circles (and check the identifiers in the other files match up).
116ccf1c84d5 Uploaded v0.0.5
peterjc
parents:
diff changeset
83 The full list can be omitted by implicitly taking the union of the
116ccf1c84d5 Uploaded v0.0.5
peterjc
parents:
diff changeset
84 category sets. In this case, the count outside the categories (circles)
116ccf1c84d5 Uploaded v0.0.5
peterjc
parents:
diff changeset
85 will always be zero.
116ccf1c84d5 Uploaded v0.0.5
peterjc
parents:
diff changeset
86
116ccf1c84d5 Uploaded v0.0.5
peterjc
parents:
diff changeset
87 The identifiers can be taken from the first column of a tabular file
116ccf1c84d5 Uploaded v0.0.5
peterjc
parents:
diff changeset
88 (e.g. query names in BLAST tabular output, or signal peptide predictions
116ccf1c84d5 Uploaded v0.0.5
peterjc
parents:
diff changeset
89 after filtering, etc.), or from a sequence file (FASTA, FASTQ, SFF).
116ccf1c84d5 Uploaded v0.0.5
peterjc
parents:
diff changeset
90
116ccf1c84d5 Uploaded v0.0.5
peterjc
parents:
diff changeset
91 For example, you may have a set of NGS reads (as a FASTA, FASTQ or SFF
116ccf1c84d5 Uploaded v0.0.5
peterjc
parents:
diff changeset
92 file), and the results of several different read mappings (e.g. to
116ccf1c84d5 Uploaded v0.0.5
peterjc
parents:
diff changeset
93 different references) as tabular files (filtered to have just the mapped
116ccf1c84d5 Uploaded v0.0.5
peterjc
parents:
diff changeset
94 reads). You could then show the different mappings (and their overlaps)
116ccf1c84d5 Uploaded v0.0.5
peterjc
parents:
diff changeset
95 as a Venn Diagram, and the outside count would be the unmapped reads.
116ccf1c84d5 Uploaded v0.0.5
peterjc
parents:
diff changeset
96
116ccf1c84d5 Uploaded v0.0.5
peterjc
parents:
diff changeset
97 **Citations**
116ccf1c84d5 Uploaded v0.0.5
peterjc
parents:
diff changeset
98
116ccf1c84d5 Uploaded v0.0.5
peterjc
parents:
diff changeset
99 The Venn Diagrams are drawn using Gordon Smyth's limma package from
116ccf1c84d5 Uploaded v0.0.5
peterjc
parents:
diff changeset
100 R/Bioconductor, http://www.bioconductor.org/
116ccf1c84d5 Uploaded v0.0.5
peterjc
parents:
diff changeset
101
116ccf1c84d5 Uploaded v0.0.5
peterjc
parents:
diff changeset
102 The R library is called from Python via rpy, http://rpy.sourceforge.net/
116ccf1c84d5 Uploaded v0.0.5
peterjc
parents:
diff changeset
103
116ccf1c84d5 Uploaded v0.0.5
peterjc
parents:
diff changeset
104 This tool uses Biopython to read SFF files. If you use this tool with
116ccf1c84d5 Uploaded v0.0.5
peterjc
parents:
diff changeset
105 SFF files in scientific work leading to a publication, please cite the
116ccf1c84d5 Uploaded v0.0.5
peterjc
parents:
diff changeset
106 Biopython application note:
116ccf1c84d5 Uploaded v0.0.5
peterjc
parents:
diff changeset
107
116ccf1c84d5 Uploaded v0.0.5
peterjc
parents:
diff changeset
108 Cock et al 2009. Biopython: freely available Python tools for computational
116ccf1c84d5 Uploaded v0.0.5
peterjc
parents:
diff changeset
109 molecular biology and bioinformatics. Bioinformatics 25(11) 1422-3.
116ccf1c84d5 Uploaded v0.0.5
peterjc
parents:
diff changeset
110 http://dx.doi.org/10.1093/bioinformatics/btp163 pmid:19304878.
116ccf1c84d5 Uploaded v0.0.5
peterjc
parents:
diff changeset
111
116ccf1c84d5 Uploaded v0.0.5
peterjc
parents:
diff changeset
112 </help>
116ccf1c84d5 Uploaded v0.0.5
peterjc
parents:
diff changeset
113 </tool>