annotate gemini_annotate.xml @ 0:c30f03974122 draft

planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
author iuc
date Tue, 29 Dec 2015 10:22:54 -0500
parents
children 54f607ff195b
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
0
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
1 <tool id="gemini_@BINARY@" name="GEMINI @BINARY@" version="@VERSION@.0">
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
2 <description>adding your own custom annotations</description>
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
3 <macros>
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
4 <import>gemini_macros.xml</import>
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
5 <token name="@BINARY@">annotate</token>
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
6 </macros>
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
7 <expand macro="requirements" />
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
8 <expand macro="stdio" />
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
9 <expand macro="version_command" />
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
10 <command>
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
11 <![CDATA[
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
12
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
13 bgzip -c "${annotate_source}" > tabixed.gz &&
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
14 tabix -p bed tabixed.gz &&
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
15
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
16 gemini @BINARY@
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
17 -f tabixed.gz
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
18 -c $column_name
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
19 -a $a.a_selector
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
20 #if $a.a_selector == 'extract':
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
21 -t $a.column_type
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
22 -e $a.column_extracts
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
23 -o $a.operation
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
24 #end if
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
25 $region_only
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
26 "${ infile }"
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
27 > "${ outfile }"
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
28 ]]>
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
29
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
30 </command>
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
31 <inputs>
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
32 <expand macro="infile" />
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
33 <param name="annotate_source" type="data" format="bed" label="File containing the annotations in BED format" help="(-f)"/>
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
34
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
35 <param name="column_name" type="text" value=""
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
36 label="The name of the column to be added to the variant table"
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
37 help=" If the input file is a VCF, then this is the name of the info field to pull. (-c)">
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
38 <sanitizer invalid_char=" ">
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
39 <valid initial="string.letters,string.digits">
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
40 <add value="_" />
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
41 </valid>
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
42 </sanitizer>
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
43 </param>
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
44 <conditional name="a">
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
45 <param name="a_selector" type="select" label="How should the annotation file be used?" help="(-a)">
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
46 <option value="boolean">Did a variant overlap a region or not? (boolean)</option>
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
47 <option value="count">How many regions did a variant overlap? (count)</option>
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
48 <option value="extract" selected="True">Extract specific values from a BED file. (extract)</option>
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
49 </param>
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
50 <when value="extract">
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
51
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
52 <param name="column_extracts" label="Column to extract information from for list annotations"
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
53 type="data_column" data_ref="annotate_source" force_select="true" help="(-e)"/>
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
54
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
55
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
56 <param name="column_type" type="select" label="What data type(s) should be used to represent the new values in the database?"
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
57 help="(-t)">
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
58 <option value="float">Decimal precision number (float)</option>
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
59 <option value="integer">Integer number (integer)</option>
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
60 <option value="text">Text columns such as “valid”, “yes” (text)</option>
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
61 </param>
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
62
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
63 <param name="operation" type="select" label="Operation to apply to the extract column values ..."
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
64 help="in the event that a variant overlaps multiple annotations in your annotation file. (-o)">
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
65 <option value="mean">Compute the average of the (numeric) values</option>
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
66 <option value="sum">Compute the sum of the (numeric) values</option>
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
67 <option value="median">Compute the median of the (numeric) values</option>
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
68 <option value="min">Compute the minimum of the (numeric) values</option>
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
69 <option value="max">Compute the maximum of the (numeric) values</option>
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
70 <option value="mode">Compute the mode (most frequent) of the (numeric) values</option>
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
71 <option value="first">Use the value from the first record in the annotation file</option>
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
72 <option value="last">Use the value from the last record in the annotation file</option>
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
73 <option value="list">Create a comma-separated list of the observed (text) values</option>
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
74 <option value="uniq_list">Create a comma-separated list of non-redundant observed (text) values</option>
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
75 </param>
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
76
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
77 </when>
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
78 <when value="boolean"/>
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
79 <when value="count"/>
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
80 </conditional>
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
81 <param name="region_only" argument="--region-only" type="boolean" checked="false"
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
82 truevalue="--region-only" falsevalue=""
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
83 label="If set, only region coordinates will be considered when annotating variants."
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
84 help="The default is to annotate using region coordinates as well as REF and ALT
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
85 variant values. This option is only valid if annotation is a VCF file"/>
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
86 </inputs>
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
87 <outputs>
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
88 <data name="outfile" format="tabular" />
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
89 </outputs>
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
90 <tests>
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
91 <test>
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
92 <param name="infile" value="gemini_annotate_input.db" ftype="gemini.sqlite" />
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
93 <param name="annotate_source" value="anno.bed" />
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
94 <param name="a_selector" value="count" />
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
95 <param name="column_name" value="anno5" />
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
96 <output name="outfile" file="gemini_annotate_result.tabular" />
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
97 </test>
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
98 </tests>
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
99 <help><![CDATA[
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
100 **What it does**
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
101
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
102 It is inevitable that researchers will want to enhance the GEMINI framework with their own, custom annotations. GEMINI provides a sub-command called annotate for exactly this purpose.
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
103
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
104 **Details**
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
105
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
106 It is inevitable that researchers will want to enhance the GEMINI framework with their own, custom annotations. GEMINI provides a sub-command called annotate for exactly this purpose. As long as you provide a tabix'ed annotation file in BED or VCF format, the annotate tool will, for each variant in the variants table, screen for overlaps in your annotation file and update one or more new columns in the variants table that you may specify on the command line. This is best illustrated by the following **example**.
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
107
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
108 **Input files**
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
109
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
110 Let’s assume you have already created a GEMINI database of a **VCF file** using the *load module*.
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
111
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
112 Now, let’s imagine you have an annotated file in **BED format** (important.bed) that describes regions of the genome that are particularly relevant to your lab’s research. You would like to annotate in the GEMINI database which variants overlap these crucial regions. We want to store this knowledge in a new column in the variants table called important_variant that tracks whether a given variant overlapped (1) or did not overlap (0) intervals in your annotation file.
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
113
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
114 *To do this, you must first TABIX your BED file*
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
115
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
116 **-a boolean - Did a variant overlap a region or not?**
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
117
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
118 Now, you can use this *TABIX*’ed file to annotate which variants overlap your important regions. In the example below, the results will be stored in a new column called “important”. The **-a boolean** option says that you just want to track whether (1) or not (0) the variant overlapped one or more of your regions.
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
119
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
120 Since a new column has been created in the database, we can now directly query the new column. In the example results below, the first and third variants overlapped a crucial region while the second did not::
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
121
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
122 chr22 100 101 1 1
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
123 chr22 200 201 2 0
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
124 chr22 300 500 3 1
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
125
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
126 **-a count - How many regions did a variant overlap?**
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
127
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
128 Instead of a simple yes or no, we can use the **-a count** option to count how many important regions a variant overlapped. It turns out that the 3rd variant actually overlapped two important regions::
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
129
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
130 chr22 100 101 1 1
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
131 chr22 200 201 2 0
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
132 chr22 300 500 3 2
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
133
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
134 **-a extract - Extract specific values from a BED file**
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
135
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
136 Lastly, we may also extract values from specific fields in a BED file (or from the INFO field in a VCF) and populate one or more new columns in the database based on overlaps with the annotation file and the values of the fields therein. To do this, we use the **-a extract** option.
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
137
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
138 This is best described with an example. To set this up, let’s imagine that we have a VCF file from a different experiment and we want to annotate the variants in our GEMINI database with the allele frequency and depth tags from the INFO fields for the same variants in this other VCF file.
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
139
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
140 Now that we have a proper *TABIX*’ed VCF file, we can use the **-a extract** option to populate new columns in the GEMINI database. In order to do so, we must specify:
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
141
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
142 1) its type (e.g., text, integer, float) (**-t**)
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
143 2) the field in the INFO column of the VCF file that we should use to extract data with which to populate the new column (**-e**)
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
144 3) what operation should be used to summarize the data in the event of multiple overlaps in the annotation file (**-o**)
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
145 4) (optionally) the name of the column we want to add (**-c**), if this is not specified, it will use the value from **-e**.
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
146
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
147 For example, let’s imagine we want to create a new column called “other_allele_freq” (**-c**) using the AF field in our VCF file to populate it.
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
148
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
149 This creates a new column in my.db called other_allele_freq and this new column will be a FLOAT (**-t float**). In the event of multiple records in the VCF file overlapping a variant in the database, the average (**-o mean**) of the allele frequency values from the VCF file will be used.
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
150
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
151 At this point, one can query the database based on the values of the new other_allele_freq column (using **GEMINI query**).
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
152
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
153 **-t TYPE - Specifying the column type(s) when using -a extract**
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
154
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
155 The annotate tool will create three different types of columns via the **-t** option:
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
156
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
157 1) Floating point columns for annotations with decimal precision as above (-t float)
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
158 2) Integer columns for integral annotations (-t integer)
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
159 3) Text columns for string columns such as “valid”, “yes”, etc. (-t text)
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
160
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
161 *The -t option is only valid when using the -a extract option.*
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
162
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
163 **-o OPERATION - Specifying the summary operations when using -a extract**
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
164
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
165 In the event of multiple overlaps between a variant and records in the annotation file, the annotate tool can summarize the values observed with multiple options:
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
166
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
167 - -o mean Compute the average of the values. They must be numeric.
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
168 - -o median Compute the median of the values. They must be numeric.
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
169 - -o min Compute the minimum of the values. They must be numeric.
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
170 - -o max Compute the maximum of the values. They must be numeric.
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
171 - -o mode Compute the mode (the most frequently observed value) of the values. They must be numeric.
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
172 - -o first Use the value from the first record in the annotation file.
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
173 - -o last Use the value from the last record in the annotation file.
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
174 - -o list Create a comma-separated list of the observed values.
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
175 - -o uniq_list Create a comma-separated list of the distinct observed values.
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
176 - -o sum Compute the sum of the values. They must be numeric.
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
177
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
178 *The -o option is only valid when using the -a extract option.*
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
179
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
180 **Annotating with VCF**
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
181
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
182 Most of the examples to this point have pulled a column from a tabix indexed BED file. It is likewise possible to pull from the INFO field of a tabix indexed VCF. The syntax is identical, but the **-e** option will specify the names of the fields in the INFO column to pull. By default, those field names will also be used as the names of the new columns, but different column names can still be specified with the **-c** option.
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
183
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
184 To put a DP column in the db, set:
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
185
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
186 -o list, -e DP, -t integer
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
187
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
188 ... and name it 'depth', set:
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
189
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
190 -o list, -e DP, -c depth, -t integer
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
191
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
192
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
193 Missing values are allowed since we expect that in some cases an annotation VCF will not have all INFO fields specified for all variants.
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
194
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
195 *We recommend decomposing and normalizing variants before annotating. For a detailed explanation of how to do this, see "Step 1. split, left-align, and trim variants" on the GEMINI* preprocessing_ *website.*
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
196
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
197 **Extracting and populating multiple columns at once**
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
198
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
199 One can also extract and populate multiple columns at once by providing comma-separated lists (no spaces) of column names (**-c**), types (**-t**), column numbers (**-e**), and summary operations (**-o**). For example, recall that in the VCF example above, we created a *TABIX*’ed BED file containing the allele frequency and depth values from the INFO field as the 4th and 5th columns in the BED, respectively.
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
200
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
201 Instead of running the annotate tool twice (once for each column), we can run the tool once and load both columns in the same run. For example with settings:
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
202
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
203 - -a extract
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
204 - -c other_allele_freq,other_depth
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
205 - -t float,integer
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
206 - -e 4,5
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
207 - -o mean,max
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
208
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
209 We can then use each of the new columns to filter variants with a **GEMINI query**.
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
210
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
211 .. _preprocessing: https://gemini.readthedocs.org/en/latest/content/preprocessing.html#preprocess
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
212
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
213 ]]></help>
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
214 <expand macro="citations"/>
c30f03974122 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/gemini commit e88029bb12e5262687267293f9d2a694eb00d3f0-dirty
iuc
parents:
diff changeset
215 </tool>