annotate extract_genomic_dna.xml @ 0:cff5b7c9be55 draft

Uploaded
author greg
date Thu, 14 Jan 2016 07:55:22 -0500
parents
children 311febbd33d6
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
0
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
1 <tool id="Extract genomic DNA 1" name="Extract Genomic DNA" version="3.0.0">
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
2 <description>using coordinates from assembled/unassembled genomes</description>
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
3 <command>
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
4 <![CDATA[
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
5 #set input_format $input_format_cond.input_format
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
6 #set input $input_format_cond.input
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
7 #set dbkey = $input.metadata.dbkey
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
8 #set datatype = $input.datatype
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
9 mkdir -p output_dir &&
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
10 python $__tool_directory__/extract_genomic_dna.py
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
11 --input_format $input_format
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
12 --input "$input"
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
13 --dbkey $dbkey
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
14 #if str($input_format) == "gff":
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
15 --interpret_features $input_format_cond.interpret_features
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
16 #end if
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
17 #if isinstance($datatype, $__app__.datatypes_registry.get_datatype_by_extension('gff').__class__):
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
18 --columns "1,4,5,7"
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
19 #else:
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
20 --columns "${input.metadata.chromCol},${input.metadata.startCol},${input.metadata.endCol},${input.metadata.strandCol},${input.metadata.nameCol}"
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
21 #end if
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
22 --reference_genome_source $reference_genome_cond.reference_genome_source
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
23 #if str($reference_genome_cond.reference_genome_source) == "cached"
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
24 --reference_genome $reference_genome_cond.reference_genome.fields.path
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
25 #else:
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
26 --reference_genome $reference_genome_cond.reference_genome
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
27 #end if
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
28 --output_format $output_format
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
29 --output $output
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
30 ]]>
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
31 </command>
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
32 <inputs>
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
33 <conditional name="input_format_cond">
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
34 <param name="input_format" type="select" label="Input file format">
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
35 <option value="gff" selected="True">Gff</option>
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
36 <option value="interval">Interval</option>
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
37 </param>
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
38 <when value="gff">
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
39 <param name="input" type="data" format="gff" label="Fetch sequences for intervals in">
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
40 <validator type="unspecified_build" />
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
41 </param>
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
42 <param name="interpret_features" type="select" label="Interpret features when possible">
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
43 <option value="yes">Yes</option>
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
44 <option value="no">No</option>
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
45 </param>
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
46 </when>
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
47 <when value="interval">
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
48 <param name="input" type="data" format="interval" label="Fetch sequences for intervals in">
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
49 <validator type="unspecified_build" />
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
50 </param>
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
51 </when>
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
52 </conditional>
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
53 <conditional name="reference_genome_cond">
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
54 <param name="reference_genome_source" type="select" label="Choose the source for the reference genome">
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
55 <option value="cached">locally cached</option>
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
56 <option value="history">from history</option>
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
57 </param>
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
58 <when value="cached">
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
59 <param name="reference_genome" type="select" label="Using reference genome">
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
60 <options from_data_table="alignseq_seq">
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
61 <filter type="data_meta" key="dbkey" ref="input" column="dbkey"/>
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
62 </options>
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
63 <validator type="no_options" message="A built-in reference genome is not available for the build associated with the selected input file"/>
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
64 </param>
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
65 </when>
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
66 <when value="history">
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
67 <param name="reference_genome" type="data" format="fasta" label="Using reference genome">
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
68 <options>
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
69 <filter type="data_meta" key="dbkey" ref="input_bam" />
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
70 </options>
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
71 <validator type="no_options" message="The current history does not include a fasta dataset with the build associated with the selected input file"/>
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
72 </param>
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
73 </when>
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
74 </conditional>
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
75 <param name="output_format" type="select" label="Select output format">
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
76 <option value="fasta" selected="True">fasta</option>
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
77 <option value="interval">interval</option>
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
78 </param>
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
79 </inputs>
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
80 <outputs>
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
81 <data name="output" format="gff">
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
82 <change_format>
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
83 <when output_format="interval" format="interval" />
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
84 </change_format>
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
85 </data>
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
86 </outputs>
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
87 <tests>
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
88 <test>
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
89 <param name="input" value="1.bed" dbkey="hg17" ftype="bed" />
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
90 <param name="interpret_features" value="yes"/>
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
91 <param name="index_source" value="cached"/>
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
92 <param name="out_format" value="fasta"/>
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
93 <output name="out_file1">
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
94 <assert_contents>
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
95 <!-- First few lines... -->
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
96 <has_text text=">hg17_chr1_147962192_147962580_- CCDS989.1_cds_0_0_chr1_147962193_r" />
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
97 <has_text text="ACTTGATCCTGCTCCCTCGGTGTCTGCATTGACTCCTCATGCTGGGACTG" />
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
98 <has_text text="GACCCGTCAACCCCCCTGCTCGCTGCTCACGTACCTTCATCACTTTTAGT" />
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
99 <has_text text="GATGATGCAACTTTCGAGGAATGGTTCCCCCAAGGGCGGCCCCCAAAAGT" />
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
100 <!-- Last few lines... -->
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
101 <has_text text="GCTGTGGCACAGAACATGGACTCTGTGTTTAAGGAGCTCTTGGGAAAGAC" />
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
102 <has_text text="CTCTGTCCGCCAGGGCCTTGGGCCAGCATCTACCACCTCTCCCAGTCCTG" />
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
103 <has_text text="GGCCCCGAAGCCCAAAGGCCCCGCCCAGCAGCCGCCTGGGCAGGAACAAA" />
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
104 <has_text text="GGCTTCTCCCGGGGCCCTGGGGCCCCAGCCTCACCCTCAGCTTCCCACCC" />
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
105 <has_text text="CCAGGGCCTAGACACGACCCCCAAGCCACACTGA" />
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
106 </assert_contents>
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
107 </output>
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
108 </test>
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
109 <test>
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
110 <param name="input" value="droPer1.bed" dbkey="droPer1" ftype="bed" />
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
111 <param name="interpret_features" value="yes"/>
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
112 <param name="index_source" value="cached"/>
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
113 <param name="out_format" value="fasta"/>
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
114 <output name="out_file1" file="extract_genomic_dna_out2.fasta" />
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
115 </test>
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
116 <test>
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
117 <param name="input" value="1.bed" dbkey="hg17" ftype="bed" />
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
118 <param name="interpret_features" value="yes"/>
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
119 <param name="index_source" value="cached"/>
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
120 <param name="out_format" value="interval"/>
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
121 <output name="out_file1" file="extract_genomic_dna_out3.interval" />
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
122 </test>
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
123 <!-- Test GFF file support. -->
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
124 <test>
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
125 <param name="input" value="gff_filter_by_attribute_out1.gff" dbkey="mm9" ftype="gff" />
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
126 <param name="interpret_features" value="no"/>
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
127 <param name="index_source" value="cached"/>
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
128 <param name="out_format" value="interval"/>
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
129 <output name="out_file1" file="extract_genomic_dna_out4.gff" />
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
130 </test>
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
131 <test>
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
132 <param name="input" value="gff_filter_by_attribute_out1.gff" dbkey="mm9" ftype="gff" />
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
133 <param name="interpret_features" value="no"/>
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
134 <param name="out_format" value="fasta"/>
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
135 <param name="index_source" value="cached"/>
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
136 <output name="out_file1" file="extract_genomic_dna_out5.fasta" />
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
137 </test>
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
138 <!-- Test custom sequences support and GFF feature interpretation. -->
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
139 <test>
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
140 <param name="input" value="cufflinks_out1.gtf" dbkey="mm9" ftype="gff" />
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
141 <param name="interpret_features" value="no"/>
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
142 <param name="index_source" value="history"/>
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
143 <param name="ref_file" value="tophat_in1.fasta"/>
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
144 <param name="out_format" value="fasta"/>
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
145 <output name="out_file1" file="extract_genomic_dna_out6.fasta" />
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
146 </test>
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
147 <test>
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
148 <param name="input" value="cufflinks_out1.gtf" dbkey="mm9" ftype="gff" />
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
149 <param name="interpret_features" value="yes"/>
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
150 <param name="index_source" value="history"/>
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
151 <param name="ref_file" value="tophat_in1.fasta"/>
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
152 <param name="out_format" value="fasta"/>
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
153 <output name="out_file1" file="extract_genomic_dna_out7.fasta" />
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
154 </test>
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
155 </tests>
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
156 <help>
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
157
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
158 .. class:: warningmark
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
159
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
160 The following will cause a line from the input dataset to be skipped and a warning generated.
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
161
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
162 - Sequences that fall outside of the range of a line's start and end coordinates.
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
163 - Chromosome start or end coordinates that are invalid for the specified build.
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
164
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
165 -----
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
166
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
167 **What it does**
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
168
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
169 This tool uses coordinate, strand, and build information to fetch genomic DNA from gff data, producing fasta data.
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
170
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
171 -----
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
172
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
173 **Example**
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
174
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
175 If the input dataset is::
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
176
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
177 chr7 127475281 127475310 NM_000230 0 +
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
178 chr7 127485994 127486166 NM_000230 0 +
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
179 chr7 127486011 127486166 D49487 0 +
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
180
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
181 Extracting sequences returns::
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
182
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
183 &gt;hg17_chr7_127475281_127475310_+ NM_000230
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
184 GTAGGAATCGCAGCGCCAGCGGTTGCAAG
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
185 &gt;hg17_chr7_127485994_127486166_+ NM_000230
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
186 GCCCAAGAAGCCCATCCTGGGAAGGAAAATGCATTGGGGAACCCTGTGCG
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
187 GATTCTTGTGGCTTTGGCCCTATCTTTTCTATGTCCAAGCTGTGCCCATC
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
188 CAAAAAGTCCAAGATGACACCAAAACCCTCATCAAGACAATTGTCACCAG
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
189 GATCAATGACATTTCACACACG
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
190 &gt;hg17_chr7_127486011_127486166_+ D49487
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
191 TGGGAAGGAAAATGCATTGGGGAACCCTGTGCGGATTCTTGTGGCTTTGG
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
192 CCCTATCTTTTCTATGTCCAAGCTGTGCCCATCCAAAAAGTCCAAGATGA
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
193 CACCAAAACCCTCATCAAGACAATTGTCACCAGGATCAATGACATTTCAC
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
194 ACACG
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
195
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
196 </help>
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
197 <citations>
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
198 <citation type="bibtex">
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
199 @unpublished{None,
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
200 author = {},
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
201 title = {None},
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
202 year = {None},
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
203 eprint = {None},
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
204 url = {http://www.bx.psu.edu/~anton/labSite/}
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
205 }</citation>
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
206 </citations>
cff5b7c9be55 Uploaded
greg
parents:
diff changeset
207 </tool>