comparison pick_open_reference_otus.xml @ 0:c1bd0c560018 draft default tip

planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/qiime commit bcbe76277f3e60303faf826f8ce7f018bc663a9a-dirty
author bebatut
date Tue, 02 Feb 2016 05:50:37 -0500
parents
children
comparison
equal deleted inserted replaced
-1:000000000000 0:c1bd0c560018
1 <tool id="pick_open_reference_otus" name="Perform open-reference OTU picking"
2 version="1.9.1">
3
4 <description></description>
5
6 <macros>
7 <import>macros.xml</import>
8 </macros>
9
10 <expand macro="requirements" />
11
12 <version_command><![CDATA[
13 pick_open_reference_otus.py --version
14 ]]></version_command>
15
16 <command><![CDATA[
17 pick_open_reference_otus.py
18
19 -i $input_seq_files
20
21 -o otus
22
23 -m $otu_picking_method
24
25 #if str( $reference_sequences.reference_sequences_selector ) == 'history'
26 #set $ref = $reference_sequences.history_database
27 #else:
28 #set $data_table = dict([(_[0], _[2]) for _ in $reference_sequences.cached_database.input.options.tool_data_table.data])
29 #set $db = $reference_sequences.cached_database.value
30 #set $ref = $data_table[$db]
31 #end if
32 -r $ref
33
34 #if $prefilter_refseqs_fp.difference_test
35 #if str( $prefilter_refseqs_fp.prefilter_reference_sequences.reference_sequences_selector ) == 'history'
36 #set $ref = $prefilter_refseqs_fp.prefilter_reference_sequences.history_database
37 #else:
38 #set $data_table = dict([(_[0], _[2]) for _ in $prefilter_refseqs_fp.prefilter_reference_sequences.cached_database.input.options.tool_data_table.data])
39 #set $db = $prefilter_refseqs_fp.prefilter_reference_sequences.cached_database.value
40 #set $ref = $data_table[$db]
41 #end if
42 --prefilter_refseqs_fp $ref
43 #end if
44
45 -n $new_ref_set_id
46
47 $parallel
48 -O "\${GALAXY_SLOTS:-4}"
49
50 -s $percent_subsample
51 --prefilter_percent_id $prefilter_percent_id
52
53 #if str($step1_otu_map_fp) != 'None':
54 --step1_otu_map_fp $step1_otu_map_fp
55 #end if
56
57 #if str($step1_failures_fasta_fp) != 'None':
58 --step1_failures_fasta_fp=$step1_failures_fasta_fp
59 #end if
60
61 --minimum_failure_threshold $minimum_failure_threshold
62
63 $suppress_step4
64
65 --min_otu_size $min_otu_size
66
67 $suppress_taxonomy_assignment
68 $suppress_align_and_tree
69
70 &&
71
72 biom convert
73 -i otus/otu_table_mc2.biom
74 -o $output_otu_table
75 --to-tsv
76 --header-key taxonomy
77
78 #if not $suppress_taxonomy_assignment
79 &&
80 biom convert
81 -i otus/otu_table_mc2_w_tax.biom
82 -o $output_otu_table_taxonomy
83 --to-tsv
84 --header-key taxonomy
85 #end if
86
87 #if not $suppress_align_and_tree
88 &&
89 biom convert
90 -i otus/otu_table_mc_no_pynast_failures.biom
91 -o $output_otu_table_no_failures
92 --to-tsv
93 --header-key taxonomy
94 #end if
95
96 ]]>
97 </command>
98
99 <inputs>
100 <param name="input_seq_files" type="data" format="fasta,fastq"
101 label="Input sequence files" multiple="True" help="(-i/--input_fps)"/>
102
103 <param name="otu_picking_method" label="The OTU picking method to use for
104 reference and de novo steps" type="select"
105 help="-m/--otu_picking_method">
106 <option value="uclust" selected="True">uclust</option>
107 <option value="usearch61">usearch61</option>
108 <option value="sortmerna_sumaclust">sortmerna_sumaclust</option>
109 </param>
110
111 <conditional name="reference_sequences">
112 <param name="reference_sequences_selector" type="select"
113 label="Reference sequences to query"
114 help="(-r, --reference_fp)">
115 <option value="cached" selected="True">Public databases</option>
116 <option value="history">Databases from your history</option>
117 </param>
118 <when value="cached">
119 <param name="cached_database" label="QIIME databases of reference
120 sequences" type="select">
121 <options from_data_table="qiime_reference_db" />
122 </param>
123 </when>
124 <when value="history">
125 <param name="history_database" type="data" format="fasta"
126 label="Reference databases"/>
127 </when>
128 </conditional>
129
130 <conditional name="prefilter_refseqs_fp">
131 <param name="difference_test" type="boolean" label="Use different
132 reference sequences for the prefilter?" checked="False" truevalue="true"
133 falsevalue="false" help="(--prefilter_refseqs_fp)" />
134 <when value="true">
135 <conditional name="prefilter_reference_sequences">
136 <param name="reference_sequences_selector" type="select"
137 label="Reference sequences to query" >
138 <option value="cached" selected="True">Public databases</option>
139 <option value="history">Databases from your history</option>
140 </param>
141 <when value="cached">
142 <param name="cached_database" label="QIIME databases of reference
143 sequences" type="select">
144 <options from_data_table="qiime_reference_db" />
145 </param>
146 </when>
147 <when value="history">
148 <param name="history_database" type="data" format="fasta"
149 label="Reference databases"/>
150 </when>
151 </conditional>
152 </when>
153 <when value="false" />
154 </conditional>
155
156 <param name="new_ref_set_id" type="text" value="New" label="Unique
157 identifier for OTUs that get created in this ref set"
158 help="This is useful to support combining of reference sets
159 (-n/--new_ref_set_id)"/>
160
161 <param name="parallel" type="boolean" label="Run in parallel where
162 available?" truevalue="--parallel" falsevalue="" checked="False"
163 help="(-a, --parallel)" />
164
165 <param name="percent_subsample" type="float" value="0.001" min="0" max="1"
166 label="Percent of failure sequences to include in the subsample to
167 cluster de novo" help="Large numbers should give more comprehensive
168 results but will be slower(-s/--percent_subsample)"/>
169
170 <param name="prefilter_percent_id" type="float" value="0.0" min="0" max="1"
171 label="Percent of sequence pre-cluster against the reference"
172 help="Any reads which fail to hit are discarded (a quality filter)
173 (--prefilter_percent_id)"/>
174
175 <param name="step1_otu_map_fp" type="data" format="txt" label="Reference
176 OTU picking OTU map to avoid rebuilding if one has already been built
177 (optional)" optional="True" help="This must be an OTU map generated
178 by this workflow, not (for example) by pick_closed_reference_otus
179 (--step1_otu_map_fp)" />
180
181 <param name="step1_failures_fasta_fp" type="data" format="fasta"
182 label="Reference OTU picking failures fasta filepath, to avoid
183 rebuilding if one has already been built (optional)" optional="True"
184 help="This must be a failures file generated by this workflow, not
185 (for example) by pick_closed_reference_otus (--step1_failures_fasta_fp)" />
186
187 <param name="minimum_failure_threshold" type="integer" value="100000"
188 label="Minimum number of sequences that must fail to hit the reference
189 for subsampling to be performed" help="If fewer than this number of
190 sequences fail to hit the reference, the de novo clustering step will
191 run serially rather than invoking the subsampled open reference approach
192 to improve performance (--minimum_failure_threshold)"/>
193
194 <param name="suppress_step4" type="boolean" label="Suppress the final de
195 novo OTU picking step?" truevalue="--suppress_step4" falsevalue=""
196 checked="False" help="It may be necessary for extremely large data
197 sets(--suppress_step4)" />
198
199 <param name="min_otu_size" type="integer" value="2" label="Minimum otu
200 size to retain the OTU" help="(--min_otu_size)"/>
201
202 <param name="suppress_taxonomy_assignment" type="boolean"
203 label="Skip the taxonomy assignment step?"
204 truevalue="--suppress_taxonomy_assignment" falsevalue=""
205 checked="False" help="It results in an OTU table without taxonomy
206 (--suppress_taxonomy_assignment)" />
207
208 <param name="suppress_align_and_tree" type="boolean"
209 label="Skip the sequence alignment and tree-building steps?"
210 truevalue="--suppress_align_and_tree" falsevalue=""
211 checked="False" help="(--suppress_align_and_tree)" />
212 </inputs>
213
214 <outputs>
215 <data name="output_rep_set" format="fasta"
216 from_work_dir="otus/rep_set.fna"
217 label="${tool.name} on ${on_string}: OTU representative sequences"/>
218 <data name="output_ref_set" format="fasta"
219 from_work_dir="otus/new_refseqs.fna"
220 label="${tool.name} on ${on_string}: New reference sequences (OTU +
221 input reference sequences)"/>
222 <data name="output_otu_table" format="tsv"
223 label="${tool.name} on ${on_string}: OTU table"/>
224 <data name="output_otu_table_taxonomy" format="tsv"
225 label="${tool.name} on ${on_string}: OTU table with taxonomy">
226 <filter>suppress_taxonomy_assignment is False</filter>
227 </data>
228 <data name="output_otu_table_no_failures" format="tsv"
229 label="${tool.name} on ${on_string}: OTU without sequences that
230 failed to align">
231 <filter>suppress_align_and_tree is False</filter>
232 </data>
233 <data name="output_otu_map" format="txt"
234 from_work_dir="otus/final_otu_map_mc2.txt"
235 label="${tool.name} on ${on_string}: OTU map"/>
236 <data name="output_rep_set_tree" format="txt"
237 from_work_dir="otus/rep_set.tre"
238 label="${tool.name} on ${on_string}: representative set tree">
239 <filter>suppress_align_and_tree is False</filter>
240 </data>
241 </outputs>
242
243 <tests>
244 <test>
245 <param name="input_seq_files"
246 value="split_fastq_libraries_sequences.fasta"/>
247 <param name="otu_picking_method" value="uclust"/>
248 <param name="reference_sequences_selector" value="history"/>
249 <param name="history_database" value="gg_13_8_97_otus.fasta"/>
250 <param name="difference_test" value="false"/>
251 <param name="new_ref_set_id" value="New" />
252 <param name="parallel" value="--parallel"/>
253 <param name="percent_subsample" value="0.001" />
254 <param name="prefilter_percent_id" value="0.0" />
255 <param name="minimum_failure_threshold" value="100000" />
256 <param name="suppress_step4" value=""/>
257 <param name="min_otu_size" value="2" />
258 <param name="suppress_taxonomy_assignment" value="" />
259 <param name="suppress_align_and_tree" value="" />
260
261 <output name="output_rep_set"
262 value="pick_open_reference_otus_representative_sequences.fasta"/>
263 <output name="output_ref_set"
264 value="pick_open_reference_otus_reference_sequences.fasta"/>
265 <output name="output_otu_table"
266 value="pick_open_reference_otus_otu_table.txt"/>
267 <output name="output_otu_table_taxonomy"
268 value="pick_open_reference_otus_otu_table_with_taxo.txt" />
269 <output name="output_otu_map"
270 value="pick_open_reference_otus_otu_map.txt"/>
271 <output name="output_otu_table_no_failures"
272 value="pick_open_reference_otus_otu_table_with_taxo_without_pynast_failure.txt" />
273 <output name="output_rep_set_tree"
274 value="pick_open_reference_otus_representative_set_tree.txt" />
275 </test>
276 </tests>
277
278 <help><![CDATA[
279
280 **What it does**
281
282 This tool performs open-reference OTU picking from sequences.
283
284 This script is broken down into 4 possible OTU picking steps, and 2 steps
285 involving the creation of OTU tables and trees.
286
287 More information about this tool is available on
288 `QIIME documentation <http://qiime.org/scripts/pick_open_reference_otus.html>`_.
289 ]]>
290 </help>
291
292 <citations>
293 <expand macro="citations" />
294 </citations>
295 </tool>