comparison disco.xml @ 0:3c16cb5b2b5b draft

planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/disco/ commit c1327b5793477da611684e92e0ce4635370c7666
author iuc
date Fri, 03 Nov 2017 15:44:00 -0400
parents
children 56b0772e3379
comparison
equal deleted inserted replaced
-1:000000000000 0:3c16cb5b2b5b
1 <tool id="disco" name="DISCO" version="@WRAPPER_VERSION@.0">
2 <description>to assemble metagenomics data using an overlap-layout-consensus (OLC) approach</description>
3 <macros>
4 <token name="@WRAPPER_VERSION@">1.2</token>
5 <xml name="assembly_params"> <!-- Per-iteration assembly settings; expanded once inside each of the first/second/third_assembly_iter_param sections, so every parameter below exists three times under a different section name. -->
6 <param argument="minSequenceLengthTobePrinted" type="integer" value="1000" min="0" label="Minimum length of contigs or scaffolds to be printed"/>
7 <param argument="MinOverlap4SimplifyGraph" type="integer" value="30" min="0" label="Minimum overlap length (bp) required to keep an edge between two reads during graph simplification" help="This minimum overlap length must be equal to 30 or larger than the MinOverlap4BuildGraph above. This allows you to try different minimum overlap lengths for assembly without redoing assembly graph construction. Edges with shorter overlap length than this parameter will be ignored during graph simplification. Increase this to reduce N50 and mis-assemblies"/>
8 <param argument="minOverlapDifference4ClipBranches" type="integer" value="25" min="0" label="Minimum overlap length difference (bp) to clip branches" help="If a read has multiple edges, Disco clips the branches with overlap lengths less than the largest overlap of this read by this difference or more. Increase this to reduce N50 and mis-assemblies"/>
9 <param argument="minUniquePEsupport" type="integer" value="3" min="0" label="Minimum number of paired-end reads that provide unique support to merge two edges" help="Increase this to reduce N50 and mis-assemblies"/>
10 <param argument="minNonUniquePEsupport" type="integer" value="0" min="0" label="Minimum number of paired-end reads that provide non-unique support to merge two edges"/>
11 <param argument="minReadsCountInEdgeToBeNotDeadEnd" type="integer" value="10" min="0" label="Minimum number of reads in an edge to be not dead-end edge"/>
12 <param argument="minEdgeLengthToBeNotDeadEnd" type="integer" value="1000" min="0" label="Minimum edge length (bp) to be not dead-end edge"/>
13 <param argument="minFoldToBeShortBranch" type="integer" value="5" min="0" label="Minimum fold difference between two branches' lengths to consider a branch to be short"/>
14 <param argument="minReadsCountToHave0Flow" type="integer" value="15" min="0" label="Minimum number of reads for an edge to be kept even if it has 0 flow"/>
15 <param argument="minEdgeLengthToHave0Flow" type="integer" value="1500" min="0" label="Minimum edge length for an edge to be kept even if it has 0 flow"/>
16 <param argument="minReadsCountInEdgeToBe1MinFlow" type="integer" value="20" min="0" label="Minimum number of reads in an edge to be assigned with 1 minimum flow"/>
17 <param argument="minEdgeLengthToBe1MinFlow" type="integer" value="2000" min="0" label="Minimum edge length to be assigned with 1 minimum flow"/>
18 </xml>
19 </macros>
20 <requirements>
21 <requirement type="package" version="@WRAPPER_VERSION@">disco</requirement>
22 </requirements>
23 <version_command>runDisco.sh --version</version_command>
24 <command detect_errors="exit_code"><![CDATA[
25 runDisco.sh
26 -n \${GALAXY_SLOTS:-4}
27 -m \${DISCO_MAX_MEMORY:-4}
28 -d .
29 -o disco
30 #if $input.library_type == "single"
31 -inS '$input.inS'
32 #else
33 #if $input.paired_input.type == "separated"
34 -in1 '$input.paired_input.in1'
35 -in2 '$input.paired_input.in2'
36 #else
37 -inP '$input.paired_input.inP'
38 #end if
39 #end if
40 $obg
41 $osg
42 -p '$first_assembly_iteration_params'
43 -p2 '$second_assembly_iteration_params'
44 -p3 '$third_assembly_iteration_params'
45 ]]></command>
46 <configfiles>
47 <configfile name="first_assembly_iteration_params">
48 <![CDATA[
49 MinOverlap4BuildGraph = $MinOverlap4BuildGraph
50 PrintContigs = true
51 PrintScaffolds = true
52 PrintUnused = $PrintUnused
53 PrintGFA = $PrintGFA
54 PrintGFA2 = $PrintGFA2
55 minSequenceLengthTobePrinted = $first_assembly_iter_param.minSequenceLengthTobePrinted
56 MinOverlap4SimplifyGraph = $first_assembly_iter_param.MinOverlap4SimplifyGraph
57 minOverlapDifference4ClipBranches = $first_assembly_iter_param.minOverlapDifference4ClipBranches
58 minUniquePEsupport = $first_assembly_iter_param.minUniquePEsupport
59 minNonUniquePEsupport = $first_assembly_iter_param.minNonUniquePEsupport
60 minReadsCountInEdgeToBeNotDeadEnd = $first_assembly_iter_param.minReadsCountInEdgeToBeNotDeadEnd
61 minEdgeLengthToBeNotDeadEnd = $first_assembly_iter_param.minEdgeLengthToBeNotDeadEnd
62 minFoldToBeShortBranch = $first_assembly_iter_param.minFoldToBeShortBranch
63 minReadsCountToHave0Flow = $first_assembly_iter_param.minReadsCountToHave0Flow
64 minEdgeLengthToHave0Flow = $first_assembly_iter_param.minEdgeLengthToHave0Flow
65 minReadsCountInEdgeToBe1MinFlow = $first_assembly_iter_param.minReadsCountInEdgeToBe1MinFlow
66 minEdgeLengthToBe1MinFlow = $first_assembly_iter_param.minEdgeLengthToBe1MinFlow
67 ]]></configfile>
68 <configfile name="second_assembly_iteration_params">
69 <![CDATA[
70 MinOverlap4BuildGraph = $MinOverlap4BuildGraph
71 PrintContigs = true
72 PrintScaffolds = true
73 PrintUnused = $PrintUnused
74 PrintGFA = $PrintGFA
75 PrintGFA2 = $PrintGFA2
76 minSequenceLengthTobePrinted = $second_assembly_iter_param.minSequenceLengthTobePrinted
77 MinOverlap4SimplifyGraph = $second_assembly_iter_param.MinOverlap4SimplifyGraph
78 minOverlapDifference4ClipBranches = $second_assembly_iter_param.minOverlapDifference4ClipBranches
79 minUniquePEsupport = $second_assembly_iter_param.minUniquePEsupport
80 minNonUniquePEsupport = $second_assembly_iter_param.minNonUniquePEsupport
81 minReadsCountInEdgeToBeNotDeadEnd = $second_assembly_iter_param.minReadsCountInEdgeToBeNotDeadEnd
82 minEdgeLengthToBeNotDeadEnd = $second_assembly_iter_param.minEdgeLengthToBeNotDeadEnd
83 minFoldToBeShortBranch = $second_assembly_iter_param.minFoldToBeShortBranch
84 minReadsCountToHave0Flow = $second_assembly_iter_param.minReadsCountToHave0Flow
85 minEdgeLengthToHave0Flow = $second_assembly_iter_param.minEdgeLengthToHave0Flow
86 minReadsCountInEdgeToBe1MinFlow = $second_assembly_iter_param.minReadsCountInEdgeToBe1MinFlow
87 minEdgeLengthToBe1MinFlow = $second_assembly_iter_param.minEdgeLengthToBe1MinFlow
88 ]]></configfile>
89 <configfile name="third_assembly_iteration_params">
90 <![CDATA[
91 MinOverlap4BuildGraph = $MinOverlap4BuildGraph
92 PrintContigs = true
93 PrintScaffolds = true
94 PrintUnused = $PrintUnused
95 PrintGFA = $PrintGFA
96 PrintGFA2 = $PrintGFA2
97 minSequenceLengthTobePrinted = $third_assembly_iter_param.minSequenceLengthTobePrinted
98 MinOverlap4SimplifyGraph = $third_assembly_iter_param.MinOverlap4SimplifyGraph
99 minOverlapDifference4ClipBranches = $third_assembly_iter_param.minOverlapDifference4ClipBranches
100 minUniquePEsupport = $third_assembly_iter_param.minUniquePEsupport
101 minNonUniquePEsupport = $third_assembly_iter_param.minNonUniquePEsupport
102 minReadsCountInEdgeToBeNotDeadEnd = $third_assembly_iter_param.minReadsCountInEdgeToBeNotDeadEnd
103 minEdgeLengthToBeNotDeadEnd = $third_assembly_iter_param.minEdgeLengthToBeNotDeadEnd
104 minFoldToBeShortBranch = $third_assembly_iter_param.minFoldToBeShortBranch
105 minReadsCountToHave0Flow = $third_assembly_iter_param.minReadsCountToHave0Flow
106 minEdgeLengthToHave0Flow = $third_assembly_iter_param.minEdgeLengthToHave0Flow
107 minReadsCountInEdgeToBe1MinFlow = $third_assembly_iter_param.minReadsCountInEdgeToBe1MinFlow
108 minEdgeLengthToBe1MinFlow = $third_assembly_iter_param.minEdgeLengthToBe1MinFlow
109 ]]></configfile>
110 </configfiles>
111 <inputs>
112 <conditional name="input">
113 <param name="library_type" type="select" label="Type of library?">
114 <option value="single">Single-end reads</option>
115 <option value="paired">Paired-end reads</option>
116 </param>
117 <when value="single">
118 <param argument="-inS" type="data" format="fastq,fasta" multiple="true" label="Single-read files"/>
119 </when>
120 <when value="paired">
121 <conditional name="paired_input">
122 <param name="type" type="select" label="Type of library?">
123 <option value="separated">Separated forward/reverse paired-read files</option>
124 <option value="interleaved">Interleaved paired-read files</option>
125 </param>
126 <when value="separated">
127 <param argument="-in1" type="data" format="fastq,fasta" label="Forward read file" />
128 <param argument="-in2" type="data" format="fastq,fasta" label="Reverse read file" />
129 </when>
130 <when value="interleaved">
131 <param argument="-inP" type="data" format="fastq,fasta" multiple="true" label="Interleaved paired-read files" />
132 </when>
133 </conditional>
134 </when>
135 </conditional>
136 <param argument="-obg" type="boolean" truevalue="-obg" falsevalue="" checked="false" label="Only build overlap graph?"/>
137 <param argument="-osg" type="boolean" truevalue="-osg" falsevalue="" checked="false" label="Only simplify existing overlap graph?"/>
138 <param argument="MinOverlap4BuildGraph" type="integer" min="0" value="20" label="Minimum overlap length (bp) required to insert an edge between two reads during graph construction" help="Increase this to reduce N50 and mis-assemblies"/>
139 <param name="log" type="boolean" truevalue="true" falsevalue="false" checked="false" label="Output log file?"/>
140 <param argument="PrintScaffolds" type="boolean" truevalue="true" falsevalue="false" label="Print scaffolds?"/> <!-- NOTE(review): this value is not referenced by the command, the configfiles or any output filter in this file; each configfile writes "PrintScaffolds = true" unconditionally. Confirm whether the option is meant to have an effect. -->
141 <param argument="PrintUnused" type="boolean" truevalue="true" falsevalue="false" label="Print unused reads?"/>
142 <param argument="PrintGFA" type="boolean" truevalue="true" falsevalue="false" label="Print GFA graph format?"/>
143 <param argument="PrintGFA2" type="boolean" truevalue="true" falsevalue="false" label="Print GFA2 graph format?"/>
144 <section name="first_assembly_iter_param" title="Parameters for 1st assembly iteration" expanded="False">
145 <expand macro="assembly_params"/>
146 </section>
147 <section name="second_assembly_iter_param" title="Parameters for 2nd assembly iteration" expanded="False">
148 <expand macro="assembly_params"/>
149 </section>
150 <section name="third_assembly_iter_param" title="Parameters for 3rd assembly iteration" expanded="False">
151 <expand macro="assembly_params"/>
152 </section>
153 </inputs>
154 <outputs>
155 <data format="txt" name="log" from_work_dir="disco.log" label="${tool.name} on ${on_string}: Log file">
156 <filter>log</filter>
157 </data>
158 <data format="fasta" name="contigs" from_work_dir="disco_contigsFinalCombined.fasta" label="${tool.name} on ${on_string}: Contigs"/>
159 <data format="fasta" name="scaffolds" from_work_dir="disco_scaffoldsFinalCombined.fasta" label="${tool.name} on ${on_string}: Scaffolds"/>
160 <collection name="unused_reads" type="list" label="${tool.name} on ${on_string}: Unused reads">
161 <filter>PrintUnused</filter>
162 <discover_datasets pattern="disco_0_Unused(?P&lt;designation&gt;.+)\.fasta" format="fasta" directory="assembly" />
163 </collection>
164 <collection name="gfa_graphs" type="list" label="${tool.name} on ${on_string}: GFA graph"> <!-- Collects disco_Graph_*.gfa files from the assembly directory when PrintGFA is enabled. The pattern ends with $ so that disco_Graph_*.gfa2 files in the same directory are not prefix-matched into this collection as well. -->
165 <filter>PrintGFA</filter>
166 <discover_datasets pattern="disco_Graph_(?P&lt;designation&gt;.+)\.gfa$" format="txt" directory="assembly" />
167 </collection>
168 <collection name="gfa2_graphs" type="list" label="${tool.name} on ${on_string}: GFA2 graph">
169 <filter>PrintGFA2</filter>
170 <discover_datasets pattern="disco_Graph_(?P&lt;designation&gt;.+)\.gfa2" format="txt" directory="assembly" />
171 </collection>
172 </outputs>
173 <tests>
174 <test>
175 <conditional name="input">
176 <param name="library_type" value="paired"/>
177 <conditional name="paired_input">
178 <param name="type" value="separated"/>
179 <param name="in1" value="ecoli_1K_1.fq"/>
180 <param name="in2" value="ecoli_1K_2.fq"/>
181 </conditional>
182 </conditional>
183 <param name="obg" value=""/>
184 <param name="osg" value=""/>
185 <param name="MinOverlap4BuildGraph" value="20"/>
186 <param name="log" value="true"/>
187 <param name="PrintUnused" value="true"/>
188 <param name="PrintGFA" value="true"/>
189 <param name="PrintGFA2" value="true"/>
190 <section name="first_assembly_iter_param">
191 <param name="minSequenceLengthTobePrinted" value="1000"/>
192 <param name="MinOverlap4SimplifyGraph" value="30"/>
193 <param name="minOverlapDifference4ClipBranches" value="25"/>
194 <param name="minUniquePEsupport" value="3"/>
195 <param name="minNonUniquePEsupport" value="0"/>
196 <param name="minReadsCountInEdgeToBeNotDeadEnd" value="10"/>
197 <param name="minEdgeLengthToBeNotDeadEnd" value="1000"/>
198 <param name="minFoldToBeShortBranch" value="5"/>
199 <param name="minReadsCountToHave0Flow" value="15"/>
200 <param name="minEdgeLengthToHave0Flow" value="1500"/>
201 <param name="minReadsCountInEdgeToBe1MinFlow" value="20"/>
202 <param name="minEdgeLengthToBe1MinFlow" value="2000"/>
203 </section>
204 <section name="second_assembly_iter_param">
205 <param name="minSequenceLengthTobePrinted" value="1000"/>
206 <param name="MinOverlap4SimplifyGraph" value="30"/>
207 <param name="minOverlapDifference4ClipBranches" value="25"/>
208 <param name="minUniquePEsupport" value="3"/>
209 <param name="minNonUniquePEsupport" value="0"/>
210 <param name="minReadsCountInEdgeToBeNotDeadEnd" value="10"/>
211 <param name="minEdgeLengthToBeNotDeadEnd" value="1000"/>
212 <param name="minFoldToBeShortBranch" value="5"/>
213 <param name="minReadsCountToHave0Flow" value="15"/>
214 <param name="minEdgeLengthToHave0Flow" value="1500"/>
215 <param name="minReadsCountInEdgeToBe1MinFlow" value="20"/>
216 <param name="minEdgeLengthToBe1MinFlow" value="2000"/>
217 </section>
218 <section name="third_assembly_iter_param">
219 <param name="minSequenceLengthTobePrinted" value="1000"/>
220 <param name="MinOverlap4SimplifyGraph" value="30"/>
221 <param name="minOverlapDifference4ClipBranches" value="25"/>
222 <param name="minUniquePEsupport" value="3"/>
223 <param name="minNonUniquePEsupport" value="0"/>
224 <param name="minReadsCountInEdgeToBeNotDeadEnd" value="10"/>
225 <param name="minEdgeLengthToBeNotDeadEnd" value="1000"/>
226 <param name="minFoldToBeShortBranch" value="5"/>
227 <param name="minReadsCountToHave0Flow" value="15"/>
228 <param name="minEdgeLengthToHave0Flow" value="1500"/>
229 <param name="minReadsCountInEdgeToBe1MinFlow" value="20"/>
230 <param name="minEdgeLengthToBe1MinFlow" value="2000"/>
231 </section>
232 <output name="log">
233 <assert_contents>
234 <has_text text="Software: Disco Assembler" />
235 <has_text text="FIRST LOOP ITERATION 1" />
236 <has_text text="2054 reads streamed from this read file" />
237 <has_text text="Graph simplification" />
238 </assert_contents>
239 </output>
240 <output name="contigs" value="test1_contigs.fasta" compare="sim_size" delta="5"/>
241 <output name="scaffolds" value="test1_scaffolds.fasta" compare="sim_size" delta="5"/>
242 <output_collection name="unused_reads" type="list">
243 <element name="PairedReads1">
244 <assert_contents>
245 <has_text text="EAS20_8_6_1_9_1972/1" />
246 <has_text text="EAS20_8_6_10_415_709/1" />
247 <has_text text="EAS20_8_6_36_1124_470/1" />
248 <has_text text="EAS20_8_6_100_1637_1332/1" />
249 </assert_contents>
250 </element>
251 <element name="PairedReads2">
252 <assert_contents>
253 <has_text text="EAS20_8_6_1_9_1972/2" />
254 <has_text text="EAS20_8_6_10_415_709/2" />
255 <has_text text="EAS20_8_6_36_1124_470/2" />
256 <has_text text="EAS20_8_6_100_1637_1332/2" />
257 </assert_contents>
258 </element>
259 </output_collection>
260 <output_collection name="gfa_graphs" type="list">
261 <element name="1" file="test1_graph_1.gfa" compare="sim_size" delta="6000"/>
262 </output_collection>
263 <output_collection name="gfa2_graphs" type="list">
264 <element name="1" file="test1_graph_1.gfa2" compare="sim_size" delta="6000"/>
265 </output_collection>
266 </test>
267 <test>
268 <conditional name="input">
269 <param name="library_type" value="paired"/>
270 <conditional name="paired_input">
271 <param name="type" value="interleaved"/>
272 <param name="inP" value="ecoli_1K_interleaved.fq,ecoli_1K_interleaved.fq"/>
273 </conditional>
274 </conditional>
275 <param name="obg" value=""/>
276 <param name="osg" value=""/>
277 <param name="MinOverlap4BuildGraph" value="20"/>
278 <param name="log" value="true"/>
279 <param name="PrintUnused" value="false"/>
280 <param name="PrintGFA" value="false"/>
281 <param name="PrintGFA2" value="false"/>
282 <section name="first_assembly_iter_param">
283 <param name="minSequenceLengthTobePrinted" value="1000"/>
284 <param name="MinOverlap4SimplifyGraph" value="30"/>
285 <param name="minOverlapDifference4ClipBranches" value="25"/>
286 <param name="minUniquePEsupport" value="3"/>
287 <param name="minNonUniquePEsupport" value="0"/>
288 <param name="minReadsCountInEdgeToBeNotDeadEnd" value="10"/>
289 <param name="minEdgeLengthToBeNotDeadEnd" value="1000"/>
290 <param name="minFoldToBeShortBranch" value="5"/>
291 <param name="minReadsCountToHave0Flow" value="15"/>
292 <param name="minEdgeLengthToHave0Flow" value="1500"/>
293 <param name="minReadsCountInEdgeToBe1MinFlow" value="20"/>
294 <param name="minEdgeLengthToBe1MinFlow" value="2000"/>
295 </section>
296 <section name="second_assembly_iter_param">
297 <param name="minSequenceLengthTobePrinted" value="1000"/>
298 <param name="MinOverlap4SimplifyGraph" value="30"/>
299 <param name="minOverlapDifference4ClipBranches" value="25"/>
300 <param name="minUniquePEsupport" value="3"/>
301 <param name="minNonUniquePEsupport" value="0"/>
302 <param name="minReadsCountInEdgeToBeNotDeadEnd" value="10"/>
303 <param name="minEdgeLengthToBeNotDeadEnd" value="1000"/>
304 <param name="minFoldToBeShortBranch" value="5"/>
305 <param name="minReadsCountToHave0Flow" value="15"/>
306 <param name="minEdgeLengthToHave0Flow" value="1500"/>
307 <param name="minReadsCountInEdgeToBe1MinFlow" value="20"/>
308 <param name="minEdgeLengthToBe1MinFlow" value="2000"/>
309 </section>
310 <section name="third_assembly_iter_param">
311 <param name="minSequenceLengthTobePrinted" value="1000"/>
312 <param name="MinOverlap4SimplifyGraph" value="30"/>
313 <param name="minOverlapDifference4ClipBranches" value="25"/>
314 <param name="minUniquePEsupport" value="3"/>
315 <param name="minNonUniquePEsupport" value="0"/>
316 <param name="minReadsCountInEdgeToBeNotDeadEnd" value="10"/>
317 <param name="minEdgeLengthToBeNotDeadEnd" value="1000"/>
318 <param name="minFoldToBeShortBranch" value="5"/>
319 <param name="minReadsCountToHave0Flow" value="15"/>
320 <param name="minEdgeLengthToHave0Flow" value="1500"/>
321 <param name="minReadsCountInEdgeToBe1MinFlow" value="20"/>
322 <param name="minEdgeLengthToBe1MinFlow" value="2000"/>
323 </section>
324 <output name="log">
325 <assert_contents>
326 <has_text text="Software: Disco Assembler" />
327 <has_text text="FIRST LOOP ITERATION 1" />
328 <has_text text="4108 reads streamed from this read file" />
329 <has_text text="Graph simplification" />
330 </assert_contents>
331 </output>
332 <output name="contigs" value="test2_contigs.fasta" compare="sim_size" delta="5"/>
333 <output name="scaffolds" value="test2_scaffolds.fasta" compare="sim_size" delta="5"/>
334 </test>
335 <test>
336 <conditional name="input">
337 <param name="library_type" value="single"/>
338 <param name="inS" value="ecoli_1K_1.fq"/>
339 </conditional>
340 <param name="obg" value=""/>
341 <param name="osg" value=""/>
342 <param name="MinOverlap4BuildGraph" value="20"/>
343 <param name="log" value="false"/>
344 <param name="PrintUnused" value="false"/>
345 <param name="PrintGFA" value="false"/>
346 <param name="PrintGFA2" value="false"/>
347 <section name="first_assembly_iter_param">
348 <param name="minSequenceLengthTobePrinted" value="1000"/>
349 <param name="MinOverlap4SimplifyGraph" value="30"/>
350 <param name="minOverlapDifference4ClipBranches" value="25"/>
351 <param name="minUniquePEsupport" value="3"/>
352 <param name="minNonUniquePEsupport" value="0"/>
353 <param name="minReadsCountInEdgeToBeNotDeadEnd" value="10"/>
354 <param name="minEdgeLengthToBeNotDeadEnd" value="1000"/>
355 <param name="minFoldToBeShortBranch" value="5"/>
356 <param name="minReadsCountToHave0Flow" value="15"/>
357 <param name="minEdgeLengthToHave0Flow" value="1500"/>
358 <param name="minReadsCountInEdgeToBe1MinFlow" value="20"/>
359 <param name="minEdgeLengthToBe1MinFlow" value="2000"/>
360 </section>
361 <section name="second_assembly_iter_param">
362 <param name="minSequenceLengthTobePrinted" value="1000"/>
363 <param name="MinOverlap4SimplifyGraph" value="30"/>
364 <param name="minOverlapDifference4ClipBranches" value="25"/>
365 <param name="minUniquePEsupport" value="3"/>
366 <param name="minNonUniquePEsupport" value="0"/>
367 <param name="minReadsCountInEdgeToBeNotDeadEnd" value="10"/>
368 <param name="minEdgeLengthToBeNotDeadEnd" value="1000"/>
369 <param name="minFoldToBeShortBranch" value="5"/>
370 <param name="minReadsCountToHave0Flow" value="15"/>
371 <param name="minEdgeLengthToHave0Flow" value="1500"/>
372 <param name="minReadsCountInEdgeToBe1MinFlow" value="20"/>
373 <param name="minEdgeLengthToBe1MinFlow" value="2000"/>
374 </section>
375 <section name="third_assembly_iter_param">
376 <param name="minSequenceLengthTobePrinted" value="1000"/>
377 <param name="MinOverlap4SimplifyGraph" value="30"/>
378 <param name="minOverlapDifference4ClipBranches" value="25"/>
379 <param name="minUniquePEsupport" value="3"/>
380 <param name="minNonUniquePEsupport" value="0"/>
381 <param name="minReadsCountInEdgeToBeNotDeadEnd" value="10"/>
382 <param name="minEdgeLengthToBeNotDeadEnd" value="1000"/>
383 <param name="minFoldToBeShortBranch" value="5"/>
384 <param name="minReadsCountToHave0Flow" value="15"/>
385 <param name="minEdgeLengthToHave0Flow" value="1500"/>
386 <param name="minReadsCountInEdgeToBe1MinFlow" value="20"/>
387 <param name="minEdgeLengthToBe1MinFlow" value="2000"/>
388 </section>
389 <output name="contigs" value="test3_contigs.fasta" compare="sim_size" delta="5"/>
390 <output name="scaffolds" value="test3_scaffolds.fasta" compare="sim_size" delta="5"/>
391 </test>
392 </tests>
393 <help><![CDATA[
394 DISCO is a multi-threaded, multi-process, distributed-memory overlap-layout-consensus (OLC) metagenome assembler. Disco was developed as a scalable assembler to assemble large metagenomes from billions of Illumina sequencing reads of complex microbial communities. Disco was parallelized for computer clusters in a hybrid architecture that integrated shared-memory multi-threading, point-to-point message passing, and remote direct memory access. The assembly and scaffolding were performed using an iterative overlap graph approach.
395
396 The detailed user manual of the assembler and how to use it to achieve best results is provided here: http://disco.omicsbio.org/user-manual. This is a quick start guide generally for developers and testers. Users with limited experience with genome assembly are advised to use the user manual.
397 ]]></help>
398 <citations>
399 </citations>
400 </tool>