Mercurial > repos > iuc > breseq
comparison breseq.xml @ 0:a7735dbd58ee draft
"planemo upload commit fadaff2d55736bf8c580541d6089c83cd4106a1f"
| author | iuc |
|---|---|
| date | Thu, 31 Oct 2019 19:40:15 -0400 |
| parents | |
| children | 256cd7d32d15 |
comparison
equal
deleted
inserted
replaced
| -1:000000000000 | 0:a7735dbd58ee |
|---|---|
| 1 <tool id="breseq" name="breseq" version="@PACKAGE_VERSION@+@GALAXY_VERSION@"> | |
| 2 | |
| 3 <description>find mutations in haploid microbial genomes</description> | |
| 4 | |
| 5 <macros> | |
| 6 <import>macros.xml</import> | |
| 7 </macros> | |
| 8 | |
| 9 <requirements> | |
| 10 <requirement type="package" version="0.34.0">breseq</requirement> | |
| 11 </requirements> | |
| 12 | |
| 13 <version_command>breseq --version</version_command> | |
| 14 | |
| 15 <command detect_errors="aggressive"> | |
| 16 <![CDATA[ | |
| 17 #set $ref_opts = "" | |
| 18 #for $i, $r in enumerate( $references ): | |
| 19 #if str($references[$i].reference.source) == "history": | |
| 20 #for $ref in $references[$i].reference.own_genome: | |
| 21 #if $ref | |
| 22 #set $ref_opts = $ref_opts + " --reference '" + str($ref) + "'" | |
| 23 #end if | |
| 24 #end for | |
| 25 #else: | |
| 26 #set $ref_opts = $ref_opts + " --reference '" + $references[$i].reference.fixed_genome.fields.path + "'" | |
| 27 #end if | |
| 28 #end for | |
| 29 | |
| 30 #if str($run.mode) == 'detect' | |
| 31 breseq | |
| 32 | |
| 33 --num-processors \${GALAXY_SLOTS:-4} | |
| 34 | |
| 35 -o results | |
| 36 | |
| 37 $ref_opts | |
| 38 | |
| 39 #for $s in $run.fastqs: | |
| 40 ${s} | |
| 41 #end for | |
| 42 | |
| 43 #if $run.name | |
| 44 --name '$run.name' | |
| 45 #end if | |
| 46 | |
| 47 $run.polymorphism_prediction | |
| 48 $run.predict_junctions | |
| 49 | |
| 50 #if 'gd' in str($run.output_options.formats).split(','): | |
| 51 && cp results/output/output.gd '$output' | |
| 52 #end if | |
| 53 | |
| 54 #if 'html' in str($run.output_options.formats).split(','): | |
| 55 && cp results/output/index.html '$report' | |
| 56 && mkdir $report.extra_files_path | |
| 57 && cp -R results/output/* $report.extra_files_path | |
| 58 #end if | |
| 59 | |
| 60 #if 'zip' in str($run.output_options.formats).split(','): | |
| 61 && tar -zcf '$zip_output' results | |
| 62 #end if | |
| 63 | |
| 64 #if 'log' in str($run.output_options.formats).split(','): | |
| 65 && cp results/output/log.txt '$log' | |
| 66 #end if | |
| 67 #else | |
| 68 #set $first = 1 | |
| 69 #for $o in str($run.output_options.formats).split(','): | |
| 70 | |
| 71 #if $first == 0 | |
| 72 && | |
| 73 #end if | |
| 74 #set $first = 0 | |
| 75 | |
| 76 gdtools ANNOTATE | |
| 77 | |
| 78 --format '$o' | |
| 79 | |
| 80 -o | |
| 81 #if $o == 'html': | |
| 82 '$annreport' | |
| 83 #else if $o == 'gd': | |
| 84 '$genomediff' | |
| 85 #else if $o == 'tsv': | |
| 86 '$tabdelim' | |
| 87 #else if $o == 'phylip': | |
| 88 '$phylipout' | |
| 89 #else if $o == 'json': | |
| 90 '$jsonout' | |
| 91 #end if | |
| 92 | |
| 93 $ref_opts | |
| 94 | |
| 95 #for $s in $run.gds: | |
| 96 ${s} | |
| 97 #end for | |
| 98 #end for | |
| 99 #end if | |
| 100 ]]> | |
| 101 </command> | |
| 102 | |
| 103 <inputs> | |
| 104 <repeat name="references" title="Reference Genome" min="1"> | |
| 105 <conditional name="reference"> | |
| 106 <param name="source" type="select" label="Reference source" > | |
| 107 <option value="builtin">built-in</option> | |
| 108 <option value="history" selected="true">history</option> | |
| 109 </param> | |
| 110 <when value="builtin"> | |
| 111 <param name="fixed_genome" argument="--reference" type="select" optional="false" label="Galaxy Built-in Reference(s)"> | |
| 112 <options from_data_table="genbank_files"> | |
| 113 <filter type="sort_by" column="3"/> | |
| 114 <validator type="no_options" message="No built-in genbank records have been configured"/> | |
| 115 </options> | |
| 116 </param> | |
| 117 </when> | |
| 118 <when value="history"> | |
| 119 <param name="own_genome" argument="--reference" type="data" format="fasta,genbank" multiple="true" optional="false" label="Fasta or Genbank Reference(s)" /> | |
| 120 </when> | |
| 121 </conditional> | |
| 122 </repeat> | |
| 123 | |
| 124 <conditional name="run"> | |
| 125 <param name="mode" type="select" label="Run Mode" help="Detect, annotate, or compare variants."> | |
| 126 <option value="detect" selected="true">Detect</option> | |
| 127 <option value="annotate">Annotate</option> | |
| 128 <option value="compare">Compare</option> | |
| 129 </param> | |
| 130 <when value="detect"> | |
| 131 | |
| 132 <param name="fastqs" type="data" format="fastq" multiple="true" label="Fastq Read Files" /> | |
| 133 | |
| 134 <param argument="--polymorphism-prediction" name="polymorphism_prediction" type="select" label="Detection Mode" help="**Polymorphism mode**: Detect variants with frequencies between 0% and 100% if a mixture model is well-supported by the read alignment evidence. Use to analyze a mixed population of genomes evolved from a common ancestor. **Consensus mode**: Detect variants present in 100% of the sample. Use when re-sequencing a clonal haploid genome. This mode is the default."> | |
| 135 <option value="" selected="true">Consensus</option> | |
| 136 <option value="--polymorphism-prediction">Polymorphism</option> | |
| 137 </param> | |
| 138 | |
| 139 <param name="name" argument="--name" type="text" value="" label="Analysis Name" help="Human-readable name of the analysis run for output (DEFAULT=none)." /> | |
| 140 | |
| 141 <param name="predict_junctions" type="boolean" truevalue="" falsevalue="--no-junction-prediction" checked="true" label="Predict Junctions" help="Predict new sequence junctions (default). --no-junction-prediction is supplied if 'No' is selected. Otherwise, there is no flag." /> | |
| 142 | |
| 143 <section name="output_options" title="Output Options" expanded="false"> | |
| 144 <param name="formats" type="select" multiple="true" optional="false" display="checkboxes" label="Output Formats"> | |
| 145 <option value="gd" selected="true">Variants (GenomeDiff)</option> | |
| 146 <option value="html">Variant Report (Webpage)</option> | |
| 147 <option value="zip">All Variant Results (Gzip)</option> | |
| 148 <option value="log">Log (Text)</option> | |
| 149 </param> | |
| 150 </section> | |
| 151 | |
| 152 </when> | |
| 153 <when value="annotate"> | |
| 154 | |
| 155 <param name="gds" type="data" format="tabular" multiple="true" optional="false" label="GenomeDiff (gd) Files" help="Files as produced by breseq" /> | |
| 156 | |
| 157 <expand macro="annotate_format_opts"> | |
| 158 <option value="gd" selected="true">Annotated Variants (GenomeDiff)</option> | |
| 159 </expand> | |
| 160 | |
| 161 </when> | |
| 162 <when value="compare"> | |
| 163 | |
| 164 <param name="gds" type="data" format="tabular" multiple="true" optional="false" label="GenomeDiff (gd) Files" help="Files as produced by breseq" min="2" /> | |
| 165 | |
| 166 <expand macro="annotate_format_opts"> | |
| 167 <option value="phylip" selected="true">Variant Comparison (Phylip)</option> | |
| 168 <option value="gd">Annotated Variants (GenomeDiff)</option> | |
| 169 </expand> | |
| 170 | |
| 171 </when> | |
| 172 </conditional> | |
| 173 | |
| 174 </inputs> | |
| 175 | |
| 176 <outputs> | |
| 177 <data format="html" name="report" label="${tool.name} on ${on_string}: Variants (Webpage)"> | |
| 178 <filter>run['mode'] == 'detect' and 'html' in run['output_options']['formats']</filter> | |
| 179 </data> | |
| 180 <data format="html" name="annreport" label="${tool.name} on ${on_string}: Annotated Variants Report (Webpage)"> | |
| 181 <filter>run['mode'] != 'detect' and 'html' in run['output_options']['formats']</filter> | |
| 182 </data> | |
| 183 | |
| 184 <data format="tabular" name="output" label="${tool.name} on ${on_string}: Variants (GenomeDiff)"> | |
| 185 <filter>run['mode'] == 'detect' and 'gd' in run['output_options']['formats']</filter> | |
| 186 </data> | |
| 187 <data format="tabular" name="genomediff" label="${tool.name} on ${on_string}: Annotated Variants (GenomeDiff)"> | |
| 188 <filter>run['mode'] != 'detect' and 'gd' in run['output_options']['formats']</filter> | |
| 189 </data> | |
| 190 | |
| 191 <data format="zip" name="zip_output" label="${tool.name} on ${on_string}: All Variant Results (Gzip)"> | |
| 192 <filter>'zip' in run['output_options']['formats']</filter> | |
| 193 </data> | |
| 194 <data format="txt" name="log" label="${tool.name} on ${on_string}: Breseq Log"> | |
| 195 <filter>'log' in run['output_options']['formats']</filter> | |
| 196 </data> | |
| 197 <data format="tabular" name="tabdelim" label="${tool.name} on ${on_string}: Annotated Variants (Tabular)"> | |
| 198 <filter>'tsv' in run['output_options']['formats']</filter> | |
| 199 </data> | |
| 200 <data format="phylip" name="phylipout" label="${tool.name} on ${on_string}: Variant Comparison (Phylip)"> | |
| 201 <filter>'phylip' in run['output_options']['formats']</filter> | |
| 202 </data> | |
| 203 <data format="txt" name="jsonout" label="${tool.name} on ${on_string}: Annotated Variants (JSON)"> | |
| 204 <filter>'json' in run['output_options']['formats']</filter> | |
| 205 </data> | |
| 206 </outputs> | |
| 207 | |
| 208 <tests> | |
| 209 <test> | |
| 210 <repeat name="references"> | |
| 211 <conditional name="reference"> | |
| 212 <param name="source" value="history" /> | |
| 213 <param name="own_genome" value="lambda.gbk" /> | |
| 214 </conditional> | |
| 215 </repeat> | |
| 216 <conditional name="run"> | |
| 217 <param name="mode" value="detect" /> | |
| 218 <param name="fastqs" value="lambda.short_sequence_repeats.fastq" /> | |
| 219 <param name="polymorphism_prediction" value="" /> | |
| 220 <param name="name" value="smallest" /> | |
| 221 <param name="predict_junctions" value="" /> | |
| 222 <section name="output_options"> | |
| 223 <param name="formats" value="html,log,gd,zip" /> | |
| 224 </section> | |
| 225 </conditional> | |
| 226 | |
| 227 <output name="report" file="report.html" compare="sim_size" delta="100" /> | |
| 228 <output name="log" file="log.txt" lines_diff="4"> | |
| 229 <assert_contents> | |
| 230 <has_text text="breseq --num-processors" /> | |
| 231 </assert_contents> | |
| 232 </output> | |
| 233 <output name="output" file="gdout.txt" lines_diff="8" /> | |
| 234 <output name="zip_output"> | |
| 235 <assert_contents> | |
| 236 <has_archive_member path="results/output/output.gd" /> | |
| 237 </assert_contents> | |
| 238 </output> | |
| 239 </test> | |
| 240 <test> | |
| 241 <repeat name="references"> | |
| 242 <conditional name="reference"> | |
| 243 <param name="source" value="builtin" /> | |
| 244 <param name="fixed_genome" value="lambda1" /> | |
| 245 </conditional> | |
| 246 </repeat> | |
| 247 <conditional name="run"> | |
| 248 <param name="mode" value="detect" /> | |
| 249 <param name="fastqs" value="lambda.short_sequence_repeats.fastq" /> | |
| 250 <param name="polymorphism_prediction" value="" /> | |
| 251 <param name="name" value="smallest" /> | |
| 252 <param name="predict_junctions" value="" /> | |
| 253 <section name="output_options"> | |
| 254 <param name="formats" value="gd" /> | |
| 255 </section> | |
| 256 </conditional> | |
| 257 | |
| 258 <output name="output" file="gdout.txt" lines_diff="8" /> | |
| 259 </test> | |
| 260 <test> | |
| 261 <repeat name="references"> | |
| 262 <conditional name="reference"> | |
| 263 <param name="source" value="history" /> | |
| 264 <param name="own_genome" value="lambda.gbk" /> | |
| 265 </conditional> | |
| 266 </repeat> | |
| 267 <conditional name="run"> | |
| 268 <param name="mode" value="annotate" /> | |
| 269 <param name="gds" value="gdout.txt" /> | |
| 270 <section name="output_options"> | |
| 271 <param name="formats" value="html" /> | |
| 272 </section> | |
| 273 </conditional> | |
| 274 | |
| 275 <output name="annreport" file="gdtoolsout.html" compare="sim_size" delta="100" /> | |
| 276 </test> | |
| 277 </tests> | |
| 278 | |
| 279 <help> | |
| 280 <![CDATA[ | |
| 281 **Detect Variants** | |
| 282 | |
| 283 breseq (pronounced: \\brēz-ˈsēk\\ or breeze-seq) is a computational pipeline for | |
| 284 the analysis of short-read re-sequencing data (e.g. Illumina, 454, IonTorrent, | |
| 285 etc.). It uses reference-based alignment approaches to predict mutations in a | |
| 286 sample relative to an already sequenced genome. breseq is intended for microbial | |
| 287 genomes (<10 Mb) and re-sequenced samples that are only slightly diverged from | |
| 288 the reference sequence (<1 mutation per 1000 bp). | |
| 289 | |
| 290 breseq's primary advantages over other software programs are that it can: | |
| 291 | |
| 292 - Accurately predict new sequence junctions, such as those associated with mobile element insertions. | |
| 293 - Integrate multiple sources of evidence for genetic changes into mutation predictions. | |
| 294 - Produce annotated output describing biologically relevant mutational events. | |
| 295 | |
| 296 breseq was initially developed to analyze data from the Lenski long-term | |
| 297 evolution experiment with `E. coli`_. References: barrick2009a_ barrick2009b_. | |
| 298 | |
| 299 .. _`E. coli`: http://myxo.css.msu.edu/ecoli/ | |
| 300 .. _barrick2009a: http://barricklab.org/twiki/pub/Lab/ToolsBacterialGenomeResequencing/documentation/references.html#barrick2009a | |
| 301 .. _barrick2009b: http://barricklab.org/twiki/pub/Lab/ToolsBacterialGenomeResequencing/documentation/references.html#barrick2009b | |
| 302 | |
| 303 However, breseq may be generally useful to researchers who are: | |
| 304 | |
| 305 - Tracking mutations over time in microbial evolution experiments. | |
| 306 - Checking strains for unwanted second-site mutations after genetic manipulations. | |
| 307 - Identifying mutations that occur during strain improvement or after long-term culture of engineered strains. | |
| 308 - Discovering what mutations arise in pathogens during infection or cause antibiotic resistance. | |
| 309 | |
| 310 | |
| 311 *Inputs* | |
| 312 | |
| 313 Breseq accepts files in FASTQ format. It does not take pair-end information into | |
| 314 account. | |
| 315 | |
| 316 You can either run in clonal (consensus) mode or search for polymorphisms in a | |
| 317 population. | |
| 318 | |
| 319 You can also select an external sequence (eg. a transposon) to detect for | |
| 320 insertions or horizontal transfer. | |
| 321 | |
| 322 | |
| 323 *Outputs* | |
| 324 | |
| 325 Breseq outputs a number of files. These are all condensed in a single zipped | |
| 326 file. | |
| 327 | |
| 328 It contains output files with the final results, accessible through | |
| 329 ``output/index.html`` | |
| 330 | |
| 331 It also contains data files with accessory data, including: | |
| 332 | |
| 333 - ``data/reference.fasta`` (file with reference genome: can be used in eg. IGV browser) | |
| 334 - ``data/reference.gff`` (file with genomic annotations: can be used in eg. IGV browser) | |
| 335 - ``data/areference.bam`` (file with read alignments: can be used in eg. IGV browser) | |
| 336 - ``data/unmatched.*`` (files with read that failed to align: can be used to build an assembly or to eg. blast against NCBI) | |
| 337 | |
| 338 | |
| 339 ---- | |
| 340 | |
| 341 **Annotate Variants** | |
| 342 | |
| 343 Annotate a GenomeDiff file (generated by breseq) with information about | |
| 344 mutations (what genes they affect, amino acid substitutions, etc.) If multiple | |
| 345 input files are provided, then also COMPARE the frequencies for identical | |
| 346 mutations across samples. | |
| 347 ]]> | |
| 348 </help> | |
| 349 | |
| 350 <citations> | |
| 351 <citation type="doi">10.1007/978-1-4939-0554-6_12</citation> | |
| 352 </citations> | |
| 353 | |
| 354 </tool> |
