Mercurial > repos > pjbriggs > trimmomatic
annotate trimmomatic.xml @ 14:0fb869e9dee6 draft
Update to Trimmomatic 0.38.
| author | pjbriggs |
|---|---|
| date | Mon, 08 Jul 2019 06:07:07 -0400 |
| parents | 361f703e4094 |
| children | d300b1888cef |
| rev | line source |
|---|---|
| 14 | 1 <tool id="trimmomatic" name="Trimmomatic" version="0.38.0"> |
| 1 | 2 <description>flexible read trimming tool for Illumina NGS data</description> |
|
5
b0315888eb4d
Test for version which is compatible with conda dependency resolver.
pjbriggs
parents:
4
diff
changeset
|
3 <macros> |
|
b0315888eb4d
Test for version which is compatible with conda dependency resolver.
pjbriggs
parents:
4
diff
changeset
|
4 <import>trimmomatic_macros.xml</import> |
|
b0315888eb4d
Test for version which is compatible with conda dependency resolver.
pjbriggs
parents:
4
diff
changeset
|
5 </macros> |
|
3
a7139c612c45
Updated to version 0.32.3: add support for FASTQ pairs (dataset collections)
pjbriggs
parents:
2
diff
changeset
|
6 <requirements> |
| 14 | 7 <requirement type="package" version="0.38">trimmomatic</requirement> |
|
3
a7139c612c45
Updated to version 0.32.3: add support for FASTQ pairs (dataset collections)
pjbriggs
parents:
2
diff
changeset
|
8 </requirements> |
| 7 | 9 <command detect_errors="aggressive"><![CDATA[ |
|
5
b0315888eb4d
Test for version which is compatible with conda dependency resolver.
pjbriggs
parents:
4
diff
changeset
|
10 @CONDA_TRIMMOMATIC_JAR_PATH@ && |
|
b0315888eb4d
Test for version which is compatible with conda dependency resolver.
pjbriggs
parents:
4
diff
changeset
|
11 @CONDA_TRIMMOMATIC_ADAPTERS_PATH@ && |
| 7 | 12 #if $readtype.single_or_paired == "pair_of_files" |
| 13 #set r1_ext = $readtype.fastq_r1_in.extension | |
| 14 #set r2_ext = $readtype.fastq_r2_in.extension | |
| 15 ln -s '$readtype.fastq_r1_in' fastq_r1.'$r1_ext' && | |
| 16 ln -s '$readtype.fastq_r2_in' fastq_r2.'$r2_ext' && | |
| 17 #elif $readtype.single_or_paired == "collection" | |
| 18 #set r1_ext = $readtype.fastq_pair.forward.extension | |
| 19 #set r2_ext = $readtype.fastq_pair.reverse.extension | |
| 20 ln -s '$readtype.fastq_pair.forward' fastq_r1.'$r1_ext' && | |
| 21 ln -s '$readtype.fastq_pair.reverse' fastq_r2.'$r2_ext' && | |
| 22 #else | |
| 23 ln -s '$fastq_in' fastq_in.'$fastq_in.extension' && | |
| 24 #end if | |
| 25 java \${_JAVA_OPTIONS:--Xmx8G} -jar \$TRIMMOMATIC_JAR_PATH/trimmomatic.jar | |
| 26 #if $readtype.single_or_paired in ["pair_of_files","collection"] | |
| 12 | 27 PE -threads \${GALAXY_SLOTS:-6} |
| 7 | 28 fastq_r1.'$r1_ext' fastq_r2.'$r2_ext' |
| 29 fastq_out_r1_paired.'$r1_ext' fastq_out_r1_unpaired.'$r1_ext' | |
| 30 fastq_out_r2_paired.'$r2_ext' fastq_out_r2_unpaired.'$r2_ext' | |
| 1 | 31 #else |
| 12 | 32 SE -threads \${GALAXY_SLOTS:-6} fastq_in.'$fastq_in.extension' fastq_out.'$fastq_in.extension' |
| 1 | 33 #end if |
| 34 ## ILLUMINACLIP option | |
| 35 #if $illuminaclip.do_illuminaclip | |
| 9 | 36 #if $illuminaclip.adapter_type.standard_or_custom == "custom" |
| 37 #if $readtype.single_or_paired in ["pair_of_files","collection"] | |
| 38 ILLUMINACLIP:$adapter_file_from_text:$illuminaclip.seed_mismatches:$illuminaclip.palindrome_clip_threshold:$illuminaclip.simple_clip_threshold:$illuminaclip.min_adapter_len:$illuminaclip.keep_both_reads | |
| 39 #else | |
| 40 ILLUMINACLIP:$adapter_file_from_text:$illuminaclip.seed_mismatches:$illuminaclip.palindrome_clip_threshold:$illuminaclip.simple_clip_threshold | |
| 41 #end if | |
| 42 #else | |
| 43 #if $readtype.single_or_paired in ["pair_of_files","collection"] | |
| 44 ILLUMINACLIP:\$TRIMMOMATIC_ADAPTERS_PATH/$illuminaclip.adapter_type.adapter_fasta:$illuminaclip.seed_mismatches:$illuminaclip.palindrome_clip_threshold:$illuminaclip.simple_clip_threshold:$illuminaclip.min_adapter_len:$illuminaclip.keep_both_reads | |
| 45 #else | |
| 46 ILLUMINACLIP:\$TRIMMOMATIC_ADAPTERS_PATH/$illuminaclip.adapter_type.adapter_fasta:$illuminaclip.seed_mismatches:$illuminaclip.palindrome_clip_threshold:$illuminaclip.simple_clip_threshold | |
| 47 #end if | |
| 48 #end if | |
| 1 | 49 #end if |
| 50 ## Other operations | |
| 51 #for $op in $operations | |
| 52 ## SLIDINGWINDOW | |
| 53 #if str( $op.operation.name ) == "SLIDINGWINDOW" | |
| 54 SLIDINGWINDOW:$op.operation.window_size:$op.operation.required_quality | |
| 55 #end if | |
| 56 ## MINLEN:36 | |
| 57 #if str( $op.operation.name ) == "MINLEN" | |
| 58 MINLEN:$op.operation.minlen | |
| 59 #end if | |
| 60 #if str( $op.operation.name ) == "LEADING" | |
| 61 LEADING:$op.operation.leading | |
| 62 #end if | |
| 63 #if str( $op.operation.name ) == "TRAILING" | |
| 64 TRAILING:$op.operation.trailing | |
| 65 #end if | |
| 66 #if str( $op.operation.name ) == "CROP" | |
| 67 CROP:$op.operation.crop | |
| 68 #end if | |
| 69 #if str( $op.operation.name ) == "HEADCROP" | |
| 70 HEADCROP:$op.operation.headcrop | |
| 71 #end if | |
| 4 | 72 #if str( $op.operation.name ) == "AVGQUAL" |
| 73 AVGQUAL:$op.operation.avgqual | |
| 74 #end if | |
| 75 #if str( $op.operation.name ) == "MAXINFO" | |
| 76 MAXINFO:$op.operation.target_length:$op.operation.strictness | |
| 77 #end if | |
| 1 | 78 #end for |
| 12 | 79 #if $output_logs: |
| 80 -trimlog trimlog | |
| 81 #end if | |
|
5
b0315888eb4d
Test for version which is compatible with conda dependency resolver.
pjbriggs
parents:
4
diff
changeset
|
82 2>&1 | tee trimmomatic.log && |
|
b0315888eb4d
Test for version which is compatible with conda dependency resolver.
pjbriggs
parents:
4
diff
changeset
|
83 if [ -z "\$(tail -1 trimmomatic.log | grep "Completed successfully")" ]; then echo "Trimmomatic did not finish successfully" >&2 ; exit 1 ; fi |
| 7 | 84 && |
| 85 #if $readtype.single_or_paired == "pair_of_files" | |
| 86 mv fastq_out_r1_paired.'$r1_ext' '${fastq_out_r1_paired}' && | |
| 87 mv fastq_out_r1_unpaired.'$r1_ext' '${fastq_out_r1_unpaired}' && | |
| 88 mv fastq_out_r2_paired.'$r2_ext' '${fastq_out_r2_paired}' && | |
| 89 mv fastq_out_r2_unpaired.'$r2_ext' '${fastq_out_r2_unpaired}' | |
| 90 #elif $readtype.single_or_paired == "collection" | |
| 91 mv fastq_out_r1_paired.'$r1_ext' '${fastq_out_paired.forward}' && | |
| 92 mv fastq_out_r1_unpaired.'$r1_ext' '${fastq_out_unpaired.forward}' && | |
| 93 mv fastq_out_r2_paired.'$r2_ext' '${fastq_out_paired.reverse}' && | |
| 94 mv fastq_out_r2_unpaired.'$r2_ext' '${fastq_out_unpaired.reverse}' | |
| 95 #else | |
| 96 mv fastq_out.'$fastq_in.extension' '${fastq_out}' | |
| 97 #end if | |
|
3
a7139c612c45
Updated to version 0.32.3: add support for FASTQ pairs (dataset collections)
pjbriggs
parents:
2
diff
changeset
|
98 ]]></command> |
| 9 | 99 <configfiles> |
| 100 <configfile name="adapter_file_from_text">#set from_text_area = '' | |
| 101 #if str( $illuminaclip.do_illuminaclip ) == "yes" and str( $illuminaclip.adapter_type.standard_or_custom ) == "custom": | |
| 102 #set from_text_area = $illuminaclip.adapter_type.adapter_text | |
| 103 #end if | |
| 104 ${from_text_area}</configfile> | |
| 105 </configfiles> | |
| 106 | |
| 1 | 107 <inputs> |
| 7 | 108 <conditional name="readtype"> |
| 109 <param name="single_or_paired" type="select" label="Single-end or paired-end reads?"> | |
| 110 <option value="se" selected="true">Single-end</option> | |
| 111 <option value="pair_of_files">Paired-end (two separate input files)</option> | |
| 112 <option value="collection">Paired-end (as collection)</option> | |
| 113 </param> | |
| 114 <when value="se"> | |
| 12 | 115 <param name="fastq_in" type="data" format="fastqsanger,fastqsanger.gz,fastqillumina,fastqillumina.gz,fastqsolexa,fastqsolexa.gz" label="Input FASTQ file" /> |
| 1 | 116 </when> |
| 7 | 117 <when value="pair_of_files"> |
| 12 | 118 <param name="fastq_r1_in" type="data" format="fastqsanger,fastqsanger.gz,fastqillumina,fastqillumina.gz,fastqsolexa,fastqsolexa.gz" |
| 7 | 119 label="Input FASTQ file (R1/first of pair)" /> |
| 12 | 120 <param name="fastq_r2_in" type="data" format="fastqsanger,fastqsanger.gz,fastqillumina,fastqillumina.gz,fastqsolexa,fastqsolexa.gz" |
| 7 | 121 label="Input FASTQ file (R2/second of pair)" /> |
| 1 | 122 </when> |
| 7 | 123 <when value="collection"> |
| 12 | 124 <param name="fastq_pair" format="fastqsanger,fastqsanger.gz,fastqillumina,fastqillumina.gz,fastqsolexa,fastqsolexa.gz" type="data_collection" collection_type="paired" label="Select FASTQ dataset collection with R1/R2 pair" /> |
| 7 | 125 </when> |
| 1 | 126 </conditional> |
| 127 <conditional name="illuminaclip"> | |
| 7 | 128 <param name="do_illuminaclip" type="boolean" label="Perform initial ILLUMINACLIP step?" help="Cut adapter and other illumina-specific sequences from the read" truevalue="yes" falsevalue="no" checked="False" /> |
| 129 <when value="yes"> | |
| 9 | 130 <conditional name="adapter_type"> |
| 131 <param name="standard_or_custom" type="select" label="Select standard adapter sequences or provide custom?"> | |
| 132 <option value="standard" selected="true">Standard</option> | |
| 133 <option value="custom">Custom</option> | |
| 134 </param> | |
| 135 <when value="standard"> | |
| 136 <param name="adapter_fasta" type="select" label="Adapter sequences to use"> | |
| 137 <option value="TruSeq2-SE.fa">TruSeq2 (single-ended, for Illumina GAII)</option> | |
| 138 <option value="TruSeq3-SE.fa">TruSeq3 (single-ended, for MiSeq and HiSeq)</option> | |
| 139 <option value="TruSeq2-PE.fa">TruSeq2 (paired-ended, for Illumina GAII)</option> | |
| 140 <option value="TruSeq3-PE.fa">TruSeq3 (paired-ended, for MiSeq and HiSeq)</option> | |
| 141 <option value="TruSeq3-PE-2.fa">TruSeq3 (additional seqs) (paired-ended, for MiSeq and HiSeq)</option> | |
| 142 <option value="NexteraPE-PE.fa">Nextera (paired-ended)</option> | |
| 143 </param> | |
| 144 </when> | |
| 145 <when value="custom"> | |
| 146 <param name="adapter_text" type="text" area="True" size="10x30" value="" | |
| 147 label="Custom adapter sequences in fasta format" help="Write sequences in the fasta format."> | |
| 148 <sanitizer> | |
| 149 <valid initial="string.printable"></valid> | |
| 150 <mapping initial="none"/> | |
| 151 </sanitizer> | |
| 152 </param> | |
| 153 </when> | |
| 154 </conditional> | |
| 7 | 155 <param name="seed_mismatches" type="integer" label="Maximum mismatch count which will still allow a full match to be performed" value="2" /> |
| 156 <param name="palindrome_clip_threshold" type="integer" label="How accurate the match between the two 'adapter ligated' reads must be for PE palindrome read alignment" value="30" /> | |
| 157 <param name="simple_clip_threshold" type="integer" label="How accurate the match between any adapter etc. sequence must be against a read" value="10" /> | |
| 9 | 158 <param name="min_adapter_len" type="integer" label="Minimum length of adapter that needs to be detected (PE specific/palindrome mode)" value="8" /> |
| 159 <param name="keep_both_reads" type="boolean" label="Always keep both reads (PE specific/palindrome mode)?" truevalue="true" falsevalue="false" checked="true" | |
| 160 help="See help below"/> | |
| 7 | 161 </when> |
| 162 <when value="no" /> <!-- empty clause to satisfy planemo lint --> | |
| 1 | 163 </conditional> |
| 164 <repeat name="operations" title="Trimmomatic Operation" min="1"> | |
| 165 <conditional name="operation"> | |
| 7 | 166 <param name="name" type="select" label="Select Trimmomatic operation to perform"> |
| 167 <option selected="true" value="SLIDINGWINDOW">Sliding window trimming (SLIDINGWINDOW)</option> | |
| 168 <option value="MINLEN">Drop reads below a specified length (MINLEN)</option> | |
| 169 <option value="LEADING">Cut bases off the start of a read, if below a threshold quality (LEADING)</option> | |
| 170 <option value="TRAILING">Cut bases off the end of a read, if below a threshold quality (TRAILING)</option> | |
| 171 <option value="CROP">Cut the read to a specified length (CROP)</option> | |
| 172 <option value="HEADCROP">Cut the specified number of bases from the start of the read (HEADCROP)</option> | |
| 173 <option value="AVGQUAL">Drop reads with average quality lower than a specified level (AVGQUAL)</option> | |
| 174 <option value="MAXINFO">Trim reads adaptively, balancing read length and error rate to maximise the value of each read (MAXINFO)</option> | |
| 175 </param> | |
| 176 <when value="SLIDINGWINDOW"> | |
| 177 <param name="window_size" type="integer" label="Number of bases to average across" value="4" /> | |
| 178 <param name="required_quality" type="integer" label="Average quality required" value="20" /> | |
| 179 </when> | |
| 180 <when value="MINLEN"> | |
| 181 <param name="minlen" type="integer" label="Minimum length of reads to be kept" value="20" /> | |
| 182 </when> | |
| 183 <when value="LEADING"> | |
| 184 <param name="leading" type="integer" label="Minimum quality required to keep a base" value="3" help="Bases at the start of the read with quality below the threshold will be removed" /> | |
| 185 </when> | |
| 186 <when value="TRAILING"> | |
| 187 <param name="trailing" type="integer" label="Minimum quality required to keep a base" value="3" help="Bases at the end of the read with quality below the threshold will be removed" /> | |
| 188 </when> | |
| 189 <when value="CROP"> | |
| 190 <param name="crop" type="integer" label="Number of bases to keep from the start of the read" value="" /> | |
| 191 </when> | |
| 192 <when value="HEADCROP"> | |
| 193 <param name="headcrop" type="integer" label="Number of bases to remove from the start of the read" value="" /> | |
| 194 </when> | |
| 195 <when value="AVGQUAL"> | |
| 196 <param name="avgqual" type="integer" label="Minimum average quality required to keep a read" value="" /> | |
| 197 </when> | |
| 198 <when value="MAXINFO"> | |
| 199 <param name="target_length" type="integer" label="Target read length" value="" help="The read length which is likely to allow the location of the read within the target sequence to be determined." /> | |
| 200 <param name="strictness" type="float" label="Strictness" value="" help="Set between zero and one - specifies the balance between preserving read length versus removal of incorrect bases; low values (<0.2) favours longer reads, high values (>0.8) favours read correctness." /> | |
| 201 </when> | |
| 1 | 202 </conditional> |
| 203 </repeat> | |
| 12 | 204 <param name="output_logs" argument="-trimlog" type="boolean" label="Output trimlog file?" truevalue="yes" falsevalue="no" checked="False" /> |
| 205 <param name="output_err" type="boolean" label="Output trimmomatic log messages?" truevalue="yes" falsevalue="no" checked="False" help="these are the messages written to stderr (eg. for use in MultiQC)" /> | |
| 1 | 206 </inputs> |
| 207 <outputs> | |
| 7 | 208 <data name="fastq_out_r1_paired" label="${tool.name} on ${readtype.fastq_r1_in.name} (R1 paired)" format_source="fastq_r1_in"> |
| 209 <filter>readtype['single_or_paired'] == "pair_of_files"</filter> | |
| 1 | 210 </data> |
| 7 | 211 <data name="fastq_out_r2_paired" label="${tool.name} on ${readtype.fastq_r2_in.name} (R2 paired)" format_source="fastq_r2_in"> |
| 212 <filter>readtype['single_or_paired'] == "pair_of_files"</filter> | |
| 1 | 213 </data> |
| 7 | 214 <data name="fastq_out_r1_unpaired" label="${tool.name} on ${readtype.fastq_r1_in.name} (R1 unpaired)" format_source="fastq_r1_in"> |
| 215 <filter>readtype['single_or_paired'] == "pair_of_files"</filter> | |
| 1 | 216 </data> |
| 7 | 217 <data name="fastq_out_r2_unpaired" label="${tool.name} on ${readtype.fastq_r2_in.name} (R2 unpaired)" format_source="fastq_r2_in"> |
| 218 <filter>readtype['single_or_paired'] == "pair_of_files"</filter> | |
| 1 | 219 </data> |
| 7 | 220 <data name="fastq_out" label="${tool.name} on ${readtype.fastq_in.name}" format_source="fastq_in"> |
| 221 <filter>readtype['single_or_paired'] == 'se'</filter> | |
| 1 | 222 </data> |
|
8
a923b799c77c
Version 0.36.3: fix the naming of output collections to differentiate btwn paired/unpaired; document the _JAVA_OPTIONS env var (thanks Marius van den Beek).
pjbriggs
parents:
7
diff
changeset
|
223 <collection name="fastq_out_paired" type="paired" label="${tool.name} on ${on_string}: paired"> |
| 7 | 224 <filter>readtype['single_or_paired'] == "collection"</filter> |
| 225 <data name="forward" label="${tool.name} on ${readtype.fastq_pair.forward.name} (R1 paired)" format_source="fastq_pair['forward']"/> | |
| 226 <data name="reverse" label="${tool.name} on ${readtype.fastq_pair.reverse.name} (R2 paired)" format_source="fastq_pair['reverse']"/> | |
|
3
a7139c612c45
Updated to version 0.32.3: add support for FASTQ pairs (dataset collections)
pjbriggs
parents:
2
diff
changeset
|
227 </collection> |
|
8
a923b799c77c
Version 0.36.3: fix the naming of output collections to differentiate btwn paired/unpaired; document the _JAVA_OPTIONS env var (thanks Marius van den Beek).
pjbriggs
parents:
7
diff
changeset
|
228 <collection name="fastq_out_unpaired" type="paired" label="${tool.name} on ${on_string}: unpaired"> |
| 7 | 229 <filter>readtype['single_or_paired'] == "collection"</filter> |
| 230 <data name="forward" label="${tool.name} on ${readtype.fastq_pair.forward.name} (R1 unpaired)" format_source="fastq_pair['forward']"/> | |
| 231 <data name="reverse" label="${tool.name} on ${readtype.fastq_pair.reverse.name} (R2 unpaired)" format_source="fastq_pair['reverse']"/> | |
|
3
a7139c612c45
Updated to version 0.32.3: add support for FASTQ pairs (dataset collections)
pjbriggs
parents:
2
diff
changeset
|
232 </collection> |
| 12 | 233 <data name="log_file" format="txt" label="${tool.name} on ${on_string} (trimlog file)" from_work_dir="trimlog"> |
| 234 <filter>output_logs</filter> | |
| 235 </data> | |
| 236 <data name="err_file" format="txt" label="${tool.name} on ${on_string} (log file)" from_work_dir="trimmomatic.log"> | |
| 237 <filter>output_err</filter> | |
| 238 </data> | |
| 1 | 239 </outputs> |
| 240 <tests> | |
| 241 <test> | |
| 242 <!-- Single-end example --> | |
| 12 | 243 <conditional name="readtype"> |
| 244 <param name="single_or_paired" value="se" /> | |
| 245 <param name="fastq_in" value="Illumina_SG_R1.fastq" ftype="fastqsanger" /> | |
| 246 </conditional> | |
| 1 | 247 <param name="operations_0|operation|name" value="SLIDINGWINDOW" /> |
| 12 | 248 <param name="output_logs" value="yes" /> |
| 249 <param name="output_err" value="yes" /> | |
| 1 | 250 <output name="fastq_out" file="trimmomatic_se_out1.fastq" /> |
| 12 | 251 <output name="log_file" file="trimmomatic_se_out1.log" /> |
| 252 <output name="err_file" file="trimmomatic_se_out1.err" /> | |
| 1 | 253 </test> |
| 254 <test> | |
| 7 | 255 <!-- Single-end example - gzipped --> |
| 256 <param name="single_or_paired" value="se" /> | |
| 257 <param name="fastq_in" value="Illumina_SG_R1.fastq.gz" ftype="fastqsanger.gz" /> | |
| 258 <param name="operations_0|operation|name" value="SLIDINGWINDOW" /> | |
| 259 <output name="fastq_out" file="trimmomatic_se_out1.fastq.gz" /> | |
| 260 </test> | |
| 261 <test> | |
| 262 <!-- Paired-end example - gzipped --> | |
| 263 <param name="single_or_paired" value="pair_of_files" /> | |
| 264 <param name="fastq_r1_in" value="Illumina_SG_R1.fastq.gz" ftype="fastqsanger.gz" /> | |
| 265 <param name="fastq_r2_in" value="Illumina_SG_R2.fastq.gz" ftype="fastqsanger.gz" /> | |
| 266 <param name="operations_0|operation|name" value="SLIDINGWINDOW" /> | |
| 267 <output name="fastq_out_r1_paired" file="trimmomatic_pe_r1_paired_out1.fastq.gz" /> | |
| 268 <output name="fastq_out_r1_unpaired" file="trimmomatic_pe_r1_unpaired_out1.fastq.gz" /> | |
| 269 <output name="fastq_out_r2_paired" file="trimmomatic_pe_r2_paired_out1.fastq.gz" /> | |
| 270 <output name="fastq_out_r2_unpaired" file="trimmomatic_pe_r2_unpaired_out1.fastq.gz" /> | |
| 271 </test> | |
| 272 <test> | |
| 1 | 273 <!-- Paired-end example --> |
| 7 | 274 <param name="single_or_paired" value="pair_of_files" /> |
| 1 | 275 <param name="fastq_r1_in" value="Illumina_SG_R1.fastq" ftype="fastqsanger" /> |
| 276 <param name="fastq_r2_in" value="Illumina_SG_R2.fastq" ftype="fastqsanger" /> | |
| 277 <param name="operations_0|operation|name" value="SLIDINGWINDOW" /> | |
| 278 <output name="fastq_out_r1_paired" file="trimmomatic_pe_r1_paired_out1.fastq" /> | |
| 279 <output name="fastq_out_r1_unpaired" file="trimmomatic_pe_r1_unpaired_out1.fastq" /> | |
| 280 <output name="fastq_out_r2_paired" file="trimmomatic_pe_r2_paired_out1.fastq" /> | |
| 281 <output name="fastq_out_r2_unpaired" file="trimmomatic_pe_r2_unpaired_out1.fastq" /> | |
| 282 </test> | |
| 283 <test> | |
| 12 | 284 <!-- Paired-end Illumina 1.3-1.7 quality encoding --> |
| 285 <param name="single_or_paired" value="pair_of_files" /> | |
| 286 <param name="fastq_r1_in" value="Illumina_SG_R1.fastqillumina" ftype="fastqillumina" /> | |
| 287 <param name="fastq_r2_in" value="Illumina_SG_R2.fastqillumina" ftype="fastqillumina" /> | |
| 288 <param name="operations_0|operation|name" value="SLIDINGWINDOW" /> | |
| 289 <output name="fastq_out_r1_paired" file="trimmomatic_pe_r1_paired_out1.fastqillumina" /> | |
| 290 <output name="fastq_out_r1_unpaired" file="trimmomatic_pe_r1_unpaired_out1.fastqillumina" /> | |
| 291 <output name="fastq_out_r2_paired" file="trimmomatic_pe_r2_paired_out1.fastqillumina" /> | |
| 292 <output name="fastq_out_r2_unpaired" file="trimmomatic_pe_r2_unpaired_out1.fastqillumina" /> | |
| 293 </test> | |
| 294 <test> | |
| 295 <!-- Paired-end Solexa quality encoding --> | |
| 296 <param name="single_or_paired" value="pair_of_files" /> | |
| 297 <param name="fastq_r1_in" value="Illumina_SG_R1.fastqsolexa" ftype="fastqsolexa" /> | |
| 298 <param name="fastq_r2_in" value="Illumina_SG_R2.fastqsolexa" ftype="fastqsolexa" /> | |
| 299 <param name="operations_0|operation|name" value="SLIDINGWINDOW" /> | |
| 300 <output name="fastq_out_r1_paired" file="trimmomatic_pe_r1_paired_out1.fastqsolexa" /> | |
| 301 <output name="fastq_out_r1_unpaired" file="trimmomatic_pe_r1_unpaired_out1.fastqsolexa" /> | |
| 302 <output name="fastq_out_r2_paired" file="trimmomatic_pe_r2_paired_out1.fastqsolexa" /> | |
| 303 <output name="fastq_out_r2_unpaired" file="trimmomatic_pe_r2_unpaired_out1.fastqsolexa" /> | |
| 304 </test> | |
| 305 <test> | |
| 1 | 306 <!-- Single-end example (cropping) --> |
| 7 | 307 <param name="single_or_paired" value="se" /> |
| 1 | 308 <param name="fastq_in" value="Illumina_SG_R1.fastq" ftype="fastqsanger" /> |
| 309 <param name="operations_0|operation|name" value="CROP" /> | |
| 310 <param name="operations_0|operation|crop" value="10" /> | |
| 311 <output name="fastq_out" file="trimmomatic_se_out2.fastq" /> | |
| 312 </test> | |
|
3
a7139c612c45
Updated to version 0.32.3: add support for FASTQ pairs (dataset collections)
pjbriggs
parents:
2
diff
changeset
|
313 <test> |
|
a7139c612c45
Updated to version 0.32.3: add support for FASTQ pairs (dataset collections)
pjbriggs
parents:
2
diff
changeset
|
314 <!-- Paired-end with dataset collection --> |
| 7 | 315 <param name="single_or_paired" value="collection" /> |
|
3
a7139c612c45
Updated to version 0.32.3: add support for FASTQ pairs (dataset collections)
pjbriggs
parents:
2
diff
changeset
|
316 <param name="fastq_pair"> |
|
a7139c612c45
Updated to version 0.32.3: add support for FASTQ pairs (dataset collections)
pjbriggs
parents:
2
diff
changeset
|
317 <collection type="paired"> |
|
a7139c612c45
Updated to version 0.32.3: add support for FASTQ pairs (dataset collections)
pjbriggs
parents:
2
diff
changeset
|
318 <element name="forward" value="Illumina_SG_R1.fastq" ftype="fastqsanger" /> |
|
a7139c612c45
Updated to version 0.32.3: add support for FASTQ pairs (dataset collections)
pjbriggs
parents:
2
diff
changeset
|
319 <element name="reverse" value="Illumina_SG_R2.fastq" ftype="fastqsanger"/> |
|
a7139c612c45
Updated to version 0.32.3: add support for FASTQ pairs (dataset collections)
pjbriggs
parents:
2
diff
changeset
|
320 </collection> |
|
a7139c612c45
Updated to version 0.32.3: add support for FASTQ pairs (dataset collections)
pjbriggs
parents:
2
diff
changeset
|
321 </param> |
|
a7139c612c45
Updated to version 0.32.3: add support for FASTQ pairs (dataset collections)
pjbriggs
parents:
2
diff
changeset
|
322 <param name="operations_0|operation|name" value="SLIDINGWINDOW" /> |
|
a7139c612c45
Updated to version 0.32.3: add support for FASTQ pairs (dataset collections)
pjbriggs
parents:
2
diff
changeset
|
323 <output_collection name="fastq_out_paired" type="paired"> |
| 7 | 324 <element name="forward" file="trimmomatic_pe_r1_paired_out1.fastq" /> |
| 325 <element name="reverse" file="trimmomatic_pe_r2_paired_out1.fastq" /> | |
|
3
a7139c612c45
Updated to version 0.32.3: add support for FASTQ pairs (dataset collections)
pjbriggs
parents:
2
diff
changeset
|
326 </output_collection> |
|
a7139c612c45
Updated to version 0.32.3: add support for FASTQ pairs (dataset collections)
pjbriggs
parents:
2
diff
changeset
|
327 <output_collection name="fastq_out_unpaired" type="paired"> |
| 7 | 328 <element name="forward" file="trimmomatic_pe_r1_unpaired_out1.fastq" /> |
| 329 <element name="reverse" file="trimmomatic_pe_r2_unpaired_out1.fastq" /> | |
| 330 </output_collection> | |
| 331 </test> | |
| 332 <test> | |
| 333 <!-- Paired-end with dataset collection - gzipped --> | |
| 334 <param name="single_or_paired" value="collection" /> | |
| 335 <param name="fastq_pair"> | |
| 336 <collection type="paired"> | |
| 337 <element name="forward" value="Illumina_SG_R1.fastq.gz" ftype="fastqsanger.gz" /> | |
| 338 <element name="reverse" value="Illumina_SG_R2.fastq.gz" ftype="fastqsanger.gz"/> | |
| 339 </collection> | |
| 340 </param> | |
| 341 <param name="operations_0|operation|name" value="SLIDINGWINDOW" /> | |
| 342 <output_collection name="fastq_out_paired" type="paired"> | |
| 343 <element name="forward" file="trimmomatic_pe_r1_paired_out1.fastq.gz" /> | |
| 344 <element name="reverse" file="trimmomatic_pe_r2_paired_out1.fastq.gz" /> | |
| 345 </output_collection> | |
| 346 <output_collection name="fastq_out_unpaired" type="paired"> | |
| 347 <element name="forward" file="trimmomatic_pe_r1_unpaired_out1.fastq.gz" /> | |
| 348 <element name="reverse" file="trimmomatic_pe_r2_unpaired_out1.fastq.gz" /> | |
|
3
a7139c612c45
Updated to version 0.32.3: add support for FASTQ pairs (dataset collections)
pjbriggs
parents:
2
diff
changeset
|
349 </output_collection> |
|
a7139c612c45
Updated to version 0.32.3: add support for FASTQ pairs (dataset collections)
pjbriggs
parents:
2
diff
changeset
|
350 </test> |
| 4 | 351 <test> |
| 352 <!-- Single-end using AVGQUAL --> | |
| 7 | 353 <param name="single_or_paired" value="se" /> |
| 4 | 354 <param name="fastq_in" value="Illumina_SG_R1.fastq" ftype="fastqsanger" /> |
| 355 <param name="operations_0|operation|name" value="AVGQUAL" /> | |
| 356 <param name="operations_0|operation|avgqual" value="30" /> | |
| 357 <output name="fastq_out" file="trimmomatic_avgqual.fastq" /> | |
| 358 </test> | |
| 359 <test> | |
| 360 <!-- Single-end using MAXINFO --> | |
| 7 | 361 <param name="single_or_paired" value="se" /> |
| 4 | 362 <param name="fastq_in" value="Illumina_SG_R1.fastq" ftype="fastqsanger" /> |
| 363 <param name="operations_0|operation|name" value="MAXINFO" /> | |
| 364 <param name="operations_0|operation|target_length" value="75" /> | |
| 365 <param name="operations_0|operation|strictness" value="0.8" /> | |
| 366 <output name="fastq_out" file="trimmomatic_maxinfo.fastq" /> | |
| 367 </test> | |
| 9 | 368 <test> |
| 369 <!-- Paired-end ILLUMINACLIP - this does not check valid clipping --> | |
| 370 <param name="single_or_paired" value="pair_of_files" /> | |
| 371 <param name="fastq_r1_in" value="Illumina_SG_R1.fastq" ftype="fastqsanger" /> | |
| 372 <param name="fastq_r2_in" value="Illumina_SG_R2.fastq" ftype="fastqsanger" /> | |
| 373 <param name="do_illuminaclip" value="true"/> | |
| 374 <param name="adapter_fasta" value="TruSeq2-PE.fa"/> | |
| 375 <param name="operations_0|operation|name" value="SLIDINGWINDOW" /> | |
| 376 <output name="fastq_out_r1_paired" file="trimmomatic_pe_r1_paired_out1_clip.fastq" /> | |
| 377 <output name="fastq_out_r1_unpaired" file="trimmomatic_pe_r1_unpaired_out1.fastq" /> | |
| 378 <output name="fastq_out_r2_paired" file="trimmomatic_pe_r2_paired_out1.fastq" /> | |
| 379 <output name="fastq_out_r2_unpaired" file="trimmomatic_pe_r2_unpaired_out1_clip.fastq" /> | |
| 380 </test> | |
| 381 <test> | |
| 382 <!-- Paired-end ILLUMINACLIP providing 'custom' adapters - this does not check valid clipping --> | |
| 383 <param name="single_or_paired" value="pair_of_files" /> | |
| 384 <param name="fastq_r1_in" value="Illumina_SG_R1.fastq" ftype="fastqsanger" /> | |
| 385 <param name="fastq_r2_in" value="Illumina_SG_R2.fastq" ftype="fastqsanger" /> | |
| 386 <param name="do_illuminaclip" value="true"/> | |
| 387 <param name="standard_or_custom" value="custom"/> | |
| 388 <param name="adapter_text" | |
| 389 value=">PrefixPE/1 AATGATACGGCGACCACCGAGATCTACACTCTTTCCCTACACGACGCTCTTCCGATCT >PrefixPE/2 CAAGCAGAAGACGGCATACGAGATCGGTCTCGGCATTCCTGCTGAACCGCTCTTCCGATCT >PCR_Primer1 AATGATACGGCGACCACCGAGATCTACACTCTTTCCCTACACGACGCTCTTCCGATCT >PCR_Primer1_rc AGATCGGAAGAGCGTCGTGTAGGGAAAGAGTGTAGATCTCGGTGGTCGCCGTATCATT >PCR_Primer2 CAAGCAGAAGACGGCATACGAGATCGGTCTCGGCATTCCTGCTGAACCGCTCTTCCGATCT >PCR_Primer2_rc AGATCGGAAGAGCGGTTCAGCAGGAATGCCGAGACCGATCTCGTATGCCGTCTTCTGCTTG >FlowCell1 TTTTTTTTTTAATGATACGGCGACCACCGAGATCTACAC >FlowCell2 TTTTTTTTTTCAAGCAGAAGACGGCATACGA "/> | |
| 390 <param name="adapter_fasta" value="TruSeq2-PE.fa"/> | |
| 391 <param name="operations_0|operation|name" value="SLIDINGWINDOW" /> | |
| 392 <output name="fastq_out_r1_paired" file="trimmomatic_pe_r1_paired_out1_clip.fastq" /> | |
| 393 <output name="fastq_out_r1_unpaired" file="trimmomatic_pe_r1_unpaired_out1.fastq" /> | |
| 394 <output name="fastq_out_r2_paired" file="trimmomatic_pe_r2_paired_out1.fastq" /> | |
| 395 <output name="fastq_out_r2_unpaired" file="trimmomatic_pe_r2_unpaired_out1_clip.fastq" /> | |
| 396 </test> | |
| 1 | 397 </tests> |
|
3
a7139c612c45
Updated to version 0.32.3: add support for FASTQ pairs (dataset collections)
pjbriggs
parents:
2
diff
changeset
|
398 <help><![CDATA[ |
| 1 | 399 .. class:: infomark |
| 400 | |
| 401 **What it does** | |
| 402 | |
| 403 Trimmomatic performs a variety of useful trimming tasks for Illumina paired-end and | |
| 404 single-end data. | |
| 405 | |
| 406 This tool allows the following trimming steps to be performed: | |
| 407 | |
| 408 * **ILLUMINACLIP:** Cut adapter and other illumina-specific sequences from the read | |
| 9 | 409 |
| 410 * If **Always keep both reads (PE specific/palindrome mode)** is True, the reverse read will also be retained in palindrome mode. | |
| 411 After read-through has been detected by palindrome mode, and the adapter sequence removed, | |
| 412 the reverse read contains the same sequence information as the forward read, albeit in reverse complement. | |
| 413 For this reason, Trimmomatic's own default behaviour is to entirely drop the reverse read (note that this tool keeps both reads by default). | |
| 414 Retaining the reverse read may be useful e.g. if the downstream tools cannot handle a combination of paired and unpaired reads. | |
| 1 | 415 * **SLIDINGWINDOW:** Perform a sliding window trimming, cutting once the average |
| 416 quality within the window falls below a threshold | |
| 417 * **MINLEN:** Drop the read if it is below a specified length | |
| 418 * **LEADING:** Cut bases off the start of a read, if below a threshold quality | |
| 419 * **TRAILING:** Cut bases off the end of a read, if below a threshold quality | |
| 420 * **CROP:** Cut the read to a specified length | |
| 421 * **HEADCROP:** Cut the specified number of bases from the start of the read | |
| 4 | 422 * **AVGQUAL:** Drop the read if the average quality is below a specified value |
| 7 | 423 * **MAXINFO:** Trim reads adaptively, balancing read length and error rate to |
| 4 | 424 maximise the value of each read |
| 1 | 425 |
| 426 If ILLUMINACLIP is requested then it is always performed first; subsequent options | |
| 427 can be mixed and matched and will be performed in the order that they have been | |
| 428 specified. | |
| 429 | |
| 430 .. class:: warningmark | |
| 431 | |
| 432 Note that trimming operation order is important. | |
| 433 | |
| 434 ------------- | |
| 435 | |
| 436 .. class:: infomark | |
| 437 | |
|
3
a7139c612c45
Updated to version 0.32.3: add support for FASTQ pairs (dataset collections)
pjbriggs
parents:
2
diff
changeset
|
438 **Inputs** |
|
a7139c612c45
Updated to version 0.32.3: add support for FASTQ pairs (dataset collections)
pjbriggs
parents:
2
diff
changeset
|
439 |
|
a7139c612c45
Updated to version 0.32.3: add support for FASTQ pairs (dataset collections)
pjbriggs
parents:
2
diff
changeset
|
440 For single-end data this Trimmomatic tool accepts a single FASTQ file; for |
|
a7139c612c45
Updated to version 0.32.3: add support for FASTQ pairs (dataset collections)
pjbriggs
parents:
2
diff
changeset
|
441 paired-end data it will accept either two FASTQ files (R1 and R2), or a |
|
a7139c612c45
Updated to version 0.32.3: add support for FASTQ pairs (dataset collections)
pjbriggs
parents:
2
diff
changeset
|
442 dataset collection containing the R1/R2 FASTQ pair. |
|
a7139c612c45
Updated to version 0.32.3: add support for FASTQ pairs (dataset collections)
pjbriggs
parents:
2
diff
changeset
|
443 |
|
a7139c612c45
Updated to version 0.32.3: add support for FASTQ pairs (dataset collections)
pjbriggs
parents:
2
diff
changeset
|
444 .. class:: infomark |
|
a7139c612c45
Updated to version 0.32.3: add support for FASTQ pairs (dataset collections)
pjbriggs
parents:
2
diff
changeset
|
445 |
| 1 | 446 **Outputs** |
| 447 | |
| 448 For paired-end data a particular strength of Trimmomatic is that it retains the | |
| 449 pairing of reads (from R1 and R2) in the filtered output files: | |
| 450 | |
| 451 * Two FASTQ files (R1-paired and R2-paired) contain one read from each pair where | |
| 452 both have survived filtering. | |
| 453 * Additionally two FASTQ files (R1-unpaired and R2-unpaired) contain reads where | |
| 454 one of the pair failed the filtering steps. | |
| 455 | |
|
3
a7139c612c45
Updated to version 0.32.3: add support for FASTQ pairs (dataset collections)
pjbriggs
parents:
2
diff
changeset
|
456 .. class:: warningmark |
|
a7139c612c45
Updated to version 0.32.3: add support for FASTQ pairs (dataset collections)
pjbriggs
parents:
2
diff
changeset
|
457 |
|
a7139c612c45
Updated to version 0.32.3: add support for FASTQ pairs (dataset collections)
pjbriggs
parents:
2
diff
changeset
|
458 If the input consists of a dataset collection with the R1/R2 FASTQ pair then |
|
a7139c612c45
Updated to version 0.32.3: add support for FASTQ pairs (dataset collections)
pjbriggs
parents:
2
diff
changeset
|
459 the outputs will also include two dataset collections: one for the 'paired' |
|
a7139c612c45
Updated to version 0.32.3: add support for FASTQ pairs (dataset collections)
pjbriggs
parents:
2
diff
changeset
|
460 outputs and one for the 'unpaired' (as described above). |
|
a7139c612c45
Updated to version 0.32.3: add support for FASTQ pairs (dataset collections)
pjbriggs
parents:
2
diff
changeset
|
461 |
| 1 | 462 Retaining the same order and number of reads in the filtered output fastq files is |
| 463 essential for many downstream analysis tools. | |
| 464 | |
| 465 For single-end data the output is a single FASTQ file containing just the filtered | |
| 466 reads. | |
| 467 | |
| 468 ------------- | |
| 469 | |
| 470 .. class:: infomark | |
| 471 | |
| 472 **Credits** | |
| 473 | |
| 474 This Galaxy tool has been developed within the Bioinformatics Core Facility at the | |
| 9 | 475 University of Manchester, with contributions from Peter van Heusden, Marius |
| 12 | 476 van den Beek, Jelle Scholtalbers, Charles Girardot, and Matthias Bernt. |
| 7 | 477 |
| 478 It runs the Trimmomatic program which has been developed | |
| 1 | 479 within Bjorn Usadel's group at RWTH Aachen University. |
| 480 | |
| 481 Trimmomatic website (including documentation): | |
| 482 | |
| 7 | 483 * http://www.usadellab.org/cms/index.php?page=trimmomatic |
| 1 | 484 |
| 485 The reference for Trimmomatic is: | |
| 486 | |
| 487 * Bolger, A.M., Lohse, M., & Usadel, B. (2014). Trimmomatic: A flexible trimmer | |
| 488 for Illumina Sequence Data. Bioinformatics, btu170. | |
| 489 | |
| 490 Please kindly acknowledge both this Galaxy tool and the Trimmomatic program if you | |
| 491 use it. | |
|
3
a7139c612c45
Updated to version 0.32.3: add support for FASTQ pairs (dataset collections)
pjbriggs
parents:
2
diff
changeset
|
492 ]]></help> |
| 1 | 493 <citations> |
| 494 <!-- | |
| 495 See https://wiki.galaxyproject.org/Admin/Tools/ToolConfigSyntax#A.3Ccitations.3E_tag_set | |
| 496 Can be either DOI or Bibtex | |
| 497 Use http://www.bioinformatics.org/texmed/ to convert PubMed to Bibtex | |
| 498 --> | |
| 499 <citation type="doi">10.1093/bioinformatics/btu170</citation> | |
| 500 </citations> | |
| 501 </tool> |
