comparison split_libraries_fastq.xml @ 0:c1bd0c560018 draft default tip

planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/qiime commit bcbe76277f3e60303faf826f8ce7f018bc663a9a-dirty
author bebatut
date Tue, 02 Feb 2016 05:50:37 -0500
parents
children
comparison
equal deleted inserted replaced
-1:000000000000 0:c1bd0c560018
1 <tool id="split_libraries_fastq" name="Split fastq libraries" version="1.9.1">
2 <description>to performs demultiplexing of Fastq sequence data</description>
3
4 <macros>
5 <import>macros.xml</import>
6 </macros>
7
8 <expand macro="requirements" />
9
10 <version_command><![CDATA[
11 split_libraries_fastq.py --version
12 ]]>
13 </version_command>
14
15 <command><![CDATA[
16 split_libraries_fastq.py
17
18 #set $seq_files = ''
19 #set $sep = ''
20 #for $file in $input_fastq_files
21 #set $seq_files += $sep + str($file)
22 #set $sep = ','
23 #end for
24 -i $seq_files
25
26 -o split_libraries
27
28 #set $mapping_files = ''
29 #set $sep = ''
30 #for $file in $input_mapping_files
31 #set $mapping_files += $sep + str($file)
32 #set $sep = ','
33 #end for
34 -m $mapping_files
35
36 #set $barcode_files = ''
37 #set $sep = ''
38 #for $file in $input_files_barcode_read_fps
39 #set $barcode_files += $sep + str($file)
40 #set $sep = ','
41 #end for
42 -b $barcode_files
43
44 $store_qual_scores
45
46 #if str($sample_ids):
47 --sample_ids $sample_ids
48 #end if
49
50 $store_demultiplexed_fastq
51 $retain_unassigned_reads
52 -r $max_bad_run_length
53 -p $min_per_read_length_fraction
54 -n $sequence_max_n
55 -s $start_seq_id
56
57 $rev_comp_barcode
58 $rev_comp_mapping_barcodes
59 $rev_comp
60
61 -q $phred_quality_threshold
62
63 #if str( $barcode_type.barcode_selector ) != "custom_length"
64 --barcode_type $barcode_type.barcode_selector
65 #else
66 --barcode_type $barcode_type.barcode_length
67 #end if
68
69 --max_barcode_errors $max_barcode_errors
70
71 $phred_offset
72 ]]>
73 </command>
74
75 <inputs>
76 <param name="input_fastq_files" type="data"
77 format="fastq,fastqsanger,fastqsolexa"
78 label="Input fastq files" multiple="True" help="(-i/--sequence_read_fps)"/>
79
80 <param name="input_mapping_files" type="data"
81 format="txt,tabular,tsv,csv" label="Metadata mapping files (optional)"
82 multiple="True" optional="True" help="(-m/--mapping_fps)"/>
83
84 <param name="input_files_barcode_read_fps" type="data"
85 format="fastq,fastqsanger,fastqsolexa" label="Barcode read files (optional)"
86 multiple="True" optional="True" help="(-b/--barcode_read_fps)"/>
87
88 <param name="store_qual_scores" type="boolean" label="Store quality strings
89 in files?" truevalue="--store_qual_scores" falsevalue="" checked="False"
90 help="(--store_qual_scores)" />
91
92 <param name="sample_ids" type="text" label="Comma-separated list of samples
93 ids to be applied to all sequences (optional)" optional="True"
94 help="It must be one per input file path (used when data is not
95 multiplexed, --sample_ids)"/>
96
97 <param name="store_demultiplexed_fastq" type="boolean" label="Write
98 demultiplexed fastq files?" truevalue="--store_demultiplexed_fastq"
99 falsevalue="" checked="False" help="(--store_demultiplexed_fastq)" />
100
101 <param name="retain_unassigned_reads" type="boolean" label="Retain
102 sequences which don’t map to a barcode in the mapping file?"
103 truevalue="--retain_unassigned_reads" falsevalue="" checked="False"
104 help="Sample ID will be 'Unassigned' (--retain_unassigned_reads)" />
105
106 <param name="max_bad_run_length" type="integer" value="3"
107 label="Maximum number of consecutive low quality base calls allowed
108 before truncating a read" help="(-r/--max_bad_run_length)" />
109
110 <param name="min_per_read_length_fraction" type="float" value="0.75"
111 label="Minimum number of consecutive high quality base calls to
112 include a read (per single end read) as a fraction of the input read
113 length" help="(-p/--min_per_read_length_fraction)" />
114
115 <param name="sequence_max_n" type="integer" value="0"
116 label="Maximum number of N characters allowed in a sequence to retain
117 it" help="This is applied after quality trimming, and is total over
118 combined paired end reads if applicable (-n/--sequence_max_n)" />
119
120 <param name="start_seq_id" type="integer" value="0"
121 label="Start seq_ids as ascending integers beginning with start_seq_id"
122 help="(-s/--start_seq_id)" />
123
124 <param name="rev_comp_barcode" type="boolean" label="Reverse complement
125 barcode reads before lookup?" truevalue="--rev_comp_barcode"
126 falsevalue="" checked="False" help="(--rev_comp_barcode)" />
127
128 <param name="rev_comp_mapping_barcodes" type="boolean" label="Reverse
129 complement barcode in mapping before lookup?"
130 truevalue="--rev_comp_mapping_barcodes" falsevalue="" checked="False"
131 help="It is useful if barcodes in mapping file are reverse
132 complements of golay codes (--rev_comp_mapping_barcodes)" />
133
134 <param name="rev_comp" type="boolean" label="Reverse omplement sequence
135 before writing to output file?" truevalue="--rev_comp" falsevalue=""
136 checked="False" help="(--rev_comp)" />
137
138 <param name="phred_quality_threshold" type="integer" value="3"
139 label="Maximum unacceptable Phred quality score" help="E.g., for
140 Q20 and better, 19 must be specified (-q/--phred_quality_threshold)" />
141
142 <conditional name="barcode_type">
143 <param name="barcode_selector" type="select" label="Type of barcode"
144 help="(--barcode_type)">
145 <option value="hamming_8">hamming_8</option>
146 <option value="golay_12" selected="true">golay_12</option>
147 <option value="variable_length">variable_length (disable any barcode correction)</option>
148 <option value="custom_length">Custom length</option>
149 <option value="not-barcoded">Data not barcoded</option>
150 </param>
151 <when value="hamming_8" />
152 <when value="golay_12" />
153 <when value="variable_length" />
154 <when value="custom_length">
155 <param name="barcode_length" type="integer" value="4"
156 label="Barcode length"/>
157 </when>
158 <when value="not-barcoded" />
159 </conditional>
160
161 <param name="max_barcode_errors" type="float" value="1.5"
162 label="Maximum number of errors in barcode"
163 help="(--max_barcode_errors)" />
164
165 <param name="phred_offset" type="select" label="Ascii offset to use when
166 decoding phred scores" help="(--phred_offset)">
167 <option value="--phred_offset 33">33</option>
168 <option value="--phred_offset 64">64</option>
169 <option value="" selected="true">Automatically determined</option>
170 </param>
171 </inputs>
172
173 <outputs>
174 <data name="log" format="txt"
175 from_work_dir="split_libraries/split_library_log.txt"
176 label="${tool.name} on ${on_string}: log"/>
177 <data name="histograms" format="tabular"
178 from_work_dir="split_libraries/histograms.txt"
179 label="${tool.name} on ${on_string}: histograms"/>
180 <data name="seqs" format="fasta"
181 from_work_dir="split_libraries/seqs.fna"
182 label="${tool.name} on ${on_string}: sequences"/>
183 <data name="seqs_qual" format="qual"
184 from_work_dir="split_libraries/seqs.qual"
185 label="${tool.name} on ${on_string}: sequence qualities">
186 <filter>store_qual_scores is True</filter>
187 </data>
188 <data name="seqs_fastq" format="fastq"
189 from_work_dir="split_libraries/seqs.fastq"
190 label="${tool.name} on ${on_string}: demultiplexed sequences (fastq)">
191 <filter>store_demultiplexed_fastq is True</filter>
192 </data>
193 </outputs>
194
195 <tests>
196 <test>
197 <param name="input_fastq_files" value="forward_reads.fastq"/>
198 <param name="input_mapping_files" value="map.tsv"/>
199 <param name="input_files_barcode_read_fps" value="barcodes.fastq"/>
200 <param name="store_qual_scores" value="--store_qual_scores" />
201 <param name="store_demultiplexed_fastq" value="--store_demultiplexed_fastq" />
202 <param name="retain_unassigned_reads" value=""/>
203 <param name="max_bad_run_length" value="3"/>
204 <param name="min_per_read_length_fraction" value="0.75"/>
205 <param name="sequence_max_n" value="0"/>
206 <param name="start_seq_id" value="0" />
207 <param name="rev_comp_barcode" value="" />
208 <param name="rev_comp_mapping_barcodes" value="" />
209 <param name="rev_comp" value="" />
210 <param name="start_seq_id" value="3"/>
211 <param name="barcode_selector" value="golay_12"/>
212 <param name="max_barcode_errors" value="1.5"/>
213 <param name="phred_offset" value="" />
214
215 <output name="log" file="split_fastq_libraries_log.txt"/>
216 <output name="seqs" file="split_fastq_libraries_sequences.fasta"/>
217 <output name="histograms" file="split_fastq_libraries_histograms.tabular"/>
218 <output name="histograms" file="split_fastq_libraries_histograms.tabular"/>
219 <output name="seqs_qual" file="split_fastq_libraries_sequence_qualities.qual"/>
220 <output name="seqs_fastq" file="split_fastq_libraries_demultiplexed_sequences.fastq"/>
221 </test>
222 </tests>
223
224 <help><![CDATA[
225
226 **What it does**
227
228 This tool performs demultiplexing of Fastq sequence data where barcodes and sequences are contained in two separate fastq files (common on Illumina runs).
229
230 More information about this tool is available on
231 `QIIME documentation <http://qiime.org/scripts/split_libraries_fastq.html>`_.
232 ]]>
233 </help>
234
235 <citations>
236 <expand macro="citations" />
237 </citations>
238
239 </tool>